diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,35095 +1,2635 @@ { - "best_metric": 0.5390881299972534, - "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1/checkpoint-26542", - "epoch": 49.999566912083154, - "global_step": 57700, + "best_metric": 0.5352242588996887, + "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1/checkpoint-1152", + "epoch": 49.996539792387544, + "global_step": 3600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { - "epoch": 0.01, - "learning_rate": 7.2e-08, - "loss": 0.4498, + "epoch": 0.14, + "learning_rate": 4e-07, + "loss": 0.3794, "step": 10 }, { - "epoch": 0.02, - "learning_rate": 1.5199999999999998e-07, - "loss": 0.389, + "epoch": 0.28, + "learning_rate": 8e-07, + "loss": 0.4002, "step": 20 }, { - "epoch": 0.03, - "learning_rate": 2.24e-07, - "loss": 0.4604, + "epoch": 0.42, + "learning_rate": 1.2e-06, + "loss": 0.37, "step": 30 }, { - "epoch": 0.03, - "learning_rate": 3.0399999999999997e-07, - "loss": 0.369, + "epoch": 0.55, + "learning_rate": 1.6e-06, + "loss": 0.3778, "step": 40 }, { - "epoch": 0.04, - "learning_rate": 3.84e-07, - "loss": 0.4513, + "epoch": 0.69, + "learning_rate": 2e-06, + "loss": 0.3623, "step": 50 }, { - "epoch": 0.05, - "learning_rate": 4.64e-07, - "loss": 0.4209, + "epoch": 0.83, + "learning_rate": 1.9943661971830985e-06, + "loss": 0.3546, "step": 60 }, { - "epoch": 0.06, - "learning_rate": 5.44e-07, - "loss": 0.4298, + "epoch": 0.97, + "learning_rate": 1.988732394366197e-06, + "loss": 0.3818, "step": 70 }, { - "epoch": 0.07, - "learning_rate": 6.24e-07, - "loss": 0.4385, + "epoch": 1.0, + "eval_loss": 0.55694180727005, + "eval_runtime": 126.5731, + "eval_samples_per_second": 4.203, + "eval_steps_per_second": 0.529, + "eval_wer": 0.25345503631805616, + "step": 72 + }, + { + "epoch": 1.11, + "learning_rate": 1.9830985915492956e-06, + "loss": 0.3717, "step": 80 }, { - "epoch": 0.08, - "learning_rate": 7.04e-07, - "loss": 0.4532, + "epoch": 1.25, + "learning_rate": 1.977464788732394e-06, + "loss": 0.3721, "step": 90 }, { - "epoch": 0.09, - "learning_rate": 7.84e-07, - "loss": 0.4732, + "epoch": 1.39, + "learning_rate": 1.971830985915493e-06, + "loss": 0.3563, "step": 100 }, { - "epoch": 0.1, - "learning_rate": 8.639999999999999e-07, - "loss": 0.4583, + "epoch": 1.53, + "learning_rate": 1.9661971830985916e-06, + "loss": 0.3679, "step": 110 }, { - "epoch": 0.1, - "learning_rate": 9.439999999999999e-07, - "loss": 0.403, + "epoch": 1.66, + "learning_rate": 1.96056338028169e-06, + "loss": 0.3668, "step": 120 }, { - "epoch": 0.11, - "learning_rate": 1.024e-06, - "loss": 0.3758, + "epoch": 1.8, + "learning_rate": 1.9549295774647887e-06, + "loss": 0.3909, "step": 130 }, { - "epoch": 0.12, - "learning_rate": 1.1040000000000001e-06, - "loss": 0.417, + "epoch": 1.94, + "learning_rate": 1.9492957746478873e-06, + "loss": 0.3686, "step": 140 }, { - "epoch": 0.13, - "learning_rate": 1.1839999999999998e-06, - "loss": 0.4178, + "epoch": 2.0, + "eval_loss": 0.5535001754760742, + "eval_runtime": 126.7334, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.25011248955454135, + "step": 144 + }, + { + "epoch": 2.08, + "learning_rate": 1.943661971830986e-06, + "loss": 0.3804, "step": 150 }, { - "epoch": 0.14, - "learning_rate": 1.2639999999999999e-06, - "loss": 0.4161, + "epoch": 2.22, + "learning_rate": 1.9380281690140844e-06, + "loss": 0.3713, "step": 160 }, { - "epoch": 0.15, - "learning_rate": 1.344e-06, - "loss": 0.3947, + "epoch": 2.36, + "learning_rate": 1.932394366197183e-06, + "loss": 0.3722, "step": 170 }, { - "epoch": 0.16, - "learning_rate": 1.4239999999999998e-06, - "loss": 0.4235, + "epoch": 2.5, + "learning_rate": 1.926760563380282e-06, + "loss": 0.3636, "step": 180 }, { - "epoch": 0.16, - "learning_rate": 1.504e-06, - "loss": 0.4218, + "epoch": 2.64, + "learning_rate": 1.9211267605633805e-06, + "loss": 0.3554, "step": 190 }, { - "epoch": 0.17, - "learning_rate": 1.576e-06, - "loss": 0.5228, + "epoch": 2.78, + "learning_rate": 1.9154929577464786e-06, + "loss": 0.3742, "step": 200 }, { - "epoch": 0.18, - "learning_rate": 1.656e-06, - "loss": 0.3904, + "epoch": 2.91, + "learning_rate": 1.909859154929577e-06, + "loss": 0.3562, "step": 210 }, { - "epoch": 0.19, - "learning_rate": 1.736e-06, - "loss": 0.3903, + "epoch": 3.0, + "eval_loss": 0.5526291728019714, + "eval_runtime": 126.7164, + "eval_samples_per_second": 4.198, + "eval_steps_per_second": 0.529, + "eval_wer": 0.25011248955454135, + "step": 216 + }, + { + "epoch": 3.06, + "learning_rate": 1.904225352112676e-06, + "loss": 0.3695, "step": 220 }, { - "epoch": 0.2, - "learning_rate": 1.816e-06, - "loss": 0.4197, + "epoch": 3.19, + "learning_rate": 1.8985915492957744e-06, + "loss": 0.3681, "step": 230 }, { - "epoch": 0.21, - "learning_rate": 1.8959999999999997e-06, - "loss": 0.3821, + "epoch": 3.33, + "learning_rate": 1.892957746478873e-06, + "loss": 0.3837, "step": 240 }, { - "epoch": 0.22, - "learning_rate": 1.976e-06, - "loss": 0.4262, + "epoch": 3.47, + "learning_rate": 1.8873239436619718e-06, + "loss": 0.3692, "step": 250 }, { - "epoch": 0.23, - "learning_rate": 2.056e-06, - "loss": 0.4515, + "epoch": 3.61, + "learning_rate": 1.8816901408450703e-06, + "loss": 0.3657, "step": 260 }, { - "epoch": 0.23, - "learning_rate": 2.136e-06, - "loss": 0.4216, + "epoch": 3.75, + "learning_rate": 1.8760563380281689e-06, + "loss": 0.3619, "step": 270 }, { - "epoch": 0.24, - "learning_rate": 2.216e-06, - "loss": 0.3975, + "epoch": 3.89, + "learning_rate": 1.8704225352112674e-06, + "loss": 0.3506, "step": 280 }, { - "epoch": 0.25, - "learning_rate": 2.2959999999999997e-06, - "loss": 0.4543, + "epoch": 4.0, + "eval_loss": 0.5460096597671509, + "eval_runtime": 125.8887, + "eval_samples_per_second": 4.226, + "eval_steps_per_second": 0.532, + "eval_wer": 0.2519766021726554, + "step": 288 + }, + { + "epoch": 4.03, + "learning_rate": 1.8647887323943662e-06, + "loss": 0.3831, "step": 290 }, { - "epoch": 0.26, - "learning_rate": 2.3759999999999998e-06, - "loss": 0.4256, + "epoch": 4.17, + "learning_rate": 1.8591549295774647e-06, + "loss": 0.3693, "step": 300 }, { - "epoch": 0.27, - "learning_rate": 2.456e-06, - "loss": 0.4268, + "epoch": 4.3, + "learning_rate": 1.8535211267605633e-06, + "loss": 0.3649, "step": 310 }, { - "epoch": 0.28, - "learning_rate": 2.536e-06, - "loss": 0.4296, + "epoch": 4.44, + "learning_rate": 1.8478873239436618e-06, + "loss": 0.3662, "step": 320 }, { - "epoch": 0.29, - "learning_rate": 2.616e-06, - "loss": 0.4022, + "epoch": 4.58, + "learning_rate": 1.8422535211267604e-06, + "loss": 0.3728, "step": 330 }, { - "epoch": 0.29, - "learning_rate": 2.696e-06, - "loss": 0.395, + "epoch": 4.72, + "learning_rate": 1.8366197183098591e-06, + "loss": 0.3744, "step": 340 }, { - "epoch": 0.3, - "learning_rate": 2.7759999999999998e-06, - "loss": 0.4097, + "epoch": 4.86, + "learning_rate": 1.8309859154929577e-06, + "loss": 0.3634, "step": 350 }, { - "epoch": 0.31, - "learning_rate": 2.856e-06, - "loss": 0.459, + "epoch": 5.0, + "learning_rate": 1.8253521126760562e-06, + "loss": 0.369, + "step": 360 + }, + { + "epoch": 5.0, + "eval_loss": 0.5389720797538757, + "eval_runtime": 127.3997, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.24844121617278395, "step": 360 }, { - "epoch": 0.32, - "learning_rate": 2.936e-06, - "loss": 0.4474, + "epoch": 5.14, + "learning_rate": 1.8197183098591548e-06, + "loss": 0.3617, "step": 370 }, { - "epoch": 0.33, - "learning_rate": 3.016e-06, - "loss": 0.478, + "epoch": 5.28, + "learning_rate": 1.8140845070422535e-06, + "loss": 0.3786, "step": 380 }, { - "epoch": 0.34, - "learning_rate": 3.096e-06, - "loss": 0.4229, + "epoch": 5.42, + "learning_rate": 1.808450704225352e-06, + "loss": 0.3606, "step": 390 }, { - "epoch": 0.35, - "learning_rate": 3.176e-06, - "loss": 0.4721, + "epoch": 5.55, + "learning_rate": 1.8028169014084506e-06, + "loss": 0.3748, "step": 400 }, { - "epoch": 0.36, - "learning_rate": 3.256e-06, - "loss": 0.4086, + "epoch": 5.69, + "learning_rate": 1.7971830985915492e-06, + "loss": 0.3747, "step": 410 }, { - "epoch": 0.36, - "learning_rate": 3.336e-06, - "loss": 0.403, + "epoch": 5.83, + "learning_rate": 1.791549295774648e-06, + "loss": 0.3648, "step": 420 }, { - "epoch": 0.37, - "learning_rate": 3.4159999999999996e-06, - "loss": 0.4572, + "epoch": 5.97, + "learning_rate": 1.7859154929577465e-06, + "loss": 0.3683, "step": 430 }, { - "epoch": 0.38, - "learning_rate": 3.4959999999999996e-06, - "loss": 0.4601, + "epoch": 6.0, + "eval_loss": 0.5425658822059631, + "eval_runtime": 127.6397, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.24741274024554863, + "step": 432 + }, + { + "epoch": 6.11, + "learning_rate": 1.780281690140845e-06, + "loss": 0.3886, "step": 440 }, { - "epoch": 0.39, - "learning_rate": 3.5759999999999997e-06, - "loss": 0.3899, + "epoch": 6.25, + "learning_rate": 1.7746478873239436e-06, + "loss": 0.3608, "step": 450 }, { - "epoch": 0.4, - "learning_rate": 3.656e-06, - "loss": 0.4057, + "epoch": 6.39, + "learning_rate": 1.7690140845070422e-06, + "loss": 0.3566, "step": 460 }, { - "epoch": 0.41, - "learning_rate": 3.736e-06, - "loss": 0.4259, + "epoch": 6.53, + "learning_rate": 1.763380281690141e-06, + "loss": 0.383, "step": 470 }, { - "epoch": 0.42, - "learning_rate": 3.8159999999999995e-06, - "loss": 0.4377, + "epoch": 6.66, + "learning_rate": 1.7577464788732395e-06, + "loss": 0.3775, "step": 480 }, { - "epoch": 0.42, - "learning_rate": 3.896e-06, - "loss": 0.4794, + "epoch": 6.8, + "learning_rate": 1.752112676056338e-06, + "loss": 0.3611, "step": 490 }, { - "epoch": 0.43, - "learning_rate": 3.976e-06, - "loss": 0.3526, + "epoch": 6.94, + "learning_rate": 1.7464788732394364e-06, + "loss": 0.3541, "step": 500 }, { - "epoch": 0.44, - "learning_rate": 3.999510489510489e-06, - "loss": 0.4127, + "epoch": 7.0, + "eval_loss": 0.5451989769935608, + "eval_runtime": 127.6555, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2495339718454715, + "step": 504 + }, + { + "epoch": 7.08, + "learning_rate": 1.7408450704225351e-06, + "loss": 0.3877, "step": 510 }, { - "epoch": 0.45, - "learning_rate": 3.998811188811188e-06, - "loss": 0.4779, + "epoch": 7.22, + "learning_rate": 1.7352112676056337e-06, + "loss": 0.3706, "step": 520 }, { - "epoch": 0.46, - "learning_rate": 3.998111888111888e-06, - "loss": 0.4301, + "epoch": 7.36, + "learning_rate": 1.7295774647887322e-06, + "loss": 0.3728, "step": 530 }, { - "epoch": 0.47, - "learning_rate": 3.997412587412587e-06, - "loss": 0.4345, + "epoch": 7.5, + "learning_rate": 1.7239436619718308e-06, + "loss": 0.3731, "step": 540 }, { - "epoch": 0.48, - "learning_rate": 3.996713286713287e-06, - "loss": 0.4821, + "epoch": 7.64, + "learning_rate": 1.7183098591549295e-06, + "loss": 0.3525, "step": 550 }, { - "epoch": 0.49, - "learning_rate": 3.996013986013986e-06, - "loss": 0.4621, + "epoch": 7.78, + "learning_rate": 1.712676056338028e-06, + "loss": 0.3648, "step": 560 }, { - "epoch": 0.49, - "learning_rate": 3.995314685314685e-06, - "loss": 0.4367, + "epoch": 7.91, + "learning_rate": 1.7070422535211266e-06, + "loss": 0.369, "step": 570 }, { - "epoch": 0.5, - "learning_rate": 3.994615384615384e-06, - "loss": 0.476, + "epoch": 8.0, + "eval_loss": 0.5468263030052185, + "eval_runtime": 126.4836, + "eval_samples_per_second": 4.206, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24901973388185383, + "step": 576 + }, + { + "epoch": 8.06, + "learning_rate": 1.7014084507042252e-06, + "loss": 0.377, "step": 580 }, { - "epoch": 0.51, - "learning_rate": 3.993916083916084e-06, - "loss": 0.4139, + "epoch": 8.19, + "learning_rate": 1.6957746478873237e-06, + "loss": 0.3661, "step": 590 }, { - "epoch": 0.52, - "learning_rate": 3.993216783216783e-06, - "loss": 0.4758, + "epoch": 8.33, + "learning_rate": 1.6901408450704225e-06, + "loss": 0.3637, "step": 600 }, { - "epoch": 0.53, - "learning_rate": 3.992517482517483e-06, - "loss": 0.4698, + "epoch": 8.47, + "learning_rate": 1.684507042253521e-06, + "loss": 0.3685, "step": 610 }, { - "epoch": 0.54, - "learning_rate": 3.9918181818181816e-06, - "loss": 0.4321, + "epoch": 8.61, + "learning_rate": 1.6788732394366196e-06, + "loss": 0.366, "step": 620 }, { - "epoch": 0.55, - "learning_rate": 3.991118881118881e-06, - "loss": 0.3903, + "epoch": 8.75, + "learning_rate": 1.6732394366197181e-06, + "loss": 0.375, "step": 630 }, { - "epoch": 0.55, - "learning_rate": 3.9904195804195806e-06, - "loss": 0.4298, + "epoch": 8.89, + "learning_rate": 1.667605633802817e-06, + "loss": 0.358, "step": 640 }, { - "epoch": 0.56, - "learning_rate": 3.989720279720279e-06, - "loss": 0.4029, + "epoch": 9.0, + "eval_loss": 0.5470597147941589, + "eval_runtime": 127.3076, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.24529150864562577, + "step": 648 + }, + { + "epoch": 9.03, + "learning_rate": 1.6619718309859155e-06, + "loss": 0.384, "step": 650 }, { - "epoch": 0.57, - "learning_rate": 3.989020979020979e-06, - "loss": 0.3981, + "epoch": 9.17, + "learning_rate": 1.656338028169014e-06, + "loss": 0.3688, "step": 660 }, { - "epoch": 0.58, - "learning_rate": 3.988321678321678e-06, - "loss": 0.4351, + "epoch": 9.3, + "learning_rate": 1.6507042253521126e-06, + "loss": 0.3833, "step": 670 }, { - "epoch": 0.59, - "learning_rate": 3.987622377622378e-06, - "loss": 0.3695, + "epoch": 9.44, + "learning_rate": 1.6450704225352113e-06, + "loss": 0.3762, "step": 680 }, { - "epoch": 0.6, - "learning_rate": 3.986923076923076e-06, - "loss": 0.3704, + "epoch": 9.58, + "learning_rate": 1.6394366197183099e-06, + "loss": 0.3667, "step": 690 }, { - "epoch": 0.61, - "learning_rate": 3.986223776223776e-06, - "loss": 0.473, + "epoch": 9.72, + "learning_rate": 1.6338028169014084e-06, + "loss": 0.3657, "step": 700 }, { - "epoch": 0.61, - "learning_rate": 3.985524475524475e-06, - "loss": 0.4391, + "epoch": 9.86, + "learning_rate": 1.628169014084507e-06, + "loss": 0.3698, "step": 710 }, { - "epoch": 0.62, - "learning_rate": 3.984825174825175e-06, - "loss": 0.5259, + "epoch": 10.0, + "learning_rate": 1.6225352112676055e-06, + "loss": 0.3765, "step": 720 }, { - "epoch": 0.63, - "learning_rate": 3.9841258741258735e-06, - "loss": 0.3641, + "epoch": 10.0, + "eval_loss": 0.5376302003860474, + "eval_runtime": 126.264, + "eval_samples_per_second": 4.213, + "eval_steps_per_second": 0.531, + "eval_wer": 0.24587002635469563, + "step": 720 + }, + { + "epoch": 10.14, + "learning_rate": 1.6169014084507043e-06, + "loss": 0.3595, "step": 730 }, { - "epoch": 0.64, - "learning_rate": 3.983426573426573e-06, - "loss": 0.4462, + "epoch": 10.28, + "learning_rate": 1.611830985915493e-06, + "loss": 0.4081, "step": 740 }, { - "epoch": 0.65, - "learning_rate": 3.9827272727272725e-06, - "loss": 0.4094, + "epoch": 10.42, + "learning_rate": 1.6061971830985915e-06, + "loss": 0.3759, "step": 750 }, { - "epoch": 0.66, - "learning_rate": 3.982027972027972e-06, - "loss": 0.4254, + "epoch": 10.55, + "learning_rate": 1.60056338028169e-06, + "loss": 0.3841, "step": 760 }, { - "epoch": 0.67, - "learning_rate": 3.9813286713286715e-06, - "loss": 0.4275, + "epoch": 10.69, + "learning_rate": 1.5949295774647886e-06, + "loss": 0.3742, "step": 770 }, { - "epoch": 0.68, - "learning_rate": 3.98062937062937e-06, - "loss": 0.4205, + "epoch": 10.83, + "learning_rate": 1.5892957746478871e-06, + "loss": 0.3679, "step": 780 }, { - "epoch": 0.68, - "learning_rate": 3.97993006993007e-06, - "loss": 0.3875, + "epoch": 10.97, + "learning_rate": 1.5836619718309859e-06, + "loss": 0.3654, "step": 790 }, { - "epoch": 0.69, - "learning_rate": 3.979230769230769e-06, - "loss": 0.3841, + "epoch": 11.0, + "eval_loss": 0.5407082438468933, + "eval_runtime": 126.3624, + "eval_samples_per_second": 4.21, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24856977566368837, + "step": 792 + }, + { + "epoch": 11.11, + "learning_rate": 1.5780281690140844e-06, + "loss": 0.3768, "step": 800 }, { - "epoch": 0.7, - "learning_rate": 3.978531468531469e-06, - "loss": 0.441, + "epoch": 11.25, + "learning_rate": 1.572394366197183e-06, + "loss": 0.3744, "step": 810 }, { - "epoch": 0.71, - "learning_rate": 3.977832167832168e-06, - "loss": 0.384, + "epoch": 11.39, + "learning_rate": 1.5667605633802815e-06, + "loss": 0.3552, "step": 820 }, { - "epoch": 0.72, - "learning_rate": 3.977132867132867e-06, - "loss": 0.4162, + "epoch": 11.53, + "learning_rate": 1.5611267605633803e-06, + "loss": 0.3837, "step": 830 }, { - "epoch": 0.73, - "learning_rate": 3.976433566433566e-06, - "loss": 0.4469, + "epoch": 11.66, + "learning_rate": 1.5554929577464789e-06, + "loss": 0.3543, "step": 840 }, { - "epoch": 0.74, - "learning_rate": 3.975734265734266e-06, - "loss": 0.4394, + "epoch": 11.8, + "learning_rate": 1.5498591549295774e-06, + "loss": 0.3827, "step": 850 }, { - "epoch": 0.74, - "learning_rate": 3.975034965034965e-06, - "loss": 0.3957, + "epoch": 11.94, + "learning_rate": 1.544225352112676e-06, + "loss": 0.373, "step": 860 }, { - "epoch": 0.75, - "learning_rate": 3.974335664335664e-06, - "loss": 0.4293, + "epoch": 12.0, + "eval_loss": 0.5389824509620667, + "eval_runtime": 127.3392, + "eval_samples_per_second": 4.178, + "eval_steps_per_second": 0.526, + "eval_wer": 0.24747701999100083, + "step": 864 + }, + { + "epoch": 12.08, + "learning_rate": 1.5385915492957747e-06, + "loss": 0.3676, "step": 870 }, { - "epoch": 0.76, - "learning_rate": 3.973636363636363e-06, - "loss": 0.3948, + "epoch": 12.22, + "learning_rate": 1.5329577464788733e-06, + "loss": 0.3608, "step": 880 }, { - "epoch": 0.77, - "learning_rate": 3.972937062937063e-06, - "loss": 0.4366, + "epoch": 12.36, + "learning_rate": 1.5273239436619718e-06, + "loss": 0.3712, "step": 890 }, { - "epoch": 0.78, - "learning_rate": 3.9722377622377615e-06, - "loss": 0.4388, + "epoch": 12.5, + "learning_rate": 1.5216901408450704e-06, + "loss": 0.3857, "step": 900 }, { - "epoch": 0.79, - "learning_rate": 3.971538461538461e-06, - "loss": 0.3781, + "epoch": 12.64, + "learning_rate": 1.516056338028169e-06, + "loss": 0.3474, "step": 910 }, { - "epoch": 0.8, - "learning_rate": 3.9708391608391605e-06, - "loss": 0.4174, + "epoch": 12.78, + "learning_rate": 1.5104225352112677e-06, + "loss": 0.377, "step": 920 }, { - "epoch": 0.81, - "learning_rate": 3.97013986013986e-06, - "loss": 0.393, + "epoch": 12.91, + "learning_rate": 1.5047887323943662e-06, + "loss": 0.3606, "step": 930 }, { - "epoch": 0.81, - "learning_rate": 3.9694405594405595e-06, - "loss": 0.4458, + "epoch": 13.0, + "eval_loss": 0.5441206097602844, + "eval_runtime": 127.0593, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.247219901009192, + "step": 936 + }, + { + "epoch": 13.06, + "learning_rate": 1.4991549295774648e-06, + "loss": 0.382, "step": 940 }, { - "epoch": 0.82, - "learning_rate": 3.968741258741258e-06, - "loss": 0.4534, + "epoch": 13.19, + "learning_rate": 1.4935211267605633e-06, + "loss": 0.3637, "step": 950 }, { - "epoch": 0.83, - "learning_rate": 3.968041958041958e-06, - "loss": 0.4391, + "epoch": 13.33, + "learning_rate": 1.487887323943662e-06, + "loss": 0.3787, "step": 960 }, { - "epoch": 0.84, - "learning_rate": 3.967342657342657e-06, - "loss": 0.4267, + "epoch": 13.47, + "learning_rate": 1.4822535211267604e-06, + "loss": 0.3722, "step": 970 }, { - "epoch": 0.85, - "learning_rate": 3.966643356643357e-06, - "loss": 0.4302, + "epoch": 13.61, + "learning_rate": 1.476619718309859e-06, + "loss": 0.3511, "step": 980 }, { - "epoch": 0.86, - "learning_rate": 3.965944055944056e-06, - "loss": 0.4674, + "epoch": 13.75, + "learning_rate": 1.4709859154929575e-06, + "loss": 0.3836, "step": 990 }, { - "epoch": 0.87, - "learning_rate": 3.965244755244755e-06, - "loss": 0.4632, + "epoch": 13.89, + "learning_rate": 1.4653521126760563e-06, + "loss": 0.369, "step": 1000 }, { - "epoch": 0.87, - "learning_rate": 3.964545454545454e-06, - "loss": 0.4233, - "step": 1010 + "epoch": 14.0, + "eval_loss": 0.5388315916061401, + "eval_runtime": 126.4346, + "eval_samples_per_second": 4.208, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24895545413640163, + "step": 1008 + }, + { + "epoch": 14.03, + "learning_rate": 1.4597183098591548e-06, + "loss": 0.374, + "step": 1010 }, { - "epoch": 0.88, - "learning_rate": 3.963846153846154e-06, - "loss": 0.4044, + "epoch": 14.17, + "learning_rate": 1.4540845070422534e-06, + "loss": 0.3665, "step": 1020 }, { - "epoch": 0.89, - "learning_rate": 3.963146853146853e-06, - "loss": 0.4616, + "epoch": 14.3, + "learning_rate": 1.448450704225352e-06, + "loss": 0.3777, "step": 1030 }, { - "epoch": 0.9, - "learning_rate": 3.962447552447553e-06, - "loss": 0.4386, + "epoch": 14.44, + "learning_rate": 1.4428169014084505e-06, + "loss": 0.3551, "step": 1040 }, { - "epoch": 0.91, - "learning_rate": 3.9617482517482515e-06, - "loss": 0.4154, + "epoch": 14.58, + "learning_rate": 1.4371830985915493e-06, + "loss": 0.3793, "step": 1050 }, { - "epoch": 0.92, - "learning_rate": 3.961048951048951e-06, - "loss": 0.4102, + "epoch": 14.72, + "learning_rate": 1.4315492957746478e-06, + "loss": 0.375, "step": 1060 }, { - "epoch": 0.93, - "learning_rate": 3.9603496503496505e-06, - "loss": 0.4106, + "epoch": 14.86, + "learning_rate": 1.4259154929577464e-06, + "loss": 0.3518, "step": 1070 }, { - "epoch": 0.94, - "learning_rate": 3.959650349650349e-06, - "loss": 0.449, + "epoch": 15.0, + "learning_rate": 1.420281690140845e-06, + "loss": 0.3762, + "step": 1080 + }, + { + "epoch": 15.0, + "eval_loss": 0.5389070510864258, + "eval_runtime": 126.3932, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24966253133637592, "step": 1080 }, { - "epoch": 0.94, - "learning_rate": 3.958951048951049e-06, - "loss": 0.4715, + "epoch": 15.14, + "learning_rate": 1.4146478873239437e-06, + "loss": 0.3805, "step": 1090 }, { - "epoch": 0.95, - "learning_rate": 3.958251748251748e-06, - "loss": 0.4988, + "epoch": 15.28, + "learning_rate": 1.4090140845070422e-06, + "loss": 0.3789, "step": 1100 }, { - "epoch": 0.96, - "learning_rate": 3.957552447552448e-06, - "loss": 0.4438, + "epoch": 15.42, + "learning_rate": 1.4033802816901408e-06, + "loss": 0.3621, "step": 1110 }, { - "epoch": 0.97, - "learning_rate": 3.956853146853146e-06, - "loss": 0.4058, + "epoch": 15.55, + "learning_rate": 1.3977464788732393e-06, + "loss": 0.3749, "step": 1120 }, { - "epoch": 0.98, - "learning_rate": 3.956153846153846e-06, - "loss": 0.3781, + "epoch": 15.69, + "learning_rate": 1.392112676056338e-06, + "loss": 0.3548, "step": 1130 }, { - "epoch": 0.99, - "learning_rate": 3.955454545454545e-06, - "loss": 0.3865, + "epoch": 15.83, + "learning_rate": 1.3864788732394366e-06, + "loss": 0.3794, "step": 1140 }, { - "epoch": 1.0, - "learning_rate": 3.954755244755245e-06, - "loss": 0.4806, + "epoch": 15.97, + "learning_rate": 1.3808450704225352e-06, + "loss": 0.3821, "step": 1150 }, { - "epoch": 1.0, - "eval_loss": 0.5673575401306152, - "eval_runtime": 131.9861, - "eval_samples_per_second": 4.031, - "eval_steps_per_second": 2.015, - "eval_wer": 0.26997493089927366, - "step": 1154 + "epoch": 16.0, + "eval_loss": 0.5352242588996887, + "eval_runtime": 127.705, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.525, + "eval_wer": 0.24895545413640163, + "step": 1152 }, { - "epoch": 1.01, - "learning_rate": 3.954055944055943e-06, - "loss": 0.4652, + "epoch": 16.11, + "learning_rate": 1.3752112676056337e-06, + "loss": 0.3735, "step": 1160 }, { - "epoch": 1.01, - "learning_rate": 3.953356643356643e-06, - "loss": 0.4642, + "epoch": 16.25, + "learning_rate": 1.3695774647887323e-06, + "loss": 0.3688, "step": 1170 }, { - "epoch": 1.02, - "learning_rate": 3.952657342657342e-06, - "loss": 0.4661, + "epoch": 16.39, + "learning_rate": 1.363943661971831e-06, + "loss": 0.353, "step": 1180 }, { - "epoch": 1.03, - "learning_rate": 3.951958041958042e-06, - "loss": 0.435, + "epoch": 16.53, + "learning_rate": 1.3583098591549296e-06, + "loss": 0.3848, "step": 1190 }, { - "epoch": 1.04, - "learning_rate": 3.951258741258741e-06, - "loss": 0.4269, + "epoch": 16.66, + "learning_rate": 1.3526760563380281e-06, + "loss": 0.3767, "step": 1200 }, { - "epoch": 1.05, - "learning_rate": 3.950559440559441e-06, - "loss": 0.4067, + "epoch": 16.8, + "learning_rate": 1.3470422535211267e-06, + "loss": 0.3533, "step": 1210 }, { - "epoch": 1.06, - "learning_rate": 3.9498601398601395e-06, - "loss": 0.397, + "epoch": 16.94, + "learning_rate": 1.3414084507042255e-06, + "loss": 0.3605, "step": 1220 }, { - "epoch": 1.07, - "learning_rate": 3.949160839160839e-06, - "loss": 0.3716, + "epoch": 17.0, + "eval_loss": 0.5433817505836487, + "eval_runtime": 128.2697, + "eval_samples_per_second": 4.148, + "eval_steps_per_second": 0.522, + "eval_wer": 0.24921257311821046, + "step": 1224 + }, + { + "epoch": 17.08, + "learning_rate": 1.335774647887324e-06, + "loss": 0.3997, "step": 1230 }, { - "epoch": 1.07, - "learning_rate": 3.9484615384615385e-06, - "loss": 0.446, + "epoch": 17.22, + "learning_rate": 1.3301408450704226e-06, + "loss": 0.353, "step": 1240 }, { - "epoch": 1.08, - "learning_rate": 3.947762237762238e-06, - "loss": 0.4251, + "epoch": 17.36, + "learning_rate": 1.324507042253521e-06, + "loss": 0.3618, "step": 1250 }, { - "epoch": 1.09, - "learning_rate": 3.947062937062937e-06, - "loss": 0.4264, + "epoch": 17.5, + "learning_rate": 1.3188732394366199e-06, + "loss": 0.3795, "step": 1260 }, { - "epoch": 1.1, - "learning_rate": 3.946363636363636e-06, - "loss": 0.4241, + "epoch": 17.64, + "learning_rate": 1.3132394366197182e-06, + "loss": 0.353, "step": 1270 }, { - "epoch": 1.11, - "learning_rate": 3.945664335664336e-06, - "loss": 0.3776, + "epoch": 17.78, + "learning_rate": 1.3076056338028168e-06, + "loss": 0.385, "step": 1280 }, { - "epoch": 1.12, - "learning_rate": 3.944965034965035e-06, - "loss": 0.4869, + "epoch": 17.91, + "learning_rate": 1.3019718309859153e-06, + "loss": 0.3703, "step": 1290 }, { - "epoch": 1.13, - "learning_rate": 3.944265734265734e-06, - "loss": 0.4406, + "epoch": 18.0, + "eval_loss": 0.5415087342262268, + "eval_runtime": 127.5674, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.24998393006363695, + "step": 1296 + }, + { + "epoch": 18.06, + "learning_rate": 1.2963380281690139e-06, + "loss": 0.3809, "step": 1300 }, { - "epoch": 1.14, - "learning_rate": 3.943566433566433e-06, - "loss": 0.3714, + "epoch": 18.19, + "learning_rate": 1.2907042253521126e-06, + "loss": 0.3718, "step": 1310 }, { - "epoch": 1.14, - "learning_rate": 3.942867132867133e-06, - "loss": 0.4296, + "epoch": 18.33, + "learning_rate": 1.2850704225352112e-06, + "loss": 0.3714, "step": 1320 }, { - "epoch": 1.15, - "learning_rate": 3.9421678321678314e-06, - "loss": 0.4316, + "epoch": 18.47, + "learning_rate": 1.2794366197183097e-06, + "loss": 0.3692, "step": 1330 }, { - "epoch": 1.16, - "learning_rate": 3.941468531468531e-06, - "loss": 0.407, + "epoch": 18.61, + "learning_rate": 1.2738028169014083e-06, + "loss": 0.3758, "step": 1340 }, { - "epoch": 1.17, - "learning_rate": 3.9407692307692304e-06, - "loss": 0.4837, + "epoch": 18.75, + "learning_rate": 1.268169014084507e-06, + "loss": 0.3642, "step": 1350 }, { - "epoch": 1.18, - "learning_rate": 3.94006993006993e-06, - "loss": 0.4113, + "epoch": 18.89, + "learning_rate": 1.2625352112676056e-06, + "loss": 0.3667, "step": 1360 }, { - "epoch": 1.19, - "learning_rate": 3.9393706293706294e-06, - "loss": 0.4394, + "epoch": 19.0, + "eval_loss": 0.5498944520950317, + "eval_runtime": 127.5121, + "eval_samples_per_second": 4.172, + "eval_steps_per_second": 0.525, + "eval_wer": 0.24869833515459278, + "step": 1368 + }, + { + "epoch": 19.03, + "learning_rate": 1.2569014084507041e-06, + "loss": 0.3731, "step": 1370 }, { - "epoch": 1.2, - "learning_rate": 3.938671328671328e-06, - "loss": 0.4117, + "epoch": 19.17, + "learning_rate": 1.2512676056338027e-06, + "loss": 0.3593, "step": 1380 }, { - "epoch": 1.2, - "learning_rate": 3.937972027972028e-06, - "loss": 0.4547, + "epoch": 19.3, + "learning_rate": 1.2456338028169014e-06, + "loss": 0.3763, "step": 1390 }, { - "epoch": 1.21, - "learning_rate": 3.937272727272727e-06, - "loss": 0.42, + "epoch": 19.44, + "learning_rate": 1.24e-06, + "loss": 0.3641, "step": 1400 }, { - "epoch": 1.22, - "learning_rate": 3.9365734265734266e-06, - "loss": 0.5635, + "epoch": 19.58, + "learning_rate": 1.2343661971830985e-06, + "loss": 0.3697, "step": 1410 }, { - "epoch": 1.23, - "learning_rate": 3.935874125874126e-06, - "loss": 0.363, + "epoch": 19.72, + "learning_rate": 1.228732394366197e-06, + "loss": 0.3714, "step": 1420 }, { - "epoch": 1.24, - "learning_rate": 3.935174825174825e-06, - "loss": 0.3753, + "epoch": 19.86, + "learning_rate": 1.2230985915492956e-06, + "loss": 0.3666, "step": 1430 }, { - "epoch": 1.25, - "learning_rate": 3.934475524475524e-06, - "loss": 0.414, + "epoch": 20.0, + "learning_rate": 1.2174647887323944e-06, + "loss": 0.3703, + "step": 1440 + }, + { + "epoch": 20.0, + "eval_loss": 0.5482383966445923, + "eval_runtime": 127.6825, + "eval_samples_per_second": 4.167, + "eval_steps_per_second": 0.525, + "eval_wer": 0.24940541235456706, "step": 1440 }, { - "epoch": 1.26, - "learning_rate": 3.933776223776224e-06, - "loss": 0.4094, + "epoch": 20.14, + "learning_rate": 1.211830985915493e-06, + "loss": 0.3678, "step": 1450 }, { - "epoch": 1.27, - "learning_rate": 3.933076923076923e-06, - "loss": 0.4114, + "epoch": 20.28, + "learning_rate": 1.2061971830985915e-06, + "loss": 0.3657, "step": 1460 }, { - "epoch": 1.27, - "learning_rate": 3.932377622377623e-06, - "loss": 0.44, + "epoch": 20.42, + "learning_rate": 1.20056338028169e-06, + "loss": 0.3614, "step": 1470 }, { - "epoch": 1.28, - "learning_rate": 3.931678321678321e-06, - "loss": 0.4268, + "epoch": 20.55, + "learning_rate": 1.1949295774647888e-06, + "loss": 0.3816, "step": 1480 }, { - "epoch": 1.29, - "learning_rate": 3.930979020979021e-06, - "loss": 0.4548, + "epoch": 20.69, + "learning_rate": 1.1892957746478874e-06, + "loss": 0.3652, "step": 1490 }, { - "epoch": 1.3, - "learning_rate": 3.93027972027972e-06, - "loss": 0.4305, + "epoch": 20.83, + "learning_rate": 1.183661971830986e-06, + "loss": 0.3814, "step": 1500 }, { - "epoch": 1.31, - "learning_rate": 3.929580419580419e-06, - "loss": 0.4156, + "epoch": 20.97, + "learning_rate": 1.1780281690140845e-06, + "loss": 0.369, "step": 1510 }, { - "epoch": 1.32, - "learning_rate": 3.9288811188811185e-06, - "loss": 0.3706, + "epoch": 21.0, + "eval_loss": 0.5417876839637756, + "eval_runtime": 127.2993, + "eval_samples_per_second": 4.179, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2504338882818024, + "step": 1512 + }, + { + "epoch": 21.11, + "learning_rate": 1.1723943661971832e-06, + "loss": 0.3693, "step": 1520 }, { - "epoch": 1.33, - "learning_rate": 3.928181818181818e-06, - "loss": 0.4603, + "epoch": 21.25, + "learning_rate": 1.1667605633802818e-06, + "loss": 0.3878, "step": 1530 }, { - "epoch": 1.33, - "learning_rate": 3.9274825174825175e-06, - "loss": 0.4222, + "epoch": 21.39, + "learning_rate": 1.1611267605633803e-06, + "loss": 0.3766, "step": 1540 }, { - "epoch": 1.34, - "learning_rate": 3.926783216783216e-06, - "loss": 0.436, + "epoch": 21.53, + "learning_rate": 1.1554929577464789e-06, + "loss": 0.3791, "step": 1550 }, { - "epoch": 1.35, - "learning_rate": 3.926083916083916e-06, - "loss": 0.4884, + "epoch": 21.66, + "learning_rate": 1.1498591549295772e-06, + "loss": 0.3511, "step": 1560 }, { - "epoch": 1.36, - "learning_rate": 3.925384615384615e-06, - "loss": 0.3887, + "epoch": 21.8, + "learning_rate": 1.144225352112676e-06, + "loss": 0.3627, "step": 1570 }, { - "epoch": 1.37, - "learning_rate": 3.924685314685315e-06, - "loss": 0.3735, + "epoch": 21.94, + "learning_rate": 1.1385915492957745e-06, + "loss": 0.3708, "step": 1580 }, { - "epoch": 1.38, - "learning_rate": 3.923986013986013e-06, - "loss": 0.3924, + "epoch": 22.0, + "eval_loss": 0.5436869263648987, + "eval_runtime": 127.6416, + "eval_samples_per_second": 4.168, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2478626984637141, + "step": 1584 + }, + { + "epoch": 22.08, + "learning_rate": 1.132957746478873e-06, + "loss": 0.382, "step": 1590 }, { - "epoch": 1.39, - "learning_rate": 3.923286713286713e-06, - "loss": 0.4278, + "epoch": 22.22, + "learning_rate": 1.1273239436619716e-06, + "loss": 0.3679, "step": 1600 }, { - "epoch": 1.39, - "learning_rate": 3.922587412587412e-06, - "loss": 0.4174, + "epoch": 22.36, + "learning_rate": 1.1216901408450704e-06, + "loss": 0.3632, "step": 1610 }, { - "epoch": 1.4, - "learning_rate": 3.921888111888112e-06, - "loss": 0.3733, + "epoch": 22.5, + "learning_rate": 1.116056338028169e-06, + "loss": 0.3814, "step": 1620 }, { - "epoch": 1.41, - "learning_rate": 3.921188811188811e-06, - "loss": 0.4129, + "epoch": 22.64, + "learning_rate": 1.1104225352112675e-06, + "loss": 0.3719, "step": 1630 }, { - "epoch": 1.42, - "learning_rate": 3.920489510489511e-06, - "loss": 0.3954, + "epoch": 22.78, + "learning_rate": 1.104788732394366e-06, + "loss": 0.3633, "step": 1640 }, { - "epoch": 1.43, - "learning_rate": 3.919790209790209e-06, - "loss": 0.4381, + "epoch": 22.91, + "learning_rate": 1.0991549295774648e-06, + "loss": 0.3609, "step": 1650 }, { - "epoch": 1.44, - "learning_rate": 3.919090909090909e-06, - "loss": 0.4233, + "epoch": 23.0, + "eval_loss": 0.545259952545166, + "eval_runtime": 126.5135, + "eval_samples_per_second": 4.205, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2479912579546185, + "step": 1656 + }, + { + "epoch": 23.06, + "learning_rate": 1.0935211267605633e-06, + "loss": 0.3762, "step": 1660 }, { - "epoch": 1.45, - "learning_rate": 3.918391608391608e-06, - "loss": 0.4528, + "epoch": 23.19, + "learning_rate": 1.087887323943662e-06, + "loss": 0.3726, "step": 1670 }, { - "epoch": 1.46, - "learning_rate": 3.917692307692308e-06, - "loss": 0.4385, + "epoch": 23.33, + "learning_rate": 1.0822535211267604e-06, + "loss": 0.3704, "step": 1680 }, { - "epoch": 1.46, - "learning_rate": 3.9169930069930066e-06, - "loss": 0.4328, + "epoch": 23.47, + "learning_rate": 1.076619718309859e-06, + "loss": 0.3788, "step": 1690 }, { - "epoch": 1.47, - "learning_rate": 3.916293706293706e-06, - "loss": 0.4573, + "epoch": 23.61, + "learning_rate": 1.0709859154929578e-06, + "loss": 0.3743, "step": 1700 }, { - "epoch": 1.48, - "learning_rate": 3.9155944055944056e-06, - "loss": 0.483, + "epoch": 23.75, + "learning_rate": 1.0653521126760563e-06, + "loss": 0.3677, "step": 1710 }, { - "epoch": 1.49, - "learning_rate": 3.914895104895105e-06, - "loss": 0.4303, + "epoch": 23.89, + "learning_rate": 1.0597183098591549e-06, + "loss": 0.3534, "step": 1720 }, { - "epoch": 1.5, - "learning_rate": 3.914195804195804e-06, - "loss": 0.37, + "epoch": 24.0, + "eval_loss": 0.539250373840332, + "eval_runtime": 126.0, + "eval_samples_per_second": 4.222, + "eval_steps_per_second": 0.532, + "eval_wer": 0.24837693642733175, + "step": 1728 + }, + { + "epoch": 24.03, + "learning_rate": 1.0540845070422534e-06, + "loss": 0.3721, "step": 1730 }, { - "epoch": 1.51, - "learning_rate": 3.913496503496503e-06, - "loss": 0.3627, + "epoch": 24.17, + "learning_rate": 1.0484507042253522e-06, + "loss": 0.3682, "step": 1740 }, { - "epoch": 1.52, - "learning_rate": 3.912797202797203e-06, - "loss": 0.4677, + "epoch": 24.3, + "learning_rate": 1.0428169014084507e-06, + "loss": 0.3674, "step": 1750 }, { - "epoch": 1.52, - "learning_rate": 3.912097902097902e-06, - "loss": 0.3917, + "epoch": 24.44, + "learning_rate": 1.0371830985915493e-06, + "loss": 0.3616, "step": 1760 }, { - "epoch": 1.53, - "learning_rate": 3.911398601398601e-06, - "loss": 0.3872, + "epoch": 24.58, + "learning_rate": 1.0315492957746478e-06, + "loss": 0.3809, "step": 1770 }, { - "epoch": 1.54, - "learning_rate": 3.9106993006993e-06, - "loss": 0.4367, + "epoch": 24.72, + "learning_rate": 1.0259154929577466e-06, + "loss": 0.3643, "step": 1780 }, { - "epoch": 1.55, - "learning_rate": 3.91e-06, - "loss": 0.3843, + "epoch": 24.86, + "learning_rate": 1.0202816901408451e-06, + "loss": 0.3706, "step": 1790 }, { - "epoch": 1.56, - "learning_rate": 3.909300699300699e-06, - "loss": 0.4319, + "epoch": 25.0, + "learning_rate": 1.0146478873239437e-06, + "loss": 0.3656, + "step": 1800 + }, + { + "epoch": 25.0, + "eval_loss": 0.536328911781311, + "eval_runtime": 127.0748, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.24766985922735746, "step": 1800 }, { - "epoch": 1.57, - "learning_rate": 3.908601398601398e-06, - "loss": 0.4144, + "epoch": 25.14, + "learning_rate": 1.0090140845070422e-06, + "loss": 0.3793, "step": 1810 }, { - "epoch": 1.58, - "learning_rate": 3.9079020979020975e-06, - "loss": 0.4558, + "epoch": 25.28, + "learning_rate": 1.0033802816901408e-06, + "loss": 0.3599, "step": 1820 }, { - "epoch": 1.59, - "learning_rate": 3.907202797202797e-06, - "loss": 0.4162, + "epoch": 25.42, + "learning_rate": 9.977464788732393e-07, + "loss": 0.3615, "step": 1830 }, { - "epoch": 1.59, - "learning_rate": 3.9065034965034965e-06, - "loss": 0.4819, + "epoch": 25.55, + "learning_rate": 9.921126760563379e-07, + "loss": 0.3651, "step": 1840 }, { - "epoch": 1.6, - "learning_rate": 3.905804195804196e-06, - "loss": 0.4162, + "epoch": 25.69, + "learning_rate": 9.864788732394366e-07, + "loss": 0.3711, "step": 1850 }, { - "epoch": 1.61, - "learning_rate": 3.9051048951048955e-06, - "loss": 0.4193, + "epoch": 25.83, + "learning_rate": 9.808450704225352e-07, + "loss": 0.3746, "step": 1860 }, { - "epoch": 1.62, - "learning_rate": 3.904405594405594e-06, - "loss": 0.4649, + "epoch": 25.97, + "learning_rate": 9.752112676056337e-07, + "loss": 0.3713, "step": 1870 }, { - "epoch": 1.63, - "learning_rate": 3.903706293706294e-06, - "loss": 0.4096, + "epoch": 26.0, + "eval_loss": 0.540567934513092, + "eval_runtime": 126.6741, + "eval_samples_per_second": 4.2, + "eval_steps_per_second": 0.529, + "eval_wer": 0.24612714533650445, + "step": 1872 + }, + { + "epoch": 26.11, + "learning_rate": 9.695774647887323e-07, + "loss": 0.3727, "step": 1880 }, { - "epoch": 1.64, - "learning_rate": 3.903006993006993e-06, - "loss": 0.4651, + "epoch": 26.25, + "learning_rate": 9.63943661971831e-07, + "loss": 0.3724, "step": 1890 }, { - "epoch": 1.65, - "learning_rate": 3.902307692307693e-06, - "loss": 0.4042, + "epoch": 26.39, + "learning_rate": 9.583098591549296e-07, + "loss": 0.3564, "step": 1900 }, { - "epoch": 1.65, - "learning_rate": 3.901608391608391e-06, - "loss": 0.4365, + "epoch": 26.53, + "learning_rate": 9.526760563380282e-07, + "loss": 0.3656, "step": 1910 }, { - "epoch": 1.66, - "learning_rate": 3.900909090909091e-06, - "loss": 0.4693, + "epoch": 26.66, + "learning_rate": 9.470422535211268e-07, + "loss": 0.356, "step": 1920 }, { - "epoch": 1.67, - "learning_rate": 3.90020979020979e-06, - "loss": 0.3902, + "epoch": 26.8, + "learning_rate": 9.414084507042253e-07, + "loss": 0.3826, "step": 1930 }, { - "epoch": 1.68, - "learning_rate": 3.89951048951049e-06, - "loss": 0.4166, + "epoch": 26.94, + "learning_rate": 9.357746478873238e-07, + "loss": 0.3572, "step": 1940 }, { - "epoch": 1.69, - "learning_rate": 3.898811188811188e-06, - "loss": 0.4452, + "epoch": 27.0, + "eval_loss": 0.536870539188385, + "eval_runtime": 128.7211, + "eval_samples_per_second": 4.133, + "eval_steps_per_second": 0.521, + "eval_wer": 0.2465128238092177, + "step": 1944 + }, + { + "epoch": 27.08, + "learning_rate": 9.301408450704225e-07, + "loss": 0.3724, "step": 1950 }, { - "epoch": 1.7, - "learning_rate": 3.898111888111888e-06, - "loss": 0.4268, + "epoch": 27.22, + "learning_rate": 9.24507042253521e-07, + "loss": 0.3663, "step": 1960 }, { - "epoch": 1.71, - "learning_rate": 3.897412587412587e-06, - "loss": 0.4681, + "epoch": 27.36, + "learning_rate": 9.188732394366197e-07, + "loss": 0.3558, "step": 1970 }, { - "epoch": 1.72, - "learning_rate": 3.896713286713286e-06, - "loss": 0.4049, - "step": 1980 + "epoch": 27.5, + "learning_rate": 9.132394366197182e-07, + "loss": 0.3715, + "step": 1980 }, { - "epoch": 1.72, - "learning_rate": 3.8960139860139855e-06, - "loss": 0.471, + "epoch": 27.64, + "learning_rate": 9.076056338028169e-07, + "loss": 0.3579, "step": 1990 }, { - "epoch": 1.73, - "learning_rate": 3.895314685314685e-06, - "loss": 0.4484, + "epoch": 27.78, + "learning_rate": 9.019718309859154e-07, + "loss": 0.3775, "step": 2000 }, { - "epoch": 1.74, - "learning_rate": 3.8946153846153845e-06, - "loss": 0.4749, + "epoch": 27.91, + "learning_rate": 8.963380281690141e-07, + "loss": 0.3665, "step": 2010 }, { - "epoch": 1.75, - "learning_rate": 3.893916083916084e-06, - "loss": 0.4929, + "epoch": 28.0, + "eval_loss": 0.5374864935874939, + "eval_runtime": 126.8744, + "eval_samples_per_second": 4.193, + "eval_steps_per_second": 0.528, + "eval_wer": 0.24664138330012214, + "step": 2016 + }, + { + "epoch": 28.06, + "learning_rate": 8.907042253521126e-07, + "loss": 0.3765, "step": 2020 }, { - "epoch": 1.76, - "learning_rate": 3.893216783216783e-06, - "loss": 0.4125, + "epoch": 28.19, + "learning_rate": 8.850704225352113e-07, + "loss": 0.367, "step": 2030 }, { - "epoch": 1.77, - "learning_rate": 3.892517482517482e-06, - "loss": 0.4171, + "epoch": 28.33, + "learning_rate": 8.794366197183098e-07, + "loss": 0.3783, "step": 2040 }, { - "epoch": 1.78, - "learning_rate": 3.891818181818182e-06, - "loss": 0.5211, + "epoch": 28.47, + "learning_rate": 8.738028169014085e-07, + "loss": 0.3651, "step": 2050 }, { - "epoch": 1.78, - "learning_rate": 3.891118881118881e-06, - "loss": 0.4221, + "epoch": 28.61, + "learning_rate": 8.68169014084507e-07, + "loss": 0.3717, "step": 2060 }, { - "epoch": 1.79, - "learning_rate": 3.890419580419581e-06, - "loss": 0.4622, + "epoch": 28.75, + "learning_rate": 8.625352112676056e-07, + "loss": 0.374, "step": 2070 }, { - "epoch": 1.8, - "learning_rate": 3.889720279720279e-06, - "loss": 0.403, + "epoch": 28.89, + "learning_rate": 8.569014084507041e-07, + "loss": 0.3748, "step": 2080 }, { - "epoch": 1.81, - "learning_rate": 3.889020979020979e-06, - "loss": 0.432, + "epoch": 29.0, + "eval_loss": 0.536729633808136, + "eval_runtime": 127.2778, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2479912579546185, + "step": 2088 + }, + { + "epoch": 29.03, + "learning_rate": 8.512676056338027e-07, + "loss": 0.3693, "step": 2090 }, { - "epoch": 1.82, - "learning_rate": 3.888321678321678e-06, - "loss": 0.439, + "epoch": 29.17, + "learning_rate": 8.456338028169013e-07, + "loss": 0.3585, "step": 2100 }, { - "epoch": 1.83, - "learning_rate": 3.887622377622378e-06, - "loss": 0.4619, + "epoch": 29.3, + "learning_rate": 8.399999999999999e-07, + "loss": 0.3669, "step": 2110 }, { - "epoch": 1.84, - "learning_rate": 3.8869230769230765e-06, - "loss": 0.4404, + "epoch": 29.44, + "learning_rate": 8.343661971830986e-07, + "loss": 0.3709, "step": 2120 }, { - "epoch": 1.85, - "learning_rate": 3.886223776223776e-06, - "loss": 0.4447, + "epoch": 29.58, + "learning_rate": 8.287323943661971e-07, + "loss": 0.3646, "step": 2130 }, { - "epoch": 1.85, - "learning_rate": 3.8855244755244755e-06, - "loss": 0.4246, + "epoch": 29.72, + "learning_rate": 8.230985915492958e-07, + "loss": 0.3628, "step": 2140 }, { - "epoch": 1.86, - "learning_rate": 3.884825174825175e-06, - "loss": 0.4289, + "epoch": 29.86, + "learning_rate": 8.174647887323943e-07, + "loss": 0.3709, "step": 2150 }, { - "epoch": 1.87, - "learning_rate": 3.884125874125874e-06, - "loss": 0.5245, + "epoch": 30.0, + "learning_rate": 8.11830985915493e-07, + "loss": 0.3769, + "step": 2160 + }, + { + "epoch": 30.0, + "eval_loss": 0.5359097719192505, + "eval_runtime": 127.9102, + "eval_samples_per_second": 4.159, + "eval_steps_per_second": 0.524, + "eval_wer": 0.24587002635469563, "step": 2160 }, { - "epoch": 1.88, - "learning_rate": 3.883426573426573e-06, - "loss": 0.405, + "epoch": 30.14, + "learning_rate": 8.061971830985915e-07, + "loss": 0.3729, "step": 2170 }, { - "epoch": 1.89, - "learning_rate": 3.882727272727273e-06, - "loss": 0.4307, + "epoch": 30.28, + "learning_rate": 8.005633802816902e-07, + "loss": 0.3729, "step": 2180 }, { - "epoch": 1.9, - "learning_rate": 3.882027972027972e-06, - "loss": 0.4372, + "epoch": 30.42, + "learning_rate": 7.949295774647887e-07, + "loss": 0.3582, "step": 2190 }, { - "epoch": 1.91, - "learning_rate": 3.881328671328671e-06, - "loss": 0.4754, + "epoch": 30.55, + "learning_rate": 7.892957746478873e-07, + "loss": 0.3717, "step": 2200 }, { - "epoch": 1.91, - "learning_rate": 3.88062937062937e-06, - "loss": 0.4121, + "epoch": 30.69, + "learning_rate": 7.836619718309859e-07, + "loss": 0.3557, "step": 2210 }, { - "epoch": 1.92, - "learning_rate": 3.88e-06, - "loss": 0.44, + "epoch": 30.83, + "learning_rate": 7.780281690140845e-07, + "loss": 0.3725, "step": 2220 }, { - "epoch": 1.93, - "learning_rate": 3.879300699300699e-06, - "loss": 0.4103, + "epoch": 30.97, + "learning_rate": 7.72394366197183e-07, + "loss": 0.3634, "step": 2230 }, { - "epoch": 1.94, - "learning_rate": 3.878601398601398e-06, - "loss": 0.4443, + "epoch": 31.0, + "eval_loss": 0.5417142510414124, + "eval_runtime": 127.5766, + "eval_samples_per_second": 4.17, + "eval_steps_per_second": 0.525, + "eval_wer": 0.2470913415182876, + "step": 2232 + }, + { + "epoch": 31.11, + "learning_rate": 7.667605633802816e-07, + "loss": 0.3762, "step": 2240 }, { - "epoch": 1.95, - "learning_rate": 3.877902097902098e-06, - "loss": 0.4186, + "epoch": 31.25, + "learning_rate": 7.611267605633802e-07, + "loss": 0.3653, "step": 2250 }, { - "epoch": 1.96, - "learning_rate": 3.877202797202797e-06, - "loss": 0.4083, + "epoch": 31.39, + "learning_rate": 7.554929577464788e-07, + "loss": 0.3425, "step": 2260 }, { - "epoch": 1.97, - "learning_rate": 3.876503496503497e-06, - "loss": 0.4846, + "epoch": 31.53, + "learning_rate": 7.498591549295774e-07, + "loss": 0.363, "step": 2270 }, { - "epoch": 1.98, - "learning_rate": 3.875804195804195e-06, - "loss": 0.4019, + "epoch": 31.66, + "learning_rate": 7.44225352112676e-07, + "loss": 0.36, "step": 2280 }, { - "epoch": 1.98, - "learning_rate": 3.875104895104895e-06, - "loss": 0.4598, + "epoch": 31.8, + "learning_rate": 7.385915492957746e-07, + "loss": 0.3709, "step": 2290 }, { - "epoch": 1.99, - "learning_rate": 3.874405594405594e-06, - "loss": 0.4109, + "epoch": 31.94, + "learning_rate": 7.329577464788732e-07, + "loss": 0.3627, "step": 2300 }, { - "epoch": 2.0, - "eval_loss": 0.5667211413383484, - "eval_runtime": 132.8098, - "eval_samples_per_second": 4.006, - "eval_steps_per_second": 2.003, - "eval_wer": 0.2739602751173105, - "step": 2308 + "epoch": 32.0, + "eval_loss": 0.5398467779159546, + "eval_runtime": 128.1832, + "eval_samples_per_second": 4.15, + "eval_steps_per_second": 0.523, + "eval_wer": 0.24734846050009643, + "step": 2304 }, { - "epoch": 2.0, - "learning_rate": 3.873706293706294e-06, - "loss": 0.4696, + "epoch": 32.08, + "learning_rate": 7.273239436619719e-07, + "loss": 0.3842, "step": 2310 }, { - "epoch": 2.01, - "learning_rate": 3.8730069930069925e-06, - "loss": 0.4279, + "epoch": 32.22, + "learning_rate": 7.216901408450704e-07, + "loss": 0.3702, "step": 2320 }, { - "epoch": 2.02, - "learning_rate": 3.872307692307692e-06, - "loss": 0.4668, + "epoch": 32.36, + "learning_rate": 7.16056338028169e-07, + "loss": 0.3721, "step": 2330 }, { - "epoch": 2.03, - "learning_rate": 3.8716083916083915e-06, - "loss": 0.3705, + "epoch": 32.5, + "learning_rate": 7.104225352112676e-07, + "loss": 0.3728, "step": 2340 }, { - "epoch": 2.04, - "learning_rate": 3.870909090909091e-06, - "loss": 0.4757, + "epoch": 32.64, + "learning_rate": 7.047887323943662e-07, + "loss": 0.3482, "step": 2350 }, { - "epoch": 2.05, - "learning_rate": 3.87020979020979e-06, - "loss": 0.4652, + "epoch": 32.78, + "learning_rate": 6.991549295774648e-07, + "loss": 0.3691, "step": 2360 }, { - "epoch": 2.05, - "learning_rate": 3.869510489510489e-06, - "loss": 0.4144, + "epoch": 32.91, + "learning_rate": 6.935211267605634e-07, + "loss": 0.3497, "step": 2370 }, { - "epoch": 2.06, - "learning_rate": 3.868811188811189e-06, - "loss": 0.4441, + "epoch": 33.0, + "eval_loss": 0.5427743792533875, + "eval_runtime": 126.3596, + "eval_samples_per_second": 4.21, + "eval_steps_per_second": 0.53, + "eval_wer": 0.24831265668187955, + "step": 2376 + }, + { + "epoch": 33.06, + "learning_rate": 6.878873239436619e-07, + "loss": 0.3807, "step": 2380 }, { - "epoch": 2.07, - "learning_rate": 3.868111888111888e-06, - "loss": 0.4188, + "epoch": 33.19, + "learning_rate": 6.822535211267605e-07, + "loss": 0.3613, "step": 2390 }, { - "epoch": 2.08, - "learning_rate": 3.867412587412587e-06, - "loss": 0.4725, + "epoch": 33.33, + "learning_rate": 6.766197183098591e-07, + "loss": 0.3699, "step": 2400 }, { - "epoch": 2.09, - "learning_rate": 3.866713286713286e-06, - "loss": 0.4527, + "epoch": 33.47, + "learning_rate": 6.709859154929577e-07, + "loss": 0.3712, "step": 2410 }, { - "epoch": 2.1, - "learning_rate": 3.866013986013986e-06, - "loss": 0.4182, + "epoch": 33.61, + "learning_rate": 6.653521126760563e-07, + "loss": 0.3717, "step": 2420 }, { - "epoch": 2.11, - "learning_rate": 3.865314685314685e-06, - "loss": 0.3844, + "epoch": 33.75, + "learning_rate": 6.597183098591549e-07, + "loss": 0.3586, "step": 2430 }, { - "epoch": 2.11, - "learning_rate": 3.864615384615384e-06, - "loss": 0.4113, + "epoch": 33.89, + "learning_rate": 6.540845070422535e-07, + "loss": 0.3479, "step": 2440 }, { - "epoch": 2.12, - "learning_rate": 3.8639160839160835e-06, - "loss": 0.4282, + "epoch": 34.0, + "eval_loss": 0.5389805436134338, + "eval_runtime": 126.1536, + "eval_samples_per_second": 4.217, + "eval_steps_per_second": 0.531, + "eval_wer": 0.24811981744552292, + "step": 2448 + }, + { + "epoch": 34.03, + "learning_rate": 6.484507042253521e-07, + "loss": 0.3858, "step": 2450 }, { - "epoch": 2.13, - "learning_rate": 3.863216783216783e-06, - "loss": 0.4842, + "epoch": 34.17, + "learning_rate": 6.428169014084506e-07, + "loss": 0.3618, "step": 2460 }, { - "epoch": 2.14, - "learning_rate": 3.8625174825174825e-06, - "loss": 0.4822, + "epoch": 34.3, + "learning_rate": 6.371830985915493e-07, + "loss": 0.3707, "step": 2470 }, { - "epoch": 2.15, - "learning_rate": 3.861818181818182e-06, - "loss": 0.3696, + "epoch": 34.44, + "learning_rate": 6.315492957746478e-07, + "loss": 0.3718, "step": 2480 }, { - "epoch": 2.16, - "learning_rate": 3.8611188811188815e-06, - "loss": 0.4124, + "epoch": 34.58, + "learning_rate": 6.259154929577465e-07, + "loss": 0.3534, "step": 2490 }, { - "epoch": 2.17, - "learning_rate": 3.86041958041958e-06, - "loss": 0.4624, + "epoch": 34.72, + "learning_rate": 6.20281690140845e-07, + "loss": 0.3613, "step": 2500 }, { - "epoch": 2.17, - "learning_rate": 3.85972027972028e-06, - "loss": 0.3711, + "epoch": 34.86, + "learning_rate": 6.146478873239437e-07, + "loss": 0.3623, "step": 2510 }, { - "epoch": 2.18, - "learning_rate": 3.859020979020979e-06, - "loss": 0.4044, + "epoch": 35.0, + "learning_rate": 6.090140845070423e-07, + "loss": 0.363, + "step": 2520 + }, + { + "epoch": 35.0, + "eval_loss": 0.5388094782829285, + "eval_runtime": 126.3817, + "eval_samples_per_second": 4.209, + "eval_steps_per_second": 0.53, + "eval_wer": 0.2477984187182619, "step": 2520 }, { - "epoch": 2.19, - "learning_rate": 3.858321678321679e-06, - "loss": 0.4136, + "epoch": 35.14, + "learning_rate": 6.033802816901408e-07, + "loss": 0.3673, "step": 2530 }, { - "epoch": 2.2, - "learning_rate": 3.857622377622377e-06, - "loss": 0.3982, + "epoch": 35.28, + "learning_rate": 5.977464788732394e-07, + "loss": 0.3787, "step": 2540 }, { - "epoch": 2.21, - "learning_rate": 3.856923076923077e-06, - "loss": 0.4259, + "epoch": 35.42, + "learning_rate": 5.92112676056338e-07, + "loss": 0.3589, "step": 2550 }, { - "epoch": 2.22, - "learning_rate": 3.856223776223776e-06, - "loss": 0.4588, + "epoch": 35.55, + "learning_rate": 5.864788732394366e-07, + "loss": 0.3732, "step": 2560 }, { - "epoch": 2.23, - "learning_rate": 3.855524475524475e-06, - "loss": 0.4043, + "epoch": 35.69, + "learning_rate": 5.808450704225352e-07, + "loss": 0.3626, "step": 2570 }, { - "epoch": 2.24, - "learning_rate": 3.854825174825174e-06, - "loss": 0.4745, + "epoch": 35.83, + "learning_rate": 5.752112676056338e-07, + "loss": 0.3671, "step": 2580 }, { - "epoch": 2.24, - "learning_rate": 3.854125874125874e-06, - "loss": 0.3965, + "epoch": 35.97, + "learning_rate": 5.695774647887323e-07, + "loss": 0.3622, "step": 2590 }, { - "epoch": 2.25, - "learning_rate": 3.853426573426573e-06, - "loss": 0.449, + "epoch": 36.0, + "eval_loss": 0.5396317839622498, + "eval_runtime": 127.4298, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.24895545413640163, + "step": 2592 + }, + { + "epoch": 36.11, + "learning_rate": 5.63943661971831e-07, + "loss": 0.3753, "step": 2600 }, { - "epoch": 2.26, - "learning_rate": 3.852727272727272e-06, - "loss": 0.4828, + "epoch": 36.25, + "learning_rate": 5.583098591549295e-07, + "loss": 0.3594, "step": 2610 }, { - "epoch": 2.27, - "learning_rate": 3.8520279720279715e-06, - "loss": 0.4536, + "epoch": 36.39, + "learning_rate": 5.526760563380282e-07, + "loss": 0.3507, "step": 2620 }, { - "epoch": 2.28, - "learning_rate": 3.851328671328671e-06, - "loss": 0.4621, + "epoch": 36.53, + "learning_rate": 5.470422535211267e-07, + "loss": 0.3842, "step": 2630 }, { - "epoch": 2.29, - "learning_rate": 3.8506293706293705e-06, - "loss": 0.396, + "epoch": 36.66, + "learning_rate": 5.414084507042254e-07, + "loss": 0.3699, "step": 2640 }, { - "epoch": 2.3, - "learning_rate": 3.84993006993007e-06, - "loss": 0.4883, + "epoch": 36.8, + "learning_rate": 5.357746478873239e-07, + "loss": 0.368, "step": 2650 }, { - "epoch": 2.3, - "learning_rate": 3.849230769230769e-06, - "loss": 0.4217, + "epoch": 36.94, + "learning_rate": 5.301408450704226e-07, + "loss": 0.3685, "step": 2660 }, { - "epoch": 2.31, - "learning_rate": 3.848531468531468e-06, - "loss": 0.479, + "epoch": 37.0, + "eval_loss": 0.5408422946929932, + "eval_runtime": 127.9531, + "eval_samples_per_second": 4.158, + "eval_steps_per_second": 0.524, + "eval_wer": 0.2478626984637141, + "step": 2664 + }, + { + "epoch": 37.08, + "learning_rate": 5.24507042253521e-07, + "loss": 0.3811, "step": 2670 }, { - "epoch": 2.32, - "learning_rate": 3.847832167832168e-06, - "loss": 0.4179, + "epoch": 37.22, + "learning_rate": 5.188732394366197e-07, + "loss": 0.3746, "step": 2680 }, { - "epoch": 2.33, - "learning_rate": 3.847132867132867e-06, - "loss": 0.4314, + "epoch": 37.36, + "learning_rate": 5.132394366197182e-07, + "loss": 0.3654, "step": 2690 }, { - "epoch": 2.34, - "learning_rate": 3.846433566433567e-06, - "loss": 0.4006, + "epoch": 37.5, + "learning_rate": 5.076056338028169e-07, + "loss": 0.3634, "step": 2700 }, { - "epoch": 2.35, - "learning_rate": 3.845734265734266e-06, - "loss": 0.4523, + "epoch": 37.64, + "learning_rate": 5.019718309859154e-07, + "loss": 0.3468, "step": 2710 }, { - "epoch": 2.36, - "learning_rate": 3.845034965034965e-06, - "loss": 0.4371, + "epoch": 37.78, + "learning_rate": 4.96338028169014e-07, + "loss": 0.3737, "step": 2720 }, { - "epoch": 2.37, - "learning_rate": 3.844335664335664e-06, - "loss": 0.4165, + "epoch": 37.91, + "learning_rate": 4.907042253521126e-07, + "loss": 0.356, "step": 2730 }, { - "epoch": 2.37, - "learning_rate": 3.843636363636364e-06, - "loss": 0.4169, + "epoch": 38.0, + "eval_loss": 0.5385244488716125, + "eval_runtime": 128.0588, + "eval_samples_per_second": 4.154, + "eval_steps_per_second": 0.523, + "eval_wer": 0.24593430610014785, + "step": 2736 + }, + { + "epoch": 38.06, + "learning_rate": 4.850704225352112e-07, + "loss": 0.3759, "step": 2740 }, { - "epoch": 2.38, - "learning_rate": 3.8429370629370624e-06, - "loss": 0.4272, + "epoch": 38.19, + "learning_rate": 4.794366197183099e-07, + "loss": 0.3653, "step": 2750 }, { - "epoch": 2.39, - "learning_rate": 3.842237762237762e-06, - "loss": 0.4621, + "epoch": 38.33, + "learning_rate": 4.7380281690140846e-07, + "loss": 0.3482, "step": 2760 }, { - "epoch": 2.4, - "learning_rate": 3.8415384615384614e-06, - "loss": 0.4041, + "epoch": 38.47, + "learning_rate": 4.6816901408450706e-07, + "loss": 0.3606, "step": 2770 }, { - "epoch": 2.41, - "learning_rate": 3.840839160839161e-06, - "loss": 0.4403, + "epoch": 38.61, + "learning_rate": 4.6253521126760566e-07, + "loss": 0.3666, "step": 2780 }, { - "epoch": 2.42, - "learning_rate": 3.84013986013986e-06, - "loss": 0.4194, + "epoch": 38.75, + "learning_rate": 4.5690140845070416e-07, + "loss": 0.3706, "step": 2790 }, { - "epoch": 2.43, - "learning_rate": 3.839440559440559e-06, - "loss": 0.447, + "epoch": 38.89, + "learning_rate": 4.5126760563380276e-07, + "loss": 0.3529, "step": 2800 }, { - "epoch": 2.43, - "learning_rate": 3.838741258741259e-06, - "loss": 0.3986, + "epoch": 39.0, + "eval_loss": 0.5388730764389038, + "eval_runtime": 127.0748, + "eval_samples_per_second": 4.187, + "eval_steps_per_second": 0.527, + "eval_wer": 0.24670566304557434, + "step": 2808 + }, + { + "epoch": 39.03, + "learning_rate": 4.4563380281690137e-07, + "loss": 0.3863, "step": 2810 }, { - "epoch": 2.44, - "learning_rate": 3.838041958041958e-06, - "loss": 0.4245, + "epoch": 39.17, + "learning_rate": 4.3999999999999997e-07, + "loss": 0.3677, "step": 2820 }, { - "epoch": 2.45, - "learning_rate": 3.837342657342657e-06, - "loss": 0.4412, + "epoch": 39.3, + "learning_rate": 4.3436619718309857e-07, + "loss": 0.3677, "step": 2830 }, { - "epoch": 2.46, - "learning_rate": 3.836643356643356e-06, - "loss": 0.4128, + "epoch": 39.44, + "learning_rate": 4.287323943661972e-07, + "loss": 0.353, "step": 2840 }, { - "epoch": 2.47, - "learning_rate": 3.835944055944056e-06, - "loss": 0.4236, + "epoch": 39.58, + "learning_rate": 4.230985915492958e-07, + "loss": 0.3658, "step": 2850 }, { - "epoch": 2.48, - "learning_rate": 3.835244755244755e-06, - "loss": 0.5051, + "epoch": 39.72, + "learning_rate": 4.1746478873239433e-07, + "loss": 0.3712, "step": 2860 }, { - "epoch": 2.49, - "learning_rate": 3.834545454545455e-06, - "loss": 0.3899, + "epoch": 39.86, + "learning_rate": 4.1183098591549293e-07, + "loss": 0.3577, "step": 2870 }, { - "epoch": 2.5, - "learning_rate": 3.833846153846153e-06, - "loss": 0.402, + "epoch": 40.0, + "learning_rate": 4.0619718309859153e-07, + "loss": 0.3702, "step": 2880 }, { - "epoch": 2.5, - "learning_rate": 3.833146853146853e-06, - "loss": 0.4073, + "epoch": 40.0, + "eval_loss": 0.5392444729804993, + "eval_runtime": 128.3773, + "eval_samples_per_second": 4.144, + "eval_steps_per_second": 0.522, + "eval_wer": 0.24818409719097512, + "step": 2880 + }, + { + "epoch": 40.14, + "learning_rate": 4.0056338028169014e-07, + "loss": 0.3731, "step": 2890 }, { - "epoch": 2.51, - "learning_rate": 3.832447552447552e-06, - "loss": 0.4324, + "epoch": 40.28, + "learning_rate": 3.9492957746478874e-07, + "loss": 0.3599, "step": 2900 }, { - "epoch": 2.52, - "learning_rate": 3.831748251748252e-06, - "loss": 0.4846, + "epoch": 40.42, + "learning_rate": 3.8929577464788734e-07, + "loss": 0.3603, "step": 2910 }, { - "epoch": 2.53, - "learning_rate": 3.831048951048951e-06, - "loss": 0.4426, + "epoch": 40.55, + "learning_rate": 3.836619718309859e-07, + "loss": 0.3668, "step": 2920 }, { - "epoch": 2.54, - "learning_rate": 3.83034965034965e-06, - "loss": 0.3916, + "epoch": 40.69, + "learning_rate": 3.7802816901408444e-07, + "loss": 0.3518, "step": 2930 }, { - "epoch": 2.55, - "learning_rate": 3.8296503496503495e-06, - "loss": 0.3975, + "epoch": 40.83, + "learning_rate": 3.7239436619718305e-07, + "loss": 0.3774, "step": 2940 }, { - "epoch": 2.56, - "learning_rate": 3.828951048951049e-06, - "loss": 0.439, + "epoch": 40.97, + "learning_rate": 3.6676056338028165e-07, + "loss": 0.3645, "step": 2950 }, { - "epoch": 2.56, - "learning_rate": 3.8282517482517485e-06, - "loss": 0.4785, + "epoch": 41.0, + "eval_loss": 0.5407747030258179, + "eval_runtime": 128.2235, + "eval_samples_per_second": 4.149, + "eval_steps_per_second": 0.523, + "eval_wer": 0.24670566304557434, + "step": 2952 + }, + { + "epoch": 41.11, + "learning_rate": 3.6112676056338025e-07, + "loss": 0.3806, "step": 2960 }, { - "epoch": 2.57, - "learning_rate": 3.827552447552447e-06, - "loss": 0.4355, + "epoch": 41.25, + "learning_rate": 3.5549295774647886e-07, + "loss": 0.3694, "step": 2970 }, { - "epoch": 2.58, - "learning_rate": 3.826853146853147e-06, - "loss": 0.3911, - "step": 2980 + "epoch": 41.39, + "learning_rate": 3.4985915492957746e-07, + "loss": 0.3531, + "step": 2980 }, { - "epoch": 2.59, - "learning_rate": 3.826153846153846e-06, - "loss": 0.4459, + "epoch": 41.53, + "learning_rate": 3.4422535211267606e-07, + "loss": 0.3604, "step": 2990 }, { - "epoch": 2.6, - "learning_rate": 3.825454545454546e-06, - "loss": 0.4879, + "epoch": 41.66, + "learning_rate": 3.3859154929577466e-07, + "loss": 0.3691, "step": 3000 }, { - "epoch": 2.61, - "learning_rate": 3.824755244755244e-06, - "loss": 0.4449, + "epoch": 41.8, + "learning_rate": 3.329577464788732e-07, + "loss": 0.3744, "step": 3010 }, { - "epoch": 2.62, - "learning_rate": 3.824055944055944e-06, - "loss": 0.4061, + "epoch": 41.94, + "learning_rate": 3.273239436619718e-07, + "loss": 0.3489, "step": 3020 }, { - "epoch": 2.63, - "learning_rate": 3.823356643356643e-06, - "loss": 0.3946, + "epoch": 42.0, + "eval_loss": 0.5406195521354675, + "eval_runtime": 128.1617, + "eval_samples_per_second": 4.151, + "eval_steps_per_second": 0.523, + "eval_wer": 0.24741274024554863, + "step": 3024 + }, + { + "epoch": 42.08, + "learning_rate": 3.216901408450704e-07, + "loss": 0.3823, "step": 3030 }, { - "epoch": 2.63, - "learning_rate": 3.822657342657342e-06, - "loss": 0.4905, + "epoch": 42.22, + "learning_rate": 3.16056338028169e-07, + "loss": 0.3526, "step": 3040 }, { - "epoch": 2.64, - "learning_rate": 3.8219580419580414e-06, - "loss": 0.4251, + "epoch": 42.36, + "learning_rate": 3.104225352112676e-07, + "loss": 0.3669, "step": 3050 }, { - "epoch": 2.65, - "learning_rate": 3.821258741258741e-06, - "loss": 0.4532, + "epoch": 42.5, + "learning_rate": 3.047887323943662e-07, + "loss": 0.3766, "step": 3060 }, { - "epoch": 2.66, - "learning_rate": 3.82055944055944e-06, - "loss": 0.3845, + "epoch": 42.64, + "learning_rate": 2.9971830985915494e-07, + "loss": 0.3746, "step": 3070 }, { - "epoch": 2.67, - "learning_rate": 3.81986013986014e-06, - "loss": 0.4218, + "epoch": 42.78, + "learning_rate": 2.9408450704225354e-07, + "loss": 0.3825, "step": 3080 }, { - "epoch": 2.68, - "learning_rate": 3.8191608391608386e-06, - "loss": 0.3965, + "epoch": 42.91, + "learning_rate": 2.8845070422535214e-07, + "loss": 0.3556, "step": 3090 }, { - "epoch": 2.69, - "learning_rate": 3.818461538461538e-06, - "loss": 0.4261, + "epoch": 43.0, + "eval_loss": 0.5401654839515686, + "eval_runtime": 128.4726, + "eval_samples_per_second": 4.141, + "eval_steps_per_second": 0.522, + "eval_wer": 0.2471556212637398, + "step": 3096 + }, + { + "epoch": 43.06, + "learning_rate": 2.828169014084507e-07, + "loss": 0.3766, "step": 3100 }, { - "epoch": 2.69, - "learning_rate": 3.8177622377622376e-06, - "loss": 0.3952, + "epoch": 43.19, + "learning_rate": 2.7718309859154924e-07, + "loss": 0.3609, "step": 3110 }, { - "epoch": 2.7, - "learning_rate": 3.817062937062937e-06, - "loss": 0.4337, + "epoch": 43.33, + "learning_rate": 2.7154929577464784e-07, + "loss": 0.3619, "step": 3120 }, { - "epoch": 2.71, - "learning_rate": 3.8163636363636366e-06, - "loss": 0.3518, + "epoch": 43.47, + "learning_rate": 2.6591549295774645e-07, + "loss": 0.3635, "step": 3130 }, { - "epoch": 2.72, - "learning_rate": 3.815664335664336e-06, - "loss": 0.4675, + "epoch": 43.61, + "learning_rate": 2.6028169014084505e-07, + "loss": 0.3668, "step": 3140 }, { - "epoch": 2.73, - "learning_rate": 3.814965034965035e-06, - "loss": 0.4442, + "epoch": 43.75, + "learning_rate": 2.5464788732394365e-07, + "loss": 0.368, "step": 3150 }, { - "epoch": 2.74, - "learning_rate": 3.814265734265734e-06, - "loss": 0.4365, + "epoch": 43.89, + "learning_rate": 2.4901408450704226e-07, + "loss": 0.356, "step": 3160 }, { - "epoch": 2.75, - "learning_rate": 3.8135664335664333e-06, - "loss": 0.3938, + "epoch": 44.0, + "eval_loss": 0.538616418838501, + "eval_runtime": 127.2122, + "eval_samples_per_second": 4.182, + "eval_steps_per_second": 0.527, + "eval_wer": 0.24676994279102654, + "step": 3168 + }, + { + "epoch": 44.03, + "learning_rate": 2.433802816901408e-07, + "loss": 0.3737, "step": 3170 }, { - "epoch": 2.76, - "learning_rate": 3.8128671328671328e-06, - "loss": 0.3778, + "epoch": 44.17, + "learning_rate": 2.3774647887323944e-07, + "loss": 0.3586, "step": 3180 }, { - "epoch": 2.76, - "learning_rate": 3.812167832167832e-06, - "loss": 0.43, + "epoch": 44.3, + "learning_rate": 2.32112676056338e-07, + "loss": 0.3721, "step": 3190 }, { - "epoch": 2.77, - "learning_rate": 3.8114685314685313e-06, - "loss": 0.3924, + "epoch": 44.44, + "learning_rate": 2.264788732394366e-07, + "loss": 0.3611, "step": 3200 }, { - "epoch": 2.78, - "learning_rate": 3.810769230769231e-06, - "loss": 0.4437, + "epoch": 44.58, + "learning_rate": 2.208450704225352e-07, + "loss": 0.3664, "step": 3210 }, { - "epoch": 2.79, - "learning_rate": 3.81006993006993e-06, - "loss": 0.4305, + "epoch": 44.72, + "learning_rate": 2.152112676056338e-07, + "loss": 0.354, "step": 3220 }, { - "epoch": 2.8, - "learning_rate": 3.809370629370629e-06, - "loss": 0.4576, + "epoch": 44.86, + "learning_rate": 2.095774647887324e-07, + "loss": 0.3545, "step": 3230 }, { - "epoch": 2.81, - "learning_rate": 3.8086713286713285e-06, - "loss": 0.4286, + "epoch": 45.0, + "learning_rate": 2.0394366197183097e-07, + "loss": 0.3632, + "step": 3240 + }, + { + "epoch": 45.0, + "eval_loss": 0.5401559472084045, + "eval_runtime": 126.237, + "eval_samples_per_second": 4.214, + "eval_steps_per_second": 0.531, + "eval_wer": 0.24631998457286108, "step": 3240 }, { - "epoch": 2.82, - "learning_rate": 3.807972027972028e-06, - "loss": 0.4298, + "epoch": 45.14, + "learning_rate": 1.9830985915492958e-07, + "loss": 0.3597, "step": 3250 }, { - "epoch": 2.82, - "learning_rate": 3.807272727272727e-06, - "loss": 0.4584, + "epoch": 45.28, + "learning_rate": 1.9267605633802815e-07, + "loss": 0.3655, "step": 3260 }, { - "epoch": 2.83, - "learning_rate": 3.8065734265734265e-06, - "loss": 0.4241, + "epoch": 45.42, + "learning_rate": 1.8704225352112676e-07, + "loss": 0.3644, "step": 3270 }, { - "epoch": 2.84, - "learning_rate": 3.8058741258741256e-06, - "loss": 0.44, + "epoch": 45.55, + "learning_rate": 1.8140845070422533e-07, + "loss": 0.378, "step": 3280 }, { - "epoch": 2.85, - "learning_rate": 3.8051748251748247e-06, - "loss": 0.3742, + "epoch": 45.69, + "learning_rate": 1.7577464788732394e-07, + "loss": 0.3613, "step": 3290 }, { - "epoch": 2.86, - "learning_rate": 3.804475524475524e-06, - "loss": 0.3989, + "epoch": 45.83, + "learning_rate": 1.7014084507042254e-07, + "loss": 0.3659, "step": 3300 }, { - "epoch": 2.87, - "learning_rate": 3.8037762237762237e-06, - "loss": 0.44, + "epoch": 45.97, + "learning_rate": 1.6450704225352112e-07, + "loss": 0.3693, "step": 3310 }, { - "epoch": 2.88, - "learning_rate": 3.803076923076923e-06, - "loss": 0.4348, + "epoch": 46.0, + "eval_loss": 0.5401335954666138, + "eval_runtime": 127.2873, + "eval_samples_per_second": 4.18, + "eval_steps_per_second": 0.526, + "eval_wer": 0.2471556212637398, + "step": 3312 + }, + { + "epoch": 46.11, + "learning_rate": 1.588732394366197e-07, + "loss": 0.3782, "step": 3320 }, { - "epoch": 2.89, - "learning_rate": 3.8023776223776223e-06, - "loss": 0.424, + "epoch": 46.25, + "learning_rate": 1.532394366197183e-07, + "loss": 0.3685, "step": 3330 }, { - "epoch": 2.89, - "learning_rate": 3.8016783216783213e-06, - "loss": 0.3793, + "epoch": 46.39, + "learning_rate": 1.476056338028169e-07, + "loss": 0.3586, "step": 3340 }, { - "epoch": 2.9, - "learning_rate": 3.800979020979021e-06, - "loss": 0.4532, + "epoch": 46.53, + "learning_rate": 1.4197183098591547e-07, + "loss": 0.3648, "step": 3350 }, { - "epoch": 2.91, - "learning_rate": 3.8002797202797203e-06, - "loss": 0.4313, + "epoch": 46.66, + "learning_rate": 1.3633802816901408e-07, + "loss": 0.3639, "step": 3360 }, { - "epoch": 2.92, - "learning_rate": 3.7995804195804194e-06, - "loss": 0.4326, + "epoch": 46.8, + "learning_rate": 1.3070422535211268e-07, + "loss": 0.367, "step": 3370 }, { - "epoch": 2.93, - "learning_rate": 3.798881118881119e-06, - "loss": 0.3999, + "epoch": 46.94, + "learning_rate": 1.2507042253521128e-07, + "loss": 0.3593, "step": 3380 }, { - "epoch": 2.94, - "learning_rate": 3.798181818181818e-06, - "loss": 0.4128, + "epoch": 47.0, + "eval_loss": 0.5389713048934937, + "eval_runtime": 127.3901, + "eval_samples_per_second": 4.176, + "eval_steps_per_second": 0.526, + "eval_wer": 0.24625570482740888, + "step": 3384 + }, + { + "epoch": 47.08, + "learning_rate": 1.1943661971830986e-07, + "loss": 0.3798, "step": 3390 }, { - "epoch": 2.95, - "learning_rate": 3.797482517482517e-06, - "loss": 0.4218, + "epoch": 47.22, + "learning_rate": 1.1380281690140845e-07, + "loss": 0.3644, "step": 3400 }, { - "epoch": 2.95, - "learning_rate": 3.7967832167832165e-06, - "loss": 0.4248, + "epoch": 47.36, + "learning_rate": 1.0816901408450704e-07, + "loss": 0.3545, "step": 3410 }, { - "epoch": 2.96, - "learning_rate": 3.796083916083916e-06, - "loss": 0.3458, + "epoch": 47.5, + "learning_rate": 1.0253521126760563e-07, + "loss": 0.3633, "step": 3420 }, { - "epoch": 2.97, - "learning_rate": 3.7953846153846155e-06, - "loss": 0.4079, + "epoch": 47.64, + "learning_rate": 9.690140845070423e-08, + "loss": 0.3532, "step": 3430 }, { - "epoch": 2.98, - "learning_rate": 3.794685314685314e-06, - "loss": 0.43, + "epoch": 47.78, + "learning_rate": 9.126760563380281e-08, + "loss": 0.3705, "step": 3440 }, { - "epoch": 2.99, - "learning_rate": 3.7939860139860137e-06, - "loss": 0.4257, + "epoch": 47.91, + "learning_rate": 8.56338028169014e-08, + "loss": 0.3515, "step": 3450 }, { - "epoch": 3.0, - "learning_rate": 3.793286713286713e-06, - "loss": 0.4183, - "step": 3460 + "epoch": 48.0, + "eval_loss": 0.5398772954940796, + "eval_runtime": 129.9986, + "eval_samples_per_second": 4.092, + "eval_steps_per_second": 0.515, + "eval_wer": 0.24676994279102654, + "step": 3456 }, { - "epoch": 3.0, - "eval_loss": 0.5650942921638489, - "eval_runtime": 133.5311, - "eval_samples_per_second": 3.984, - "eval_steps_per_second": 1.992, - "eval_wer": 0.2742173940991194, - "step": 3462 + "epoch": 48.06, + "learning_rate": 8e-08, + "loss": 0.3824, + "step": 3460 }, { - "epoch": 3.01, - "learning_rate": 3.7925874125874123e-06, - "loss": 0.4397, + "epoch": 48.19, + "learning_rate": 7.436619718309858e-08, + "loss": 0.3749, "step": 3470 }, { - "epoch": 3.02, - "learning_rate": 3.7918881118881117e-06, - "loss": 0.4497, + "epoch": 48.33, + "learning_rate": 6.873239436619718e-08, + "loss": 0.3759, "step": 3480 }, { - "epoch": 3.02, - "learning_rate": 3.7911888111888112e-06, - "loss": 0.4424, + "epoch": 48.47, + "learning_rate": 6.309859154929577e-08, + "loss": 0.354, "step": 3490 }, { - "epoch": 3.03, - "learning_rate": 3.7904895104895103e-06, - "loss": 0.5406, + "epoch": 48.61, + "learning_rate": 5.746478873239436e-08, + "loss": 0.3629, "step": 3500 }, { - "epoch": 3.04, - "learning_rate": 3.7897902097902094e-06, - "loss": 0.5165, + "epoch": 48.75, + "learning_rate": 5.183098591549295e-08, + "loss": 0.3605, "step": 3510 }, { - "epoch": 3.05, - "learning_rate": 3.789090909090909e-06, - "loss": 0.388, + "epoch": 48.89, + "learning_rate": 4.619718309859155e-08, + "loss": 0.3485, "step": 3520 }, { - "epoch": 3.06, - "learning_rate": 3.7883916083916084e-06, - "loss": 0.3958, + "epoch": 49.0, + "eval_loss": 0.5391861796379089, + "eval_runtime": 127.4223, + "eval_samples_per_second": 4.175, + "eval_steps_per_second": 0.526, + "eval_wer": 0.24612714533650445, + "step": 3528 + }, + { + "epoch": 49.03, + "learning_rate": 4.0563380281690137e-08, + "loss": 0.3749, "step": 3530 }, { - "epoch": 3.07, - "learning_rate": 3.787692307692308e-06, - "loss": 0.3826, + "epoch": 49.17, + "learning_rate": 3.492957746478873e-08, + "loss": 0.3625, "step": 3540 }, { - "epoch": 3.08, - "learning_rate": 3.7869930069930065e-06, - "loss": 0.4399, + "epoch": 49.3, + "learning_rate": 2.9295774647887323e-08, + "loss": 0.3768, "step": 3550 }, { - "epoch": 3.08, - "learning_rate": 3.786293706293706e-06, - "loss": 0.4987, + "epoch": 49.44, + "learning_rate": 2.3661971830985916e-08, + "loss": 0.3523, "step": 3560 }, { - "epoch": 3.09, - "learning_rate": 3.7855944055944055e-06, - "loss": 0.4862, + "epoch": 49.58, + "learning_rate": 1.802816901408451e-08, + "loss": 0.3673, "step": 3570 }, { - "epoch": 3.1, - "learning_rate": 3.7848951048951046e-06, - "loss": 0.4197, + "epoch": 49.72, + "learning_rate": 1.2394366197183099e-08, + "loss": 0.3624, "step": 3580 }, { - "epoch": 3.11, - "learning_rate": 3.784195804195804e-06, - "loss": 0.4305, + "epoch": 49.86, + "learning_rate": 6.76056338028169e-09, + "loss": 0.3632, "step": 3590 }, { - "epoch": 3.12, - "learning_rate": 3.7834965034965036e-06, - "loss": 0.4473, + "epoch": 50.0, + "learning_rate": 1.1267605633802818e-09, + "loss": 0.3591, "step": 3600 }, - { - "epoch": 3.13, - "learning_rate": 3.7827972027972027e-06, - "loss": 0.4162, - "step": 3610 - }, - { - "epoch": 3.14, - "learning_rate": 3.7820979020979017e-06, - "loss": 0.4128, - "step": 3620 - }, - { - "epoch": 3.15, - "learning_rate": 3.7813986013986012e-06, - "loss": 0.4461, - "step": 3630 - }, - { - "epoch": 3.15, - "learning_rate": 3.7806993006993007e-06, - "loss": 0.3405, - "step": 3640 - }, - { - "epoch": 3.16, - "learning_rate": 3.78e-06, - "loss": 0.4331, - "step": 3650 - }, - { - "epoch": 3.17, - "learning_rate": 3.779300699300699e-06, - "loss": 0.4181, - "step": 3660 - }, - { - "epoch": 3.18, - "learning_rate": 3.7786013986013984e-06, - "loss": 0.4451, - "step": 3670 - }, - { - "epoch": 3.19, - "learning_rate": 3.777902097902098e-06, - "loss": 0.4119, - "step": 3680 - }, - { - "epoch": 3.2, - "learning_rate": 3.777202797202797e-06, - "loss": 0.4076, - "step": 3690 - }, - { - "epoch": 3.21, - "learning_rate": 3.7765034965034964e-06, - "loss": 0.4246, - "step": 3700 - }, - { - "epoch": 3.21, - "learning_rate": 3.775804195804196e-06, - "loss": 0.4545, - "step": 3710 - }, - { - "epoch": 3.22, - "learning_rate": 3.7751048951048946e-06, - "loss": 0.4589, - "step": 3720 - }, - { - "epoch": 3.23, - "learning_rate": 3.774405594405594e-06, - "loss": 0.3718, - "step": 3730 - }, - { - "epoch": 3.24, - "learning_rate": 3.7737062937062936e-06, - "loss": 0.4376, - "step": 3740 - }, - { - "epoch": 3.25, - "learning_rate": 3.773006993006993e-06, - "loss": 0.4793, - "step": 3750 - }, - { - "epoch": 3.26, - "learning_rate": 3.772307692307692e-06, - "loss": 0.4543, - "step": 3760 - }, - { - "epoch": 3.27, - "learning_rate": 3.7716083916083912e-06, - "loss": 0.4228, - "step": 3770 - }, - { - "epoch": 3.28, - "learning_rate": 3.7709090909090907e-06, - "loss": 0.4624, - "step": 3780 - }, - { - "epoch": 3.28, - "learning_rate": 3.7702097902097902e-06, - "loss": 0.4135, - "step": 3790 - }, - { - "epoch": 3.29, - "learning_rate": 3.7695104895104893e-06, - "loss": 0.3678, - "step": 3800 - }, - { - "epoch": 3.3, - "learning_rate": 3.768811188811189e-06, - "loss": 0.5265, - "step": 3810 - }, - { - "epoch": 3.31, - "learning_rate": 3.768111888111888e-06, - "loss": 0.4423, - "step": 3820 - }, - { - "epoch": 3.32, - "learning_rate": 3.767412587412587e-06, - "loss": 0.3714, - "step": 3830 - }, - { - "epoch": 3.33, - "learning_rate": 3.7667132867132864e-06, - "loss": 0.4268, - "step": 3840 - }, - { - "epoch": 3.34, - "learning_rate": 3.766013986013986e-06, - "loss": 0.4489, - "step": 3850 - }, - { - "epoch": 3.34, - "learning_rate": 3.7653146853146854e-06, - "loss": 0.5035, - "step": 3860 - }, - { - "epoch": 3.35, - "learning_rate": 3.7646153846153845e-06, - "loss": 0.4687, - "step": 3870 - }, - { - "epoch": 3.36, - "learning_rate": 3.7639160839160836e-06, - "loss": 0.4121, - "step": 3880 - }, - { - "epoch": 3.37, - "learning_rate": 3.763216783216783e-06, - "loss": 0.369, - "step": 3890 - }, - { - "epoch": 3.38, - "learning_rate": 3.762517482517482e-06, - "loss": 0.4527, - "step": 3900 - }, - { - "epoch": 3.39, - "learning_rate": 3.7618181818181816e-06, - "loss": 0.4308, - "step": 3910 - }, - { - "epoch": 3.4, - "learning_rate": 3.761118881118881e-06, - "loss": 0.4128, - "step": 3920 - }, - { - "epoch": 3.41, - "learning_rate": 3.7604195804195802e-06, - "loss": 0.521, - "step": 3930 - }, - { - "epoch": 3.41, - "learning_rate": 3.7597202797202793e-06, - "loss": 0.4238, - "step": 3940 - }, - { - "epoch": 3.42, - "learning_rate": 3.7590209790209788e-06, - "loss": 0.4704, - "step": 3950 - }, - { - "epoch": 3.43, - "learning_rate": 3.7583216783216783e-06, - "loss": 0.4642, - "step": 3960 - }, - { - "epoch": 3.44, - "learning_rate": 3.7576223776223778e-06, - "loss": 0.4667, - "step": 3970 - }, - { - "epoch": 3.45, - "learning_rate": 3.7569230769230764e-06, - "loss": 0.4269, - "step": 3980 - }, - { - "epoch": 3.46, - "learning_rate": 3.756223776223776e-06, - "loss": 0.4289, - "step": 3990 - }, - { - "epoch": 3.47, - "learning_rate": 3.7555244755244754e-06, - "loss": 0.4133, - "step": 4000 - }, - { - "epoch": 3.47, - "learning_rate": 3.7548251748251745e-06, - "loss": 0.421, - "step": 4010 - }, - { - "epoch": 3.48, - "learning_rate": 3.754125874125874e-06, - "loss": 0.4431, - "step": 4020 - }, - { - "epoch": 3.49, - "learning_rate": 3.7534265734265735e-06, - "loss": 0.42, - "step": 4030 - }, - { - "epoch": 3.5, - "learning_rate": 3.7527272727272726e-06, - "loss": 0.3878, - "step": 4040 - }, - { - "epoch": 3.51, - "learning_rate": 3.7520279720279716e-06, - "loss": 0.4353, - "step": 4050 - }, - { - "epoch": 3.52, - "learning_rate": 3.751328671328671e-06, - "loss": 0.4756, - "step": 4060 - }, - { - "epoch": 3.53, - "learning_rate": 3.7506293706293706e-06, - "loss": 0.4126, - "step": 4070 - }, - { - "epoch": 3.54, - "learning_rate": 3.7499300699300697e-06, - "loss": 0.4228, - "step": 4080 - }, - { - "epoch": 3.54, - "learning_rate": 3.7492307692307688e-06, - "loss": 0.4061, - "step": 4090 - }, - { - "epoch": 3.55, - "learning_rate": 3.7485314685314683e-06, - "loss": 0.4199, - "step": 4100 - }, - { - "epoch": 3.56, - "learning_rate": 3.7478321678321678e-06, - "loss": 0.3854, - "step": 4110 - }, - { - "epoch": 3.57, - "learning_rate": 3.747132867132867e-06, - "loss": 0.4457, - "step": 4120 - }, - { - "epoch": 3.58, - "learning_rate": 3.7464335664335663e-06, - "loss": 0.4599, - "step": 4130 - }, - { - "epoch": 3.59, - "learning_rate": 3.745734265734266e-06, - "loss": 0.4054, - "step": 4140 - }, - { - "epoch": 3.6, - "learning_rate": 3.745034965034965e-06, - "loss": 0.3808, - "step": 4150 - }, - { - "epoch": 3.6, - "learning_rate": 3.744335664335664e-06, - "loss": 0.4587, - "step": 4160 - }, - { - "epoch": 3.61, - "learning_rate": 3.7436363636363635e-06, - "loss": 0.4025, - "step": 4170 - }, - { - "epoch": 3.62, - "learning_rate": 3.742937062937063e-06, - "loss": 0.4518, - "step": 4180 - }, - { - "epoch": 3.63, - "learning_rate": 3.742237762237762e-06, - "loss": 0.4274, - "step": 4190 - }, - { - "epoch": 3.64, - "learning_rate": 3.741538461538461e-06, - "loss": 0.3934, - "step": 4200 - }, - { - "epoch": 3.65, - "learning_rate": 3.7408391608391606e-06, - "loss": 0.4389, - "step": 4210 - }, - { - "epoch": 3.66, - "learning_rate": 3.74013986013986e-06, - "loss": 0.4551, - "step": 4220 - }, - { - "epoch": 3.67, - "learning_rate": 3.739440559440559e-06, - "loss": 0.437, - "step": 4230 - }, - { - "epoch": 3.67, - "learning_rate": 3.7387412587412587e-06, - "loss": 0.3626, - "step": 4240 - }, - { - "epoch": 3.68, - "learning_rate": 3.738041958041958e-06, - "loss": 0.4564, - "step": 4250 - }, - { - "epoch": 3.69, - "learning_rate": 3.737342657342657e-06, - "loss": 0.4565, - "step": 4260 - }, - { - "epoch": 3.7, - "learning_rate": 3.7366433566433563e-06, - "loss": 0.3513, - "step": 4270 - }, - { - "epoch": 3.71, - "learning_rate": 3.735944055944056e-06, - "loss": 0.4132, - "step": 4280 - }, - { - "epoch": 3.72, - "learning_rate": 3.7352447552447553e-06, - "loss": 0.4435, - "step": 4290 - }, - { - "epoch": 3.73, - "learning_rate": 3.7345454545454544e-06, - "loss": 0.4355, - "step": 4300 - }, - { - "epoch": 3.73, - "learning_rate": 3.7338461538461535e-06, - "loss": 0.4505, - "step": 4310 - }, - { - "epoch": 3.74, - "learning_rate": 3.733146853146853e-06, - "loss": 0.4314, - "step": 4320 - }, - { - "epoch": 3.75, - "learning_rate": 3.7324475524475525e-06, - "loss": 0.4169, - "step": 4330 - }, - { - "epoch": 3.76, - "learning_rate": 3.7317482517482515e-06, - "loss": 0.4096, - "step": 4340 - }, - { - "epoch": 3.77, - "learning_rate": 3.731048951048951e-06, - "loss": 0.4357, - "step": 4350 - }, - { - "epoch": 3.78, - "learning_rate": 3.73034965034965e-06, - "loss": 0.4208, - "step": 4360 - }, - { - "epoch": 3.79, - "learning_rate": 3.729650349650349e-06, - "loss": 0.4181, - "step": 4370 - }, - { - "epoch": 3.8, - "learning_rate": 3.7289510489510487e-06, - "loss": 0.3545, - "step": 4380 - }, - { - "epoch": 3.8, - "learning_rate": 3.728251748251748e-06, - "loss": 0.4258, - "step": 4390 - }, - { - "epoch": 3.81, - "learning_rate": 3.7275524475524477e-06, - "loss": 0.435, - "step": 4400 - }, - { - "epoch": 3.82, - "learning_rate": 3.7268531468531468e-06, - "loss": 0.4027, - "step": 4410 - }, - { - "epoch": 3.83, - "learning_rate": 3.726153846153846e-06, - "loss": 0.3978, - "step": 4420 - }, - { - "epoch": 3.84, - "learning_rate": 3.7254545454545453e-06, - "loss": 0.4087, - "step": 4430 - }, - { - "epoch": 3.85, - "learning_rate": 3.7247552447552444e-06, - "loss": 0.4328, - "step": 4440 - }, - { - "epoch": 3.86, - "learning_rate": 3.724055944055944e-06, - "loss": 0.4419, - "step": 4450 - }, - { - "epoch": 3.86, - "learning_rate": 3.7233566433566434e-06, - "loss": 0.4289, - "step": 4460 - }, - { - "epoch": 3.87, - "learning_rate": 3.7226573426573425e-06, - "loss": 0.4208, - "step": 4470 - }, - { - "epoch": 3.88, - "learning_rate": 3.7219580419580415e-06, - "loss": 0.3757, - "step": 4480 - }, - { - "epoch": 3.89, - "learning_rate": 3.721258741258741e-06, - "loss": 0.4707, - "step": 4490 - }, - { - "epoch": 3.9, - "learning_rate": 3.7205594405594405e-06, - "loss": 0.4446, - "step": 4500 - }, - { - "epoch": 3.91, - "learning_rate": 3.71986013986014e-06, - "loss": 0.4387, - "step": 4510 - }, - { - "epoch": 3.92, - "learning_rate": 3.719160839160839e-06, - "loss": 0.3761, - "step": 4520 - }, - { - "epoch": 3.93, - "learning_rate": 3.718461538461538e-06, - "loss": 0.3772, - "step": 4530 - }, - { - "epoch": 3.93, - "learning_rate": 3.7177622377622377e-06, - "loss": 0.3546, - "step": 4540 - }, - { - "epoch": 3.94, - "learning_rate": 3.7170629370629367e-06, - "loss": 0.3831, - "step": 4550 - }, - { - "epoch": 3.95, - "learning_rate": 3.7163636363636362e-06, - "loss": 0.4194, - "step": 4560 - }, - { - "epoch": 3.96, - "learning_rate": 3.7156643356643357e-06, - "loss": 0.3452, - "step": 4570 - }, - { - "epoch": 3.97, - "learning_rate": 3.714965034965035e-06, - "loss": 0.426, - "step": 4580 - }, - { - "epoch": 3.98, - "learning_rate": 3.714265734265734e-06, - "loss": 0.4237, - "step": 4590 - }, - { - "epoch": 3.99, - "learning_rate": 3.7135664335664334e-06, - "loss": 0.4047, - "step": 4600 - }, - { - "epoch": 3.99, - "learning_rate": 3.712867132867133e-06, - "loss": 0.4618, - "step": 4610 - }, - { - "epoch": 4.0, - "eval_loss": 0.5653170347213745, - "eval_runtime": 133.4467, - "eval_samples_per_second": 3.987, - "eval_steps_per_second": 1.993, - "eval_wer": 0.2675323005720897, - "step": 4616 - }, - { - "epoch": 4.0, - "learning_rate": 3.712167832167832e-06, - "loss": 0.4252, - "step": 4620 - }, - { - "epoch": 4.01, - "learning_rate": 3.711468531468531e-06, - "loss": 0.4812, - "step": 4630 - }, - { - "epoch": 4.02, - "learning_rate": 3.7107692307692305e-06, - "loss": 0.3366, - "step": 4640 - }, - { - "epoch": 4.03, - "learning_rate": 3.71006993006993e-06, - "loss": 0.4217, - "step": 4650 - }, - { - "epoch": 4.04, - "learning_rate": 3.709370629370629e-06, - "loss": 0.459, - "step": 4660 - }, - { - "epoch": 4.05, - "learning_rate": 3.7086713286713286e-06, - "loss": 0.4434, - "step": 4670 - }, - { - "epoch": 4.06, - "learning_rate": 3.707972027972028e-06, - "loss": 0.4243, - "step": 4680 - }, - { - "epoch": 4.06, - "learning_rate": 3.7072727272727267e-06, - "loss": 0.4106, - "step": 4690 - }, - { - "epoch": 4.07, - "learning_rate": 3.7065734265734262e-06, - "loss": 0.4261, - "step": 4700 - }, - { - "epoch": 4.08, - "learning_rate": 3.7058741258741257e-06, - "loss": 0.4321, - "step": 4710 - }, - { - "epoch": 4.09, - "learning_rate": 3.7051748251748252e-06, - "loss": 0.4066, - "step": 4720 - }, - { - "epoch": 4.1, - "learning_rate": 3.7044755244755243e-06, - "loss": 0.3874, - "step": 4730 - }, - { - "epoch": 4.11, - "learning_rate": 3.7037762237762234e-06, - "loss": 0.3956, - "step": 4740 - }, - { - "epoch": 4.12, - "learning_rate": 3.703076923076923e-06, - "loss": 0.3823, - "step": 4750 - }, - { - "epoch": 4.12, - "learning_rate": 3.7023776223776224e-06, - "loss": 0.3953, - "step": 4760 - }, - { - "epoch": 4.13, - "learning_rate": 3.7016783216783214e-06, - "loss": 0.4628, - "step": 4770 - }, - { - "epoch": 4.14, - "learning_rate": 3.700979020979021e-06, - "loss": 0.4156, - "step": 4780 - }, - { - "epoch": 4.15, - "learning_rate": 3.7002797202797204e-06, - "loss": 0.3769, - "step": 4790 - }, - { - "epoch": 4.16, - "learning_rate": 3.699580419580419e-06, - "loss": 0.3838, - "step": 4800 - }, - { - "epoch": 4.17, - "learning_rate": 3.6988811188811186e-06, - "loss": 0.3492, - "step": 4810 - }, - { - "epoch": 4.18, - "learning_rate": 3.698181818181818e-06, - "loss": 0.3568, - "step": 4820 - }, - { - "epoch": 4.19, - "learning_rate": 3.6974825174825176e-06, - "loss": 0.4544, - "step": 4830 - }, - { - "epoch": 4.19, - "learning_rate": 3.6967832167832167e-06, - "loss": 0.3981, - "step": 4840 - }, - { - "epoch": 4.2, - "learning_rate": 3.6960839160839157e-06, - "loss": 0.4105, - "step": 4850 - }, - { - "epoch": 4.21, - "learning_rate": 3.6953846153846152e-06, - "loss": 0.422, - "step": 4860 - }, - { - "epoch": 4.22, - "learning_rate": 3.6946853146853143e-06, - "loss": 0.3775, - "step": 4870 - }, - { - "epoch": 4.23, - "learning_rate": 3.693986013986014e-06, - "loss": 0.4763, - "step": 4880 - }, - { - "epoch": 4.24, - "learning_rate": 3.6932867132867133e-06, - "loss": 0.3996, - "step": 4890 - }, - { - "epoch": 4.25, - "learning_rate": 3.6925874125874128e-06, - "loss": 0.4157, - "step": 4900 - }, - { - "epoch": 4.25, - "learning_rate": 3.6918881118881114e-06, - "loss": 0.4038, - "step": 4910 - }, - { - "epoch": 4.26, - "learning_rate": 3.691188811188811e-06, - "loss": 0.4375, - "step": 4920 - }, - { - "epoch": 4.27, - "learning_rate": 3.6904895104895104e-06, - "loss": 0.3983, - "step": 4930 - }, - { - "epoch": 4.28, - "learning_rate": 3.68979020979021e-06, - "loss": 0.376, - "step": 4940 - }, - { - "epoch": 4.29, - "learning_rate": 3.689090909090909e-06, - "loss": 0.4349, - "step": 4950 - }, - { - "epoch": 4.3, - "learning_rate": 3.688391608391608e-06, - "loss": 0.4193, - "step": 4960 - }, - { - "epoch": 4.31, - "learning_rate": 3.6876923076923076e-06, - "loss": 0.4872, - "step": 4970 - }, - { - "epoch": 4.32, - "learning_rate": 3.6869930069930066e-06, - "loss": 0.4245, - "step": 4980 - }, - { - "epoch": 4.32, - "learning_rate": 3.686293706293706e-06, - "loss": 0.3797, - "step": 4990 - }, - { - "epoch": 4.33, - "learning_rate": 3.6855944055944056e-06, - "loss": 0.3833, - "step": 5000 - }, - { - "epoch": 4.34, - "learning_rate": 3.6848951048951047e-06, - "loss": 0.4412, - "step": 5010 - }, - { - "epoch": 4.35, - "learning_rate": 3.6841958041958038e-06, - "loss": 0.4183, - "step": 5020 - }, - { - "epoch": 4.36, - "learning_rate": 3.6834965034965033e-06, - "loss": 0.3991, - "step": 5030 - }, - { - "epoch": 4.37, - "learning_rate": 3.6827972027972028e-06, - "loss": 0.4045, - "step": 5040 - }, - { - "epoch": 4.38, - "learning_rate": 3.682097902097902e-06, - "loss": 0.419, - "step": 5050 - }, - { - "epoch": 4.38, - "learning_rate": 3.6814685314685313e-06, - "loss": 0.4751, - "step": 5060 - }, - { - "epoch": 4.39, - "learning_rate": 3.6807692307692304e-06, - "loss": 0.4423, - "step": 5070 - }, - { - "epoch": 4.4, - "learning_rate": 3.68006993006993e-06, - "loss": 0.4421, - "step": 5080 - }, - { - "epoch": 4.41, - "learning_rate": 3.6793706293706294e-06, - "loss": 0.4682, - "step": 5090 - }, - { - "epoch": 4.42, - "learning_rate": 3.678671328671329e-06, - "loss": 0.4166, - "step": 5100 - }, - { - "epoch": 4.43, - "learning_rate": 3.6779720279720275e-06, - "loss": 0.3662, - "step": 5110 - }, - { - "epoch": 4.44, - "learning_rate": 3.677272727272727e-06, - "loss": 0.4312, - "step": 5120 - }, - { - "epoch": 4.45, - "learning_rate": 3.6765734265734265e-06, - "loss": 0.4069, - "step": 5130 - }, - { - "epoch": 4.45, - "learning_rate": 3.6758741258741256e-06, - "loss": 0.3921, - "step": 5140 - }, - { - "epoch": 4.46, - "learning_rate": 3.675174825174825e-06, - "loss": 0.4333, - "step": 5150 - }, - { - "epoch": 4.47, - "learning_rate": 3.674475524475524e-06, - "loss": 0.4416, - "step": 5160 - }, - { - "epoch": 4.48, - "learning_rate": 3.6737762237762237e-06, - "loss": 0.4463, - "step": 5170 - }, - { - "epoch": 4.49, - "learning_rate": 3.6730769230769227e-06, - "loss": 0.439, - "step": 5180 - }, - { - "epoch": 4.5, - "learning_rate": 3.6723776223776222e-06, - "loss": 0.4153, - "step": 5190 - }, - { - "epoch": 4.51, - "learning_rate": 3.6716783216783217e-06, - "loss": 0.4236, - "step": 5200 - }, - { - "epoch": 4.51, - "learning_rate": 3.670979020979021e-06, - "loss": 0.4354, - "step": 5210 - }, - { - "epoch": 4.52, - "learning_rate": 3.67027972027972e-06, - "loss": 0.4321, - "step": 5220 - }, - { - "epoch": 4.53, - "learning_rate": 3.6695804195804194e-06, - "loss": 0.4584, - "step": 5230 - }, - { - "epoch": 4.54, - "learning_rate": 3.668881118881119e-06, - "loss": 0.4637, - "step": 5240 - }, - { - "epoch": 4.55, - "learning_rate": 3.668181818181818e-06, - "loss": 0.414, - "step": 5250 - }, - { - "epoch": 4.56, - "learning_rate": 3.6674825174825174e-06, - "loss": 0.4954, - "step": 5260 - }, - { - "epoch": 4.57, - "learning_rate": 3.6667832167832165e-06, - "loss": 0.3738, - "step": 5270 - }, - { - "epoch": 4.58, - "learning_rate": 3.666083916083916e-06, - "loss": 0.3884, - "step": 5280 - }, - { - "epoch": 4.58, - "learning_rate": 3.665384615384615e-06, - "loss": 0.3681, - "step": 5290 - }, - { - "epoch": 4.59, - "learning_rate": 3.6646853146853146e-06, - "loss": 0.4485, - "step": 5300 - }, - { - "epoch": 4.6, - "learning_rate": 3.663986013986014e-06, - "loss": 0.4244, - "step": 5310 - }, - { - "epoch": 4.61, - "learning_rate": 3.6632867132867127e-06, - "loss": 0.3891, - "step": 5320 - }, - { - "epoch": 4.62, - "learning_rate": 3.6625874125874122e-06, - "loss": 0.4124, - "step": 5330 - }, - { - "epoch": 4.63, - "learning_rate": 3.6618881118881117e-06, - "loss": 0.3761, - "step": 5340 - }, - { - "epoch": 4.64, - "learning_rate": 3.6611888111888112e-06, - "loss": 0.3659, - "step": 5350 - }, - { - "epoch": 4.64, - "learning_rate": 3.6604895104895103e-06, - "loss": 0.4604, - "step": 5360 - }, - { - "epoch": 4.65, - "learning_rate": 3.65979020979021e-06, - "loss": 0.4532, - "step": 5370 - }, - { - "epoch": 4.66, - "learning_rate": 3.659090909090909e-06, - "loss": 0.4347, - "step": 5380 - }, - { - "epoch": 4.67, - "learning_rate": 3.6583916083916084e-06, - "loss": 0.4212, - "step": 5390 - }, - { - "epoch": 4.68, - "learning_rate": 3.6576923076923074e-06, - "loss": 0.457, - "step": 5400 - }, - { - "epoch": 4.69, - "learning_rate": 3.656993006993007e-06, - "loss": 0.5144, - "step": 5410 - }, - { - "epoch": 4.7, - "learning_rate": 3.6562937062937064e-06, - "loss": 0.4147, - "step": 5420 - }, - { - "epoch": 4.71, - "learning_rate": 3.655594405594405e-06, - "loss": 0.4336, - "step": 5430 - }, - { - "epoch": 4.71, - "learning_rate": 3.6548951048951046e-06, - "loss": 0.4126, - "step": 5440 - }, - { - "epoch": 4.72, - "learning_rate": 3.654195804195804e-06, - "loss": 0.4083, - "step": 5450 - }, - { - "epoch": 4.73, - "learning_rate": 3.6534965034965036e-06, - "loss": 0.444, - "step": 5460 - }, - { - "epoch": 4.74, - "learning_rate": 3.6527972027972026e-06, - "loss": 0.4407, - "step": 5470 - }, - { - "epoch": 4.75, - "learning_rate": 3.6520979020979017e-06, - "loss": 0.4018, - "step": 5480 - }, - { - "epoch": 4.76, - "learning_rate": 3.651398601398601e-06, - "loss": 0.4195, - "step": 5490 - }, - { - "epoch": 4.77, - "learning_rate": 3.6506993006993003e-06, - "loss": 0.4083, - "step": 5500 - }, - { - "epoch": 4.77, - "learning_rate": 3.6499999999999998e-06, - "loss": 0.4352, - "step": 5510 - }, - { - "epoch": 4.78, - "learning_rate": 3.6493006993006993e-06, - "loss": 0.451, - "step": 5520 - }, - { - "epoch": 4.79, - "learning_rate": 3.6486013986013988e-06, - "loss": 0.3954, - "step": 5530 - }, - { - "epoch": 4.8, - "learning_rate": 3.6479020979020974e-06, - "loss": 0.4088, - "step": 5540 - }, - { - "epoch": 4.81, - "learning_rate": 3.647202797202797e-06, - "loss": 0.3787, - "step": 5550 - }, - { - "epoch": 4.82, - "learning_rate": 3.6465034965034964e-06, - "loss": 0.4491, - "step": 5560 - }, - { - "epoch": 4.83, - "learning_rate": 3.645804195804196e-06, - "loss": 0.476, - "step": 5570 - }, - { - "epoch": 4.83, - "learning_rate": 3.645104895104895e-06, - "loss": 0.4762, - "step": 5580 - }, - { - "epoch": 4.84, - "learning_rate": 3.644405594405594e-06, - "loss": 0.3717, - "step": 5590 - }, - { - "epoch": 4.85, - "learning_rate": 3.6437062937062936e-06, - "loss": 0.447, - "step": 5600 - }, - { - "epoch": 4.86, - "learning_rate": 3.6430069930069926e-06, - "loss": 0.427, - "step": 5610 - }, - { - "epoch": 4.87, - "learning_rate": 3.642307692307692e-06, - "loss": 0.4573, - "step": 5620 - }, - { - "epoch": 4.88, - "learning_rate": 3.6416083916083916e-06, - "loss": 0.4257, - "step": 5630 - }, - { - "epoch": 4.89, - "learning_rate": 3.640909090909091e-06, - "loss": 0.4192, - "step": 5640 - }, - { - "epoch": 4.9, - "learning_rate": 3.6402097902097898e-06, - "loss": 0.4273, - "step": 5650 - }, - { - "epoch": 4.9, - "learning_rate": 3.6395104895104893e-06, - "loss": 0.4011, - "step": 5660 - }, - { - "epoch": 4.91, - "learning_rate": 3.6388111888111888e-06, - "loss": 0.4335, - "step": 5670 - }, - { - "epoch": 4.92, - "learning_rate": 3.638111888111888e-06, - "loss": 0.4133, - "step": 5680 - }, - { - "epoch": 4.93, - "learning_rate": 3.6374125874125873e-06, - "loss": 0.4318, - "step": 5690 - }, - { - "epoch": 4.94, - "learning_rate": 3.6367132867132864e-06, - "loss": 0.4009, - "step": 5700 - }, - { - "epoch": 4.95, - "learning_rate": 3.636013986013986e-06, - "loss": 0.37, - "step": 5710 - }, - { - "epoch": 4.96, - "learning_rate": 3.635314685314685e-06, - "loss": 0.5268, - "step": 5720 - }, - { - "epoch": 4.96, - "learning_rate": 3.6346153846153845e-06, - "loss": 0.3504, - "step": 5730 - }, - { - "epoch": 4.97, - "learning_rate": 3.633916083916084e-06, - "loss": 0.4493, - "step": 5740 - }, - { - "epoch": 4.98, - "learning_rate": 3.6332167832167835e-06, - "loss": 0.4104, - "step": 5750 - }, - { - "epoch": 4.99, - "learning_rate": 3.632517482517482e-06, - "loss": 0.4701, - "step": 5760 - }, - { - "epoch": 5.0, - "learning_rate": 3.6318181818181816e-06, - "loss": 0.4179, - "step": 5770 - }, - { - "epoch": 5.0, - "eval_loss": 0.5541394352912903, - "eval_runtime": 132.2755, - "eval_samples_per_second": 4.022, - "eval_steps_per_second": 2.011, - "eval_wer": 0.2696535321720126, - "step": 5770 - }, - { - "epoch": 5.01, - "learning_rate": 3.631118881118881e-06, - "loss": 0.4515, - "step": 5780 - }, - { - "epoch": 5.02, - "learning_rate": 3.63041958041958e-06, - "loss": 0.3908, - "step": 5790 - }, - { - "epoch": 5.03, - "learning_rate": 3.6297202797202797e-06, - "loss": 0.3718, - "step": 5800 - }, - { - "epoch": 5.03, - "learning_rate": 3.6290209790209788e-06, - "loss": 0.4033, - "step": 5810 - }, - { - "epoch": 5.04, - "learning_rate": 3.6283216783216783e-06, - "loss": 0.4639, - "step": 5820 - }, - { - "epoch": 5.05, - "learning_rate": 3.6276223776223773e-06, - "loss": 0.4132, - "step": 5830 - }, - { - "epoch": 5.06, - "learning_rate": 3.626923076923077e-06, - "loss": 0.3738, - "step": 5840 - }, - { - "epoch": 5.07, - "learning_rate": 3.6262237762237763e-06, - "loss": 0.3811, - "step": 5850 - }, - { - "epoch": 5.08, - "learning_rate": 3.625524475524475e-06, - "loss": 0.3906, - "step": 5860 - }, - { - "epoch": 5.09, - "learning_rate": 3.6248251748251745e-06, - "loss": 0.456, - "step": 5870 - }, - { - "epoch": 5.1, - "learning_rate": 3.624125874125874e-06, - "loss": 0.4335, - "step": 5880 - }, - { - "epoch": 5.1, - "learning_rate": 3.6234265734265735e-06, - "loss": 0.4065, - "step": 5890 - }, - { - "epoch": 5.11, - "learning_rate": 3.6227272727272725e-06, - "loss": 0.3946, - "step": 5900 - }, - { - "epoch": 5.12, - "learning_rate": 3.622027972027972e-06, - "loss": 0.4255, - "step": 5910 - }, - { - "epoch": 5.13, - "learning_rate": 3.621328671328671e-06, - "loss": 0.5383, - "step": 5920 - }, - { - "epoch": 5.14, - "learning_rate": 3.6206293706293706e-06, - "loss": 0.4545, - "step": 5930 - }, - { - "epoch": 5.15, - "learning_rate": 3.6199300699300697e-06, - "loss": 0.4416, - "step": 5940 - }, - { - "epoch": 5.16, - "learning_rate": 3.619230769230769e-06, - "loss": 0.3873, - "step": 5950 - }, - { - "epoch": 5.16, - "learning_rate": 3.6185314685314687e-06, - "loss": 0.4583, - "step": 5960 - }, - { - "epoch": 5.17, - "learning_rate": 3.6178321678321673e-06, - "loss": 0.4221, - "step": 5970 - }, - { - "epoch": 5.18, - "learning_rate": 3.617132867132867e-06, - "loss": 0.3759, - "step": 5980 - }, - { - "epoch": 5.19, - "learning_rate": 3.6164335664335663e-06, - "loss": 0.3778, - "step": 5990 - }, - { - "epoch": 5.2, - "learning_rate": 3.615734265734266e-06, - "loss": 0.3657, - "step": 6000 - }, - { - "epoch": 5.21, - "learning_rate": 3.615034965034965e-06, - "loss": 0.4768, - "step": 6010 - }, - { - "epoch": 5.22, - "learning_rate": 3.614335664335664e-06, - "loss": 0.4704, - "step": 6020 - }, - { - "epoch": 5.23, - "learning_rate": 3.6136363636363635e-06, - "loss": 0.4471, - "step": 6030 - }, - { - "epoch": 5.23, - "learning_rate": 3.6129370629370625e-06, - "loss": 0.4016, - "step": 6040 - }, - { - "epoch": 5.24, - "learning_rate": 3.612237762237762e-06, - "loss": 0.3933, - "step": 6050 - }, - { - "epoch": 5.25, - "learning_rate": 3.6115384615384615e-06, - "loss": 0.4244, - "step": 6060 - }, - { - "epoch": 5.26, - "learning_rate": 3.610839160839161e-06, - "loss": 0.4475, - "step": 6070 - }, - { - "epoch": 5.27, - "learning_rate": 3.6101398601398597e-06, - "loss": 0.4473, - "step": 6080 - }, - { - "epoch": 5.28, - "learning_rate": 3.609440559440559e-06, - "loss": 0.454, - "step": 6090 - }, - { - "epoch": 5.29, - "learning_rate": 3.6087412587412587e-06, - "loss": 0.4177, - "step": 6100 - }, - { - "epoch": 5.29, - "learning_rate": 3.608041958041958e-06, - "loss": 0.4084, - "step": 6110 - }, - { - "epoch": 5.3, - "learning_rate": 3.6073426573426572e-06, - "loss": 0.4163, - "step": 6120 - }, - { - "epoch": 5.31, - "learning_rate": 3.6066433566433563e-06, - "loss": 0.4717, - "step": 6130 - }, - { - "epoch": 5.32, - "learning_rate": 3.605944055944056e-06, - "loss": 0.3936, - "step": 6140 - }, - { - "epoch": 5.33, - "learning_rate": 3.605244755244755e-06, - "loss": 0.3789, - "step": 6150 - }, - { - "epoch": 5.34, - "learning_rate": 3.6045454545454544e-06, - "loss": 0.4144, - "step": 6160 - }, - { - "epoch": 5.35, - "learning_rate": 3.603846153846154e-06, - "loss": 0.3966, - "step": 6170 - }, - { - "epoch": 5.36, - "learning_rate": 3.6031468531468534e-06, - "loss": 0.4479, - "step": 6180 - }, - { - "epoch": 5.36, - "learning_rate": 3.602447552447552e-06, - "loss": 0.37, - "step": 6190 - }, - { - "epoch": 5.37, - "learning_rate": 3.6017482517482515e-06, - "loss": 0.366, - "step": 6200 - }, - { - "epoch": 5.38, - "learning_rate": 3.601048951048951e-06, - "loss": 0.443, - "step": 6210 - }, - { - "epoch": 5.39, - "learning_rate": 3.60034965034965e-06, - "loss": 0.3772, - "step": 6220 - }, - { - "epoch": 5.4, - "learning_rate": 3.5996503496503496e-06, - "loss": 0.4389, - "step": 6230 - }, - { - "epoch": 5.41, - "learning_rate": 3.5989510489510487e-06, - "loss": 0.4294, - "step": 6240 - }, - { - "epoch": 5.42, - "learning_rate": 3.598251748251748e-06, - "loss": 0.4025, - "step": 6250 - }, - { - "epoch": 5.42, - "learning_rate": 3.5975524475524472e-06, - "loss": 0.4683, - "step": 6260 - }, - { - "epoch": 5.43, - "learning_rate": 3.5968531468531467e-06, - "loss": 0.4215, - "step": 6270 - }, - { - "epoch": 5.44, - "learning_rate": 3.5961538461538462e-06, - "loss": 0.3982, - "step": 6280 - }, - { - "epoch": 5.45, - "learning_rate": 3.595454545454545e-06, - "loss": 0.3678, - "step": 6290 - }, - { - "epoch": 5.46, - "learning_rate": 3.5947552447552444e-06, - "loss": 0.3787, - "step": 6300 - }, - { - "epoch": 5.47, - "learning_rate": 3.594055944055944e-06, - "loss": 0.4167, - "step": 6310 - }, - { - "epoch": 5.48, - "learning_rate": 3.5933566433566434e-06, - "loss": 0.4013, - "step": 6320 - }, - { - "epoch": 5.49, - "learning_rate": 3.5926573426573424e-06, - "loss": 0.3849, - "step": 6330 - }, - { - "epoch": 5.49, - "learning_rate": 3.591958041958042e-06, - "loss": 0.4911, - "step": 6340 - }, - { - "epoch": 5.5, - "learning_rate": 3.591258741258741e-06, - "loss": 0.3917, - "step": 6350 - }, - { - "epoch": 5.51, - "learning_rate": 3.5905594405594405e-06, - "loss": 0.4331, - "step": 6360 - }, - { - "epoch": 5.52, - "learning_rate": 3.5898601398601396e-06, - "loss": 0.4441, - "step": 6370 - }, - { - "epoch": 5.53, - "learning_rate": 3.589160839160839e-06, - "loss": 0.404, - "step": 6380 - }, - { - "epoch": 5.54, - "learning_rate": 3.5884615384615386e-06, - "loss": 0.3654, - "step": 6390 - }, - { - "epoch": 5.55, - "learning_rate": 3.5877622377622372e-06, - "loss": 0.3759, - "step": 6400 - }, - { - "epoch": 5.55, - "learning_rate": 3.5870629370629367e-06, - "loss": 0.3972, - "step": 6410 - }, - { - "epoch": 5.56, - "learning_rate": 3.5863636363636362e-06, - "loss": 0.4738, - "step": 6420 - }, - { - "epoch": 5.57, - "learning_rate": 3.5856643356643357e-06, - "loss": 0.3825, - "step": 6430 - }, - { - "epoch": 5.58, - "learning_rate": 3.5849650349650348e-06, - "loss": 0.4313, - "step": 6440 - }, - { - "epoch": 5.59, - "learning_rate": 3.5842657342657343e-06, - "loss": 0.4117, - "step": 6450 - }, - { - "epoch": 5.6, - "learning_rate": 3.5835664335664334e-06, - "loss": 0.4463, - "step": 6460 - }, - { - "epoch": 5.61, - "learning_rate": 3.5828671328671324e-06, - "loss": 0.4928, - "step": 6470 - }, - { - "epoch": 5.61, - "learning_rate": 3.582167832167832e-06, - "loss": 0.3977, - "step": 6480 - }, - { - "epoch": 5.62, - "learning_rate": 3.5814685314685314e-06, - "loss": 0.43, - "step": 6490 - }, - { - "epoch": 5.63, - "learning_rate": 3.580769230769231e-06, - "loss": 0.3967, - "step": 6500 - }, - { - "epoch": 5.64, - "learning_rate": 3.5800699300699296e-06, - "loss": 0.4091, - "step": 6510 - }, - { - "epoch": 5.65, - "learning_rate": 3.579370629370629e-06, - "loss": 0.4269, - "step": 6520 - }, - { - "epoch": 5.66, - "learning_rate": 3.5786713286713286e-06, - "loss": 0.4157, - "step": 6530 - }, - { - "epoch": 5.67, - "learning_rate": 3.577972027972028e-06, - "loss": 0.4275, - "step": 6540 - }, - { - "epoch": 5.68, - "learning_rate": 3.577272727272727e-06, - "loss": 0.4638, - "step": 6550 - }, - { - "epoch": 5.68, - "learning_rate": 3.5765734265734266e-06, - "loss": 0.4441, - "step": 6560 - }, - { - "epoch": 5.69, - "learning_rate": 3.5758741258741257e-06, - "loss": 0.4582, - "step": 6570 - }, - { - "epoch": 5.7, - "learning_rate": 3.5751748251748248e-06, - "loss": 0.4679, - "step": 6580 - }, - { - "epoch": 5.71, - "learning_rate": 3.5744755244755243e-06, - "loss": 0.4212, - "step": 6590 - }, - { - "epoch": 5.72, - "learning_rate": 3.5737762237762238e-06, - "loss": 0.4247, - "step": 6600 - }, - { - "epoch": 5.73, - "learning_rate": 3.5730769230769233e-06, - "loss": 0.4173, - "step": 6610 - }, - { - "epoch": 5.74, - "learning_rate": 3.572377622377622e-06, - "loss": 0.4359, - "step": 6620 - }, - { - "epoch": 5.74, - "learning_rate": 3.5716783216783214e-06, - "loss": 0.4385, - "step": 6630 - }, - { - "epoch": 5.75, - "learning_rate": 3.570979020979021e-06, - "loss": 0.4632, - "step": 6640 - }, - { - "epoch": 5.76, - "learning_rate": 3.57027972027972e-06, - "loss": 0.4045, - "step": 6650 - }, - { - "epoch": 5.77, - "learning_rate": 3.5695804195804195e-06, - "loss": 0.4145, - "step": 6660 - }, - { - "epoch": 5.78, - "learning_rate": 3.5688811188811186e-06, - "loss": 0.393, - "step": 6670 - }, - { - "epoch": 5.79, - "learning_rate": 3.568181818181818e-06, - "loss": 0.4025, - "step": 6680 - }, - { - "epoch": 5.8, - "learning_rate": 3.567482517482517e-06, - "loss": 0.378, - "step": 6690 - }, - { - "epoch": 5.81, - "learning_rate": 3.5667832167832166e-06, - "loss": 0.4254, - "step": 6700 - }, - { - "epoch": 5.81, - "learning_rate": 3.566083916083916e-06, - "loss": 0.4688, - "step": 6710 - }, - { - "epoch": 5.82, - "learning_rate": 3.5653846153846156e-06, - "loss": 0.4761, - "step": 6720 - }, - { - "epoch": 5.83, - "learning_rate": 3.5646853146853143e-06, - "loss": 0.4667, - "step": 6730 - }, - { - "epoch": 5.84, - "learning_rate": 3.5639860139860138e-06, - "loss": 0.5203, - "step": 6740 - }, - { - "epoch": 5.85, - "learning_rate": 3.5632867132867133e-06, - "loss": 0.4006, - "step": 6750 - }, - { - "epoch": 5.86, - "learning_rate": 3.5625874125874123e-06, - "loss": 0.4119, - "step": 6760 - }, - { - "epoch": 5.87, - "learning_rate": 3.561888111888112e-06, - "loss": 0.4235, - "step": 6770 - }, - { - "epoch": 5.87, - "learning_rate": 3.561188811188811e-06, - "loss": 0.3927, - "step": 6780 - }, - { - "epoch": 5.88, - "learning_rate": 3.5604895104895104e-06, - "loss": 0.4529, - "step": 6790 - }, - { - "epoch": 5.89, - "learning_rate": 3.5597902097902095e-06, - "loss": 0.4006, - "step": 6800 - }, - { - "epoch": 5.9, - "learning_rate": 3.559090909090909e-06, - "loss": 0.4497, - "step": 6810 - }, - { - "epoch": 5.91, - "learning_rate": 3.5583916083916085e-06, - "loss": 0.4493, - "step": 6820 - }, - { - "epoch": 5.92, - "learning_rate": 3.557692307692307e-06, - "loss": 0.3804, - "step": 6830 - }, - { - "epoch": 5.93, - "learning_rate": 3.5569930069930066e-06, - "loss": 0.3847, - "step": 6840 - }, - { - "epoch": 5.94, - "learning_rate": 3.556293706293706e-06, - "loss": 0.4154, - "step": 6850 - }, - { - "epoch": 5.94, - "learning_rate": 3.5555944055944056e-06, - "loss": 0.3667, - "step": 6860 - }, - { - "epoch": 5.95, - "learning_rate": 3.5548951048951047e-06, - "loss": 0.4174, - "step": 6870 - }, - { - "epoch": 5.96, - "learning_rate": 3.554195804195804e-06, - "loss": 0.424, - "step": 6880 - }, - { - "epoch": 5.97, - "learning_rate": 3.5534965034965033e-06, - "loss": 0.4112, - "step": 6890 - }, - { - "epoch": 5.98, - "learning_rate": 3.5528671328671327e-06, - "loss": 0.4325, - "step": 6900 - }, - { - "epoch": 5.99, - "learning_rate": 3.5521678321678322e-06, - "loss": 0.4382, - "step": 6910 - }, - { - "epoch": 6.0, - "learning_rate": 3.5514685314685313e-06, - "loss": 0.4376, - "step": 6920 - }, - { - "epoch": 6.0, - "eval_loss": 0.5798775553703308, - "eval_runtime": 131.9415, - "eval_samples_per_second": 4.032, - "eval_steps_per_second": 2.016, - "eval_wer": 0.26913929420839494, - "step": 6924 - }, - { - "epoch": 6.01, - "learning_rate": 3.5507692307692304e-06, - "loss": 0.4753, - "step": 6930 - }, - { - "epoch": 6.01, - "learning_rate": 3.55006993006993e-06, - "loss": 0.4354, - "step": 6940 - }, - { - "epoch": 6.02, - "learning_rate": 3.5493706293706294e-06, - "loss": 0.4241, - "step": 6950 - }, - { - "epoch": 6.03, - "learning_rate": 3.5486713286713284e-06, - "loss": 0.4086, - "step": 6960 - }, - { - "epoch": 6.04, - "learning_rate": 3.547972027972028e-06, - "loss": 0.4, - "step": 6970 - }, - { - "epoch": 6.05, - "learning_rate": 3.547272727272727e-06, - "loss": 0.4019, - "step": 6980 - }, - { - "epoch": 6.06, - "learning_rate": 3.5465734265734265e-06, - "loss": 0.457, - "step": 6990 - }, - { - "epoch": 6.07, - "learning_rate": 3.5458741258741256e-06, - "loss": 0.3821, - "step": 7000 - }, - { - "epoch": 6.07, - "learning_rate": 3.545174825174825e-06, - "loss": 0.4102, - "step": 7010 - }, - { - "epoch": 6.08, - "learning_rate": 3.5444755244755246e-06, - "loss": 0.4352, - "step": 7020 - }, - { - "epoch": 6.09, - "learning_rate": 3.5437762237762236e-06, - "loss": 0.3816, - "step": 7030 - }, - { - "epoch": 6.1, - "learning_rate": 3.5430769230769227e-06, - "loss": 0.4442, - "step": 7040 - }, - { - "epoch": 6.11, - "learning_rate": 3.542377622377622e-06, - "loss": 0.4007, - "step": 7050 - }, - { - "epoch": 6.12, - "learning_rate": 3.5416783216783217e-06, - "loss": 0.4247, - "step": 7060 - }, - { - "epoch": 6.13, - "learning_rate": 3.5409790209790208e-06, - "loss": 0.4067, - "step": 7070 - }, - { - "epoch": 6.14, - "learning_rate": 3.5403496503496502e-06, - "loss": 0.3995, - "step": 7080 - }, - { - "epoch": 6.14, - "learning_rate": 3.5396503496503493e-06, - "loss": 0.4824, - "step": 7090 - }, - { - "epoch": 6.15, - "learning_rate": 3.538951048951049e-06, - "loss": 0.3947, - "step": 7100 - }, - { - "epoch": 6.16, - "learning_rate": 3.5382517482517483e-06, - "loss": 0.3508, - "step": 7110 - }, - { - "epoch": 6.17, - "learning_rate": 3.5375524475524474e-06, - "loss": 0.4147, - "step": 7120 - }, - { - "epoch": 6.18, - "learning_rate": 3.5368531468531465e-06, - "loss": 0.3916, - "step": 7130 - }, - { - "epoch": 6.19, - "learning_rate": 3.536153846153846e-06, - "loss": 0.4855, - "step": 7140 - }, - { - "epoch": 6.2, - "learning_rate": 3.5354545454545454e-06, - "loss": 0.3445, - "step": 7150 - }, - { - "epoch": 6.2, - "learning_rate": 3.5347552447552445e-06, - "loss": 0.4443, - "step": 7160 - }, - { - "epoch": 6.21, - "learning_rate": 3.534055944055944e-06, - "loss": 0.4426, - "step": 7170 - }, - { - "epoch": 6.22, - "learning_rate": 3.533356643356643e-06, - "loss": 0.4079, - "step": 7180 - }, - { - "epoch": 6.23, - "learning_rate": 3.532657342657342e-06, - "loss": 0.3727, - "step": 7190 - }, - { - "epoch": 6.24, - "learning_rate": 3.5319580419580417e-06, - "loss": 0.362, - "step": 7200 - }, - { - "epoch": 6.25, - "learning_rate": 3.531258741258741e-06, - "loss": 0.424, - "step": 7210 - }, - { - "epoch": 6.26, - "learning_rate": 3.5305594405594407e-06, - "loss": 0.4108, - "step": 7220 - }, - { - "epoch": 6.27, - "learning_rate": 3.5298601398601397e-06, - "loss": 0.4526, - "step": 7230 - }, - { - "epoch": 6.27, - "learning_rate": 3.529160839160839e-06, - "loss": 0.417, - "step": 7240 - }, - { - "epoch": 6.28, - "learning_rate": 3.5284615384615383e-06, - "loss": 0.4048, - "step": 7250 - }, - { - "epoch": 6.29, - "learning_rate": 3.527762237762238e-06, - "loss": 0.421, - "step": 7260 - }, - { - "epoch": 6.3, - "learning_rate": 3.527062937062937e-06, - "loss": 0.4592, - "step": 7270 - }, - { - "epoch": 6.31, - "learning_rate": 3.5263636363636364e-06, - "loss": 0.4749, - "step": 7280 - }, - { - "epoch": 6.32, - "learning_rate": 3.5256643356643354e-06, - "loss": 0.426, - "step": 7290 - }, - { - "epoch": 6.33, - "learning_rate": 3.5249650349650345e-06, - "loss": 0.3914, - "step": 7300 - }, - { - "epoch": 6.33, - "learning_rate": 3.524265734265734e-06, - "loss": 0.4809, - "step": 7310 - }, - { - "epoch": 6.34, - "learning_rate": 3.5235664335664335e-06, - "loss": 0.4657, - "step": 7320 - }, - { - "epoch": 6.35, - "learning_rate": 3.522867132867133e-06, - "loss": 0.37, - "step": 7330 - }, - { - "epoch": 6.36, - "learning_rate": 3.5221678321678317e-06, - "loss": 0.4217, - "step": 7340 - }, - { - "epoch": 6.37, - "learning_rate": 3.521468531468531e-06, - "loss": 0.4398, - "step": 7350 - }, - { - "epoch": 6.38, - "learning_rate": 3.5207692307692306e-06, - "loss": 0.462, - "step": 7360 - }, - { - "epoch": 6.39, - "learning_rate": 3.5200699300699297e-06, - "loss": 0.3877, - "step": 7370 - }, - { - "epoch": 6.39, - "learning_rate": 3.5193706293706292e-06, - "loss": 0.4435, - "step": 7380 - }, - { - "epoch": 6.4, - "learning_rate": 3.5186713286713287e-06, - "loss": 0.411, - "step": 7390 - }, - { - "epoch": 6.41, - "learning_rate": 3.517972027972028e-06, - "loss": 0.4068, - "step": 7400 - }, - { - "epoch": 6.42, - "learning_rate": 3.517272727272727e-06, - "loss": 0.4755, - "step": 7410 - }, - { - "epoch": 6.43, - "learning_rate": 3.5165734265734264e-06, - "loss": 0.386, - "step": 7420 - }, - { - "epoch": 6.44, - "learning_rate": 3.515874125874126e-06, - "loss": 0.3746, - "step": 7430 - }, - { - "epoch": 6.45, - "learning_rate": 3.5151748251748254e-06, - "loss": 0.3711, - "step": 7440 - }, - { - "epoch": 6.46, - "learning_rate": 3.514475524475524e-06, - "loss": 0.4024, - "step": 7450 - }, - { - "epoch": 6.46, - "learning_rate": 3.5137762237762235e-06, - "loss": 0.4098, - "step": 7460 - }, - { - "epoch": 6.47, - "learning_rate": 3.513076923076923e-06, - "loss": 0.3528, - "step": 7470 - }, - { - "epoch": 6.48, - "learning_rate": 3.512377622377622e-06, - "loss": 0.5305, - "step": 7480 - }, - { - "epoch": 6.49, - "learning_rate": 3.5116783216783216e-06, - "loss": 0.4691, - "step": 7490 - }, - { - "epoch": 6.5, - "learning_rate": 3.510979020979021e-06, - "loss": 0.4021, - "step": 7500 - }, - { - "epoch": 6.51, - "learning_rate": 3.51027972027972e-06, - "loss": 0.4125, - "step": 7510 - }, - { - "epoch": 6.52, - "learning_rate": 3.509580419580419e-06, - "loss": 0.386, - "step": 7520 - }, - { - "epoch": 6.52, - "learning_rate": 3.5088811188811187e-06, - "loss": 0.4242, - "step": 7530 - }, - { - "epoch": 6.53, - "learning_rate": 3.508181818181818e-06, - "loss": 0.4123, - "step": 7540 - }, - { - "epoch": 6.54, - "learning_rate": 3.5074825174825173e-06, - "loss": 0.4487, - "step": 7550 - }, - { - "epoch": 6.55, - "learning_rate": 3.5067832167832164e-06, - "loss": 0.4478, - "step": 7560 - }, - { - "epoch": 6.56, - "learning_rate": 3.506083916083916e-06, - "loss": 0.4163, - "step": 7570 - }, - { - "epoch": 6.57, - "learning_rate": 3.5053846153846153e-06, - "loss": 0.4304, - "step": 7580 - }, - { - "epoch": 6.58, - "learning_rate": 3.5046853146853144e-06, - "loss": 0.4456, - "step": 7590 - }, - { - "epoch": 6.59, - "learning_rate": 3.503986013986014e-06, - "loss": 0.4465, - "step": 7600 - }, - { - "epoch": 6.59, - "learning_rate": 3.5032867132867134e-06, - "loss": 0.3964, - "step": 7610 - }, - { - "epoch": 6.6, - "learning_rate": 3.5025874125874125e-06, - "loss": 0.4074, - "step": 7620 - }, - { - "epoch": 6.61, - "learning_rate": 3.5018881118881116e-06, - "loss": 0.4124, - "step": 7630 - }, - { - "epoch": 6.62, - "learning_rate": 3.501188811188811e-06, - "loss": 0.4041, - "step": 7640 - }, - { - "epoch": 6.63, - "learning_rate": 3.5004895104895106e-06, - "loss": 0.402, - "step": 7650 - }, - { - "epoch": 6.64, - "learning_rate": 3.4997902097902096e-06, - "loss": 0.4579, - "step": 7660 - }, - { - "epoch": 6.65, - "learning_rate": 3.4990909090909087e-06, - "loss": 0.4575, - "step": 7670 - }, - { - "epoch": 6.65, - "learning_rate": 3.498391608391608e-06, - "loss": 0.3933, - "step": 7680 - }, - { - "epoch": 6.66, - "learning_rate": 3.4976923076923077e-06, - "loss": 0.3882, - "step": 7690 - }, - { - "epoch": 6.67, - "learning_rate": 3.4969930069930068e-06, - "loss": 0.3905, - "step": 7700 - }, - { - "epoch": 6.68, - "learning_rate": 3.4962937062937063e-06, - "loss": 0.4503, - "step": 7710 - }, - { - "epoch": 6.69, - "learning_rate": 3.4955944055944053e-06, - "loss": 0.411, - "step": 7720 - }, - { - "epoch": 6.7, - "learning_rate": 3.4948951048951044e-06, - "loss": 0.4377, - "step": 7730 - }, - { - "epoch": 6.71, - "learning_rate": 3.494195804195804e-06, - "loss": 0.4029, - "step": 7740 - }, - { - "epoch": 6.72, - "learning_rate": 3.4934965034965034e-06, - "loss": 0.4286, - "step": 7750 - }, - { - "epoch": 6.72, - "learning_rate": 3.492797202797203e-06, - "loss": 0.4271, - "step": 7760 - }, - { - "epoch": 6.73, - "learning_rate": 3.492097902097902e-06, - "loss": 0.411, - "step": 7770 - }, - { - "epoch": 6.74, - "learning_rate": 3.491398601398601e-06, - "loss": 0.4059, - "step": 7780 - }, - { - "epoch": 6.75, - "learning_rate": 3.4906993006993005e-06, - "loss": 0.3642, - "step": 7790 - }, - { - "epoch": 6.76, - "learning_rate": 3.49e-06, - "loss": 0.3648, - "step": 7800 - }, - { - "epoch": 6.77, - "learning_rate": 3.489300699300699e-06, - "loss": 0.4237, - "step": 7810 - }, - { - "epoch": 6.78, - "learning_rate": 3.4886013986013986e-06, - "loss": 0.4553, - "step": 7820 - }, - { - "epoch": 6.78, - "learning_rate": 3.4879020979020977e-06, - "loss": 0.4313, - "step": 7830 - }, - { - "epoch": 6.79, - "learning_rate": 3.4872027972027968e-06, - "loss": 0.3817, - "step": 7840 - }, - { - "epoch": 6.8, - "learning_rate": 3.4865034965034963e-06, - "loss": 0.4534, - "step": 7850 - }, - { - "epoch": 6.81, - "learning_rate": 3.4858041958041958e-06, - "loss": 0.4108, - "step": 7860 - }, - { - "epoch": 6.82, - "learning_rate": 3.4851048951048953e-06, - "loss": 0.4737, - "step": 7870 - }, - { - "epoch": 6.83, - "learning_rate": 3.4844055944055943e-06, - "loss": 0.4346, - "step": 7880 - }, - { - "epoch": 6.84, - "learning_rate": 3.4837062937062934e-06, - "loss": 0.4078, - "step": 7890 - }, - { - "epoch": 6.85, - "learning_rate": 3.483006993006993e-06, - "loss": 0.4898, - "step": 7900 - }, - { - "epoch": 6.85, - "learning_rate": 3.482307692307692e-06, - "loss": 0.4099, - "step": 7910 - }, - { - "epoch": 6.86, - "learning_rate": 3.4816083916083915e-06, - "loss": 0.4807, - "step": 7920 - }, - { - "epoch": 6.87, - "learning_rate": 3.480909090909091e-06, - "loss": 0.3721, - "step": 7930 - }, - { - "epoch": 6.88, - "learning_rate": 3.48020979020979e-06, - "loss": 0.4563, - "step": 7940 - }, - { - "epoch": 6.89, - "learning_rate": 3.479510489510489e-06, - "loss": 0.3941, - "step": 7950 - }, - { - "epoch": 6.9, - "learning_rate": 3.4788111888111886e-06, - "loss": 0.3597, - "step": 7960 - }, - { - "epoch": 6.91, - "learning_rate": 3.478111888111888e-06, - "loss": 0.4191, - "step": 7970 - }, - { - "epoch": 6.91, - "learning_rate": 3.4774125874125876e-06, - "loss": 0.4304, - "step": 7980 - }, - { - "epoch": 6.92, - "learning_rate": 3.4767132867132862e-06, - "loss": 0.371, - "step": 7990 - }, - { - "epoch": 6.93, - "learning_rate": 3.4760139860139857e-06, - "loss": 0.4132, - "step": 8000 - }, - { - "epoch": 6.94, - "learning_rate": 3.4753146853146852e-06, - "loss": 0.3688, - "step": 8010 - }, - { - "epoch": 6.95, - "learning_rate": 3.4746153846153843e-06, - "loss": 0.4284, - "step": 8020 - }, - { - "epoch": 6.96, - "learning_rate": 3.473916083916084e-06, - "loss": 0.4216, - "step": 8030 - }, - { - "epoch": 6.97, - "learning_rate": 3.4732167832167833e-06, - "loss": 0.4085, - "step": 8040 - }, - { - "epoch": 6.98, - "learning_rate": 3.4725174825174824e-06, - "loss": 0.3671, - "step": 8050 - }, - { - "epoch": 6.98, - "learning_rate": 3.4718181818181815e-06, - "loss": 0.4413, - "step": 8060 - }, - { - "epoch": 6.99, - "learning_rate": 3.471118881118881e-06, - "loss": 0.4341, - "step": 8070 - }, - { - "epoch": 7.0, - "eval_loss": 0.5593249201774597, - "eval_runtime": 132.6281, - "eval_samples_per_second": 4.011, - "eval_steps_per_second": 2.006, - "eval_wer": 0.2648968310085492, - "step": 8078 - }, - { - "epoch": 7.0, - "learning_rate": 3.4704195804195805e-06, - "loss": 0.3919, - "step": 8080 - }, - { - "epoch": 7.01, - "learning_rate": 3.4697202797202795e-06, - "loss": 0.4472, - "step": 8090 - }, - { - "epoch": 7.02, - "learning_rate": 3.4690209790209786e-06, - "loss": 0.4076, - "step": 8100 - }, - { - "epoch": 7.03, - "learning_rate": 3.468321678321678e-06, - "loss": 0.4004, - "step": 8110 - }, - { - "epoch": 7.04, - "learning_rate": 3.4676223776223776e-06, - "loss": 0.4262, - "step": 8120 - }, - { - "epoch": 7.05, - "learning_rate": 3.4669230769230767e-06, - "loss": 0.3604, - "step": 8130 - }, - { - "epoch": 7.05, - "learning_rate": 3.466223776223776e-06, - "loss": 0.4613, - "step": 8140 - }, - { - "epoch": 7.06, - "learning_rate": 3.4655244755244757e-06, - "loss": 0.4261, - "step": 8150 - }, - { - "epoch": 7.07, - "learning_rate": 3.4648251748251747e-06, - "loss": 0.4473, - "step": 8160 - }, - { - "epoch": 7.08, - "learning_rate": 3.464125874125874e-06, - "loss": 0.3835, - "step": 8170 - }, - { - "epoch": 7.09, - "learning_rate": 3.4634265734265733e-06, - "loss": 0.4308, - "step": 8180 - }, - { - "epoch": 7.1, - "learning_rate": 3.462727272727273e-06, - "loss": 0.43, - "step": 8190 - }, - { - "epoch": 7.11, - "learning_rate": 3.462027972027972e-06, - "loss": 0.3746, - "step": 8200 - }, - { - "epoch": 7.11, - "learning_rate": 3.461328671328671e-06, - "loss": 0.3715, - "step": 8210 - }, - { - "epoch": 7.12, - "learning_rate": 3.4606293706293704e-06, - "loss": 0.4403, - "step": 8220 - }, - { - "epoch": 7.13, - "learning_rate": 3.45993006993007e-06, - "loss": 0.4333, - "step": 8230 - }, - { - "epoch": 7.14, - "learning_rate": 3.459230769230769e-06, - "loss": 0.3821, - "step": 8240 - }, - { - "epoch": 7.15, - "learning_rate": 3.4585314685314685e-06, - "loss": 0.399, - "step": 8250 - }, - { - "epoch": 7.16, - "learning_rate": 3.457832167832168e-06, - "loss": 0.3684, - "step": 8260 - }, - { - "epoch": 7.17, - "learning_rate": 3.4571328671328667e-06, - "loss": 0.4255, - "step": 8270 - }, - { - "epoch": 7.17, - "learning_rate": 3.456433566433566e-06, - "loss": 0.4221, - "step": 8280 - }, - { - "epoch": 7.18, - "learning_rate": 3.4557342657342657e-06, - "loss": 0.4537, - "step": 8290 - }, - { - "epoch": 7.19, - "learning_rate": 3.455034965034965e-06, - "loss": 0.4006, - "step": 8300 - }, - { - "epoch": 7.2, - "learning_rate": 3.4543356643356642e-06, - "loss": 0.4107, - "step": 8310 - }, - { - "epoch": 7.21, - "learning_rate": 3.4536363636363633e-06, - "loss": 0.466, - "step": 8320 - }, - { - "epoch": 7.22, - "learning_rate": 3.452937062937063e-06, - "loss": 0.4655, - "step": 8330 - }, - { - "epoch": 7.23, - "learning_rate": 3.452237762237762e-06, - "loss": 0.4353, - "step": 8340 - }, - { - "epoch": 7.24, - "learning_rate": 3.4515384615384614e-06, - "loss": 0.3783, - "step": 8350 - }, - { - "epoch": 7.24, - "learning_rate": 3.450839160839161e-06, - "loss": 0.3839, - "step": 8360 - }, - { - "epoch": 7.25, - "learning_rate": 3.45013986013986e-06, - "loss": 0.4209, - "step": 8370 - }, - { - "epoch": 7.26, - "learning_rate": 3.449440559440559e-06, - "loss": 0.3719, - "step": 8380 - }, - { - "epoch": 7.27, - "learning_rate": 3.4487412587412585e-06, - "loss": 0.4884, - "step": 8390 - }, - { - "epoch": 7.28, - "learning_rate": 3.448041958041958e-06, - "loss": 0.4634, - "step": 8400 - }, - { - "epoch": 7.29, - "learning_rate": 3.4473426573426575e-06, - "loss": 0.3454, - "step": 8410 - }, - { - "epoch": 7.3, - "learning_rate": 3.4466433566433566e-06, - "loss": 0.3983, - "step": 8420 - }, - { - "epoch": 7.3, - "learning_rate": 3.4459440559440556e-06, - "loss": 0.3874, - "step": 8430 - }, - { - "epoch": 7.31, - "learning_rate": 3.445244755244755e-06, - "loss": 0.396, - "step": 8440 - }, - { - "epoch": 7.32, - "learning_rate": 3.4445454545454542e-06, - "loss": 0.4124, - "step": 8450 - }, - { - "epoch": 7.33, - "learning_rate": 3.4438461538461537e-06, - "loss": 0.3665, - "step": 8460 - }, - { - "epoch": 7.34, - "learning_rate": 3.443146853146853e-06, - "loss": 0.3893, - "step": 8470 - }, - { - "epoch": 7.35, - "learning_rate": 3.4424475524475523e-06, - "loss": 0.5006, - "step": 8480 - }, - { - "epoch": 7.36, - "learning_rate": 3.4417482517482514e-06, - "loss": 0.3679, - "step": 8490 - }, - { - "epoch": 7.37, - "learning_rate": 3.441048951048951e-06, - "loss": 0.3859, - "step": 8500 - }, - { - "epoch": 7.37, - "learning_rate": 3.4403496503496503e-06, - "loss": 0.3818, - "step": 8510 - }, - { - "epoch": 7.38, - "learning_rate": 3.4396503496503494e-06, - "loss": 0.3795, - "step": 8520 - }, - { - "epoch": 7.39, - "learning_rate": 3.4389510489510485e-06, - "loss": 0.4211, - "step": 8530 - }, - { - "epoch": 7.4, - "learning_rate": 3.438251748251748e-06, - "loss": 0.4148, - "step": 8540 - }, - { - "epoch": 7.41, - "learning_rate": 3.4375524475524475e-06, - "loss": 0.412, - "step": 8550 - }, - { - "epoch": 7.42, - "learning_rate": 3.4368531468531466e-06, - "loss": 0.4597, - "step": 8560 - }, - { - "epoch": 7.43, - "learning_rate": 3.436153846153846e-06, - "loss": 0.3923, - "step": 8570 - }, - { - "epoch": 7.43, - "learning_rate": 3.4354545454545456e-06, - "loss": 0.4104, - "step": 8580 - }, - { - "epoch": 7.44, - "learning_rate": 3.4347552447552446e-06, - "loss": 0.4049, - "step": 8590 - }, - { - "epoch": 7.45, - "learning_rate": 3.4340559440559437e-06, - "loss": 0.436, - "step": 8600 - }, - { - "epoch": 7.46, - "learning_rate": 3.433356643356643e-06, - "loss": 0.3974, - "step": 8610 - }, - { - "epoch": 7.47, - "learning_rate": 3.4326573426573427e-06, - "loss": 0.4191, - "step": 8620 - }, - { - "epoch": 7.48, - "learning_rate": 3.4319580419580418e-06, - "loss": 0.5061, - "step": 8630 - }, - { - "epoch": 7.49, - "learning_rate": 3.431258741258741e-06, - "loss": 0.4298, - "step": 8640 - }, - { - "epoch": 7.5, - "learning_rate": 3.4305594405594403e-06, - "loss": 0.3958, - "step": 8650 - }, - { - "epoch": 7.5, - "learning_rate": 3.42986013986014e-06, - "loss": 0.4406, - "step": 8660 - }, - { - "epoch": 7.51, - "learning_rate": 3.429160839160839e-06, - "loss": 0.3959, - "step": 8670 - }, - { - "epoch": 7.52, - "learning_rate": 3.4284615384615384e-06, - "loss": 0.4711, - "step": 8680 - }, - { - "epoch": 7.53, - "learning_rate": 3.427762237762238e-06, - "loss": 0.4468, - "step": 8690 - }, - { - "epoch": 7.54, - "learning_rate": 3.4270629370629366e-06, - "loss": 0.3709, - "step": 8700 - }, - { - "epoch": 7.55, - "learning_rate": 3.426363636363636e-06, - "loss": 0.3925, - "step": 8710 - }, - { - "epoch": 7.56, - "learning_rate": 3.4256643356643356e-06, - "loss": 0.4129, - "step": 8720 - }, - { - "epoch": 7.56, - "learning_rate": 3.424965034965035e-06, - "loss": 0.3852, - "step": 8730 - }, - { - "epoch": 7.57, - "learning_rate": 3.424265734265734e-06, - "loss": 0.4379, - "step": 8740 - }, - { - "epoch": 7.58, - "learning_rate": 3.423566433566433e-06, - "loss": 0.4254, - "step": 8750 - }, - { - "epoch": 7.59, - "learning_rate": 3.4228671328671327e-06, - "loss": 0.413, - "step": 8760 - }, - { - "epoch": 7.6, - "learning_rate": 3.422167832167832e-06, - "loss": 0.4442, - "step": 8770 - }, - { - "epoch": 7.61, - "learning_rate": 3.4214685314685313e-06, - "loss": 0.4296, - "step": 8780 - }, - { - "epoch": 7.62, - "learning_rate": 3.4207692307692308e-06, - "loss": 0.3851, - "step": 8790 - }, - { - "epoch": 7.63, - "learning_rate": 3.4200699300699303e-06, - "loss": 0.4104, - "step": 8800 - }, - { - "epoch": 7.63, - "learning_rate": 3.419370629370629e-06, - "loss": 0.4401, - "step": 8810 - }, - { - "epoch": 7.64, - "learning_rate": 3.4186713286713284e-06, - "loss": 0.4269, - "step": 8820 - }, - { - "epoch": 7.65, - "learning_rate": 3.417972027972028e-06, - "loss": 0.4383, - "step": 8830 - }, - { - "epoch": 7.66, - "learning_rate": 3.4172727272727274e-06, - "loss": 0.3926, - "step": 8840 - }, - { - "epoch": 7.67, - "learning_rate": 3.4165734265734265e-06, - "loss": 0.4193, - "step": 8850 - }, - { - "epoch": 7.68, - "learning_rate": 3.4158741258741255e-06, - "loss": 0.3959, - "step": 8860 - }, - { - "epoch": 7.69, - "learning_rate": 3.415174825174825e-06, - "loss": 0.4067, - "step": 8870 - }, - { - "epoch": 7.69, - "learning_rate": 3.414475524475524e-06, - "loss": 0.3681, - "step": 8880 - }, - { - "epoch": 7.7, - "learning_rate": 3.4137762237762236e-06, - "loss": 0.4089, - "step": 8890 - }, - { - "epoch": 7.71, - "learning_rate": 3.413076923076923e-06, - "loss": 0.4024, - "step": 8900 - }, - { - "epoch": 7.72, - "learning_rate": 3.412377622377622e-06, - "loss": 0.3742, - "step": 8910 - }, - { - "epoch": 7.73, - "learning_rate": 3.4116783216783213e-06, - "loss": 0.3803, - "step": 8920 - }, - { - "epoch": 7.74, - "learning_rate": 3.4109790209790208e-06, - "loss": 0.4946, - "step": 8930 - }, - { - "epoch": 7.75, - "learning_rate": 3.4102797202797202e-06, - "loss": 0.372, - "step": 8940 - }, - { - "epoch": 7.76, - "learning_rate": 3.4095804195804197e-06, - "loss": 0.4491, - "step": 8950 - }, - { - "epoch": 7.76, - "learning_rate": 3.408881118881119e-06, - "loss": 0.4298, - "step": 8960 - }, - { - "epoch": 7.77, - "learning_rate": 3.408181818181818e-06, - "loss": 0.411, - "step": 8970 - }, - { - "epoch": 7.78, - "learning_rate": 3.4074825174825174e-06, - "loss": 0.4381, - "step": 8980 - }, - { - "epoch": 7.79, - "learning_rate": 3.4067832167832165e-06, - "loss": 0.3929, - "step": 8990 - }, - { - "epoch": 7.8, - "learning_rate": 3.406083916083916e-06, - "loss": 0.3752, - "step": 9000 - }, - { - "epoch": 7.81, - "learning_rate": 3.4053846153846155e-06, - "loss": 0.4362, - "step": 9010 - }, - { - "epoch": 7.82, - "learning_rate": 3.4046853146853145e-06, - "loss": 0.4371, - "step": 9020 - }, - { - "epoch": 7.82, - "learning_rate": 3.4039860139860136e-06, - "loss": 0.4526, - "step": 9030 - }, - { - "epoch": 7.83, - "learning_rate": 3.403286713286713e-06, - "loss": 0.4018, - "step": 9040 - }, - { - "epoch": 7.84, - "learning_rate": 3.4025874125874126e-06, - "loss": 0.3963, - "step": 9050 - }, - { - "epoch": 7.85, - "learning_rate": 3.4018881118881117e-06, - "loss": 0.3984, - "step": 9060 - }, - { - "epoch": 7.86, - "learning_rate": 3.401188811188811e-06, - "loss": 0.4395, - "step": 9070 - }, - { - "epoch": 7.87, - "learning_rate": 3.4004895104895102e-06, - "loss": 0.4229, - "step": 9080 - }, - { - "epoch": 7.88, - "learning_rate": 3.3997902097902097e-06, - "loss": 0.4344, - "step": 9090 - }, - { - "epoch": 7.89, - "learning_rate": 3.399090909090909e-06, - "loss": 0.3741, - "step": 9100 - }, - { - "epoch": 7.89, - "learning_rate": 3.3983916083916083e-06, - "loss": 0.3811, - "step": 9110 - }, - { - "epoch": 7.9, - "learning_rate": 3.397692307692308e-06, - "loss": 0.3972, - "step": 9120 - }, - { - "epoch": 7.91, - "learning_rate": 3.396993006993007e-06, - "loss": 0.4293, - "step": 9130 - }, - { - "epoch": 7.92, - "learning_rate": 3.396293706293706e-06, - "loss": 0.4136, - "step": 9140 - }, - { - "epoch": 7.93, - "learning_rate": 3.3955944055944054e-06, - "loss": 0.3997, - "step": 9150 - }, - { - "epoch": 7.94, - "learning_rate": 3.394895104895105e-06, - "loss": 0.4106, - "step": 9160 - }, - { - "epoch": 7.95, - "learning_rate": 3.394195804195804e-06, - "loss": 0.4311, - "step": 9170 - }, - { - "epoch": 7.95, - "learning_rate": 3.393496503496503e-06, - "loss": 0.411, - "step": 9180 - }, - { - "epoch": 7.96, - "learning_rate": 3.3927972027972026e-06, - "loss": 0.4382, - "step": 9190 - }, - { - "epoch": 7.97, - "learning_rate": 3.392097902097902e-06, - "loss": 0.3804, - "step": 9200 - }, - { - "epoch": 7.98, - "learning_rate": 3.391398601398601e-06, - "loss": 0.4592, - "step": 9210 - }, - { - "epoch": 7.99, - "learning_rate": 3.3906993006993007e-06, - "loss": 0.4102, - "step": 9220 - }, - { - "epoch": 8.0, - "learning_rate": 3.39e-06, - "loss": 0.4234, - "step": 9230 - }, - { - "epoch": 8.0, - "eval_loss": 0.5488837957382202, - "eval_runtime": 134.1414, - "eval_samples_per_second": 3.966, - "eval_steps_per_second": 1.983, - "eval_wer": 0.2652182297358103, - "step": 9232 - }, - { - "epoch": 8.01, - "learning_rate": 3.389300699300699e-06, - "loss": 0.3802, - "step": 9240 - }, - { - "epoch": 8.02, - "learning_rate": 3.3886013986013983e-06, - "loss": 0.4252, - "step": 9250 - }, - { - "epoch": 8.02, - "learning_rate": 3.387902097902098e-06, - "loss": 0.3946, - "step": 9260 - }, - { - "epoch": 8.03, - "learning_rate": 3.3872027972027973e-06, - "loss": 0.397, - "step": 9270 - }, - { - "epoch": 8.04, - "learning_rate": 3.3865034965034964e-06, - "loss": 0.5124, - "step": 9280 - }, - { - "epoch": 8.05, - "learning_rate": 3.3858041958041954e-06, - "loss": 0.3946, - "step": 9290 - }, - { - "epoch": 8.06, - "learning_rate": 3.385104895104895e-06, - "loss": 0.4221, - "step": 9300 - }, - { - "epoch": 8.07, - "learning_rate": 3.384405594405594e-06, - "loss": 0.4058, - "step": 9310 - }, - { - "epoch": 8.08, - "learning_rate": 3.3837062937062935e-06, - "loss": 0.4154, - "step": 9320 - }, - { - "epoch": 8.08, - "learning_rate": 3.383006993006993e-06, - "loss": 0.4059, - "step": 9330 - }, - { - "epoch": 8.09, - "learning_rate": 3.3823076923076925e-06, - "loss": 0.4428, - "step": 9340 - }, - { - "epoch": 8.1, - "learning_rate": 3.381608391608391e-06, - "loss": 0.4559, - "step": 9350 - }, - { - "epoch": 8.11, - "learning_rate": 3.3809090909090906e-06, - "loss": 0.4143, - "step": 9360 - }, - { - "epoch": 8.12, - "learning_rate": 3.38020979020979e-06, - "loss": 0.3998, - "step": 9370 - }, - { - "epoch": 8.13, - "learning_rate": 3.3795104895104896e-06, - "loss": 0.4962, - "step": 9380 - }, - { - "epoch": 8.14, - "learning_rate": 3.3788111888111887e-06, - "loss": 0.4313, - "step": 9390 - }, - { - "epoch": 8.15, - "learning_rate": 3.378111888111888e-06, - "loss": 0.4054, - "step": 9400 - }, - { - "epoch": 8.15, - "learning_rate": 3.3774125874125873e-06, - "loss": 0.4037, - "step": 9410 - }, - { - "epoch": 8.16, - "learning_rate": 3.3767132867132864e-06, - "loss": 0.3747, - "step": 9420 - }, - { - "epoch": 8.17, - "learning_rate": 3.376013986013986e-06, - "loss": 0.3761, - "step": 9430 - }, - { - "epoch": 8.18, - "learning_rate": 3.3753146853146854e-06, - "loss": 0.4675, - "step": 9440 - }, - { - "epoch": 8.19, - "learning_rate": 3.374615384615385e-06, - "loss": 0.4281, - "step": 9450 - }, - { - "epoch": 8.2, - "learning_rate": 3.3739160839160835e-06, - "loss": 0.3503, - "step": 9460 - }, - { - "epoch": 8.21, - "learning_rate": 3.373216783216783e-06, - "loss": 0.4173, - "step": 9470 - }, - { - "epoch": 8.21, - "learning_rate": 3.3725174825174825e-06, - "loss": 0.4234, - "step": 9480 - }, - { - "epoch": 8.22, - "learning_rate": 3.3718181818181816e-06, - "loss": 0.39, - "step": 9490 - }, - { - "epoch": 8.23, - "learning_rate": 3.371118881118881e-06, - "loss": 0.424, - "step": 9500 - }, - { - "epoch": 8.24, - "learning_rate": 3.37041958041958e-06, - "loss": 0.4464, - "step": 9510 - }, - { - "epoch": 8.25, - "learning_rate": 3.3697202797202796e-06, - "loss": 0.4552, - "step": 9520 - }, - { - "epoch": 8.26, - "learning_rate": 3.3690209790209787e-06, - "loss": 0.4114, - "step": 9530 - }, - { - "epoch": 8.27, - "learning_rate": 3.368321678321678e-06, - "loss": 0.423, - "step": 9540 - }, - { - "epoch": 8.28, - "learning_rate": 3.3676223776223777e-06, - "loss": 0.4322, - "step": 9550 - }, - { - "epoch": 8.28, - "learning_rate": 3.3669230769230768e-06, - "loss": 0.3917, - "step": 9560 - }, - { - "epoch": 8.29, - "learning_rate": 3.366223776223776e-06, - "loss": 0.4033, - "step": 9570 - }, - { - "epoch": 8.3, - "learning_rate": 3.3655244755244753e-06, - "loss": 0.4534, - "step": 9580 - }, - { - "epoch": 8.31, - "learning_rate": 3.364825174825175e-06, - "loss": 0.4289, - "step": 9590 - }, - { - "epoch": 8.32, - "learning_rate": 3.364125874125874e-06, - "loss": 0.4591, - "step": 9600 - }, - { - "epoch": 8.33, - "learning_rate": 3.3634265734265734e-06, - "loss": 0.398, - "step": 9610 - }, - { - "epoch": 8.34, - "learning_rate": 3.3627272727272725e-06, - "loss": 0.425, - "step": 9620 - }, - { - "epoch": 8.34, - "learning_rate": 3.362027972027972e-06, - "loss": 0.4334, - "step": 9630 - }, - { - "epoch": 8.35, - "learning_rate": 3.361328671328671e-06, - "loss": 0.3715, - "step": 9640 - }, - { - "epoch": 8.36, - "learning_rate": 3.3606293706293706e-06, - "loss": 0.4115, - "step": 9650 - }, - { - "epoch": 8.37, - "learning_rate": 3.35993006993007e-06, - "loss": 0.3408, - "step": 9660 - }, - { - "epoch": 8.38, - "learning_rate": 3.3592307692307687e-06, - "loss": 0.4309, - "step": 9670 - }, - { - "epoch": 8.39, - "learning_rate": 3.358531468531468e-06, - "loss": 0.4107, - "step": 9680 - }, - { - "epoch": 8.4, - "learning_rate": 3.3578321678321677e-06, - "loss": 0.3915, - "step": 9690 - }, - { - "epoch": 8.41, - "learning_rate": 3.357132867132867e-06, - "loss": 0.4034, - "step": 9700 - }, - { - "epoch": 8.41, - "learning_rate": 3.3564335664335663e-06, - "loss": 0.3847, - "step": 9710 - }, - { - "epoch": 8.42, - "learning_rate": 3.3557342657342653e-06, - "loss": 0.423, - "step": 9720 - }, - { - "epoch": 8.43, - "learning_rate": 3.355034965034965e-06, - "loss": 0.4304, - "step": 9730 - }, - { - "epoch": 8.44, - "learning_rate": 3.3543356643356643e-06, - "loss": 0.4048, - "step": 9740 - }, - { - "epoch": 8.45, - "learning_rate": 3.3536363636363634e-06, - "loss": 0.3768, - "step": 9750 - }, - { - "epoch": 8.46, - "learning_rate": 3.352937062937063e-06, - "loss": 0.3473, - "step": 9760 - }, - { - "epoch": 8.47, - "learning_rate": 3.3522377622377624e-06, - "loss": 0.4231, - "step": 9770 - }, - { - "epoch": 8.47, - "learning_rate": 3.351538461538461e-06, - "loss": 0.3808, - "step": 9780 - }, - { - "epoch": 8.48, - "learning_rate": 3.3508391608391605e-06, - "loss": 0.3728, - "step": 9790 - }, - { - "epoch": 8.49, - "learning_rate": 3.35013986013986e-06, - "loss": 0.4372, - "step": 9800 - }, - { - "epoch": 8.5, - "learning_rate": 3.3494405594405595e-06, - "loss": 0.4418, - "step": 9810 - }, - { - "epoch": 8.51, - "learning_rate": 3.3487412587412586e-06, - "loss": 0.4072, - "step": 9820 - }, - { - "epoch": 8.52, - "learning_rate": 3.3480419580419577e-06, - "loss": 0.441, - "step": 9830 - }, - { - "epoch": 8.53, - "learning_rate": 3.347342657342657e-06, - "loss": 0.3316, - "step": 9840 - }, - { - "epoch": 8.54, - "learning_rate": 3.3466433566433563e-06, - "loss": 0.381, - "step": 9850 - }, - { - "epoch": 8.54, - "learning_rate": 3.3459440559440558e-06, - "loss": 0.401, - "step": 9860 - }, - { - "epoch": 8.55, - "learning_rate": 3.3452447552447553e-06, - "loss": 0.4355, - "step": 9870 - }, - { - "epoch": 8.56, - "learning_rate": 3.3445454545454547e-06, - "loss": 0.511, - "step": 9880 - }, - { - "epoch": 8.57, - "learning_rate": 3.3438461538461534e-06, - "loss": 0.413, - "step": 9890 - }, - { - "epoch": 8.58, - "learning_rate": 3.343146853146853e-06, - "loss": 0.422, - "step": 9900 - }, - { - "epoch": 8.59, - "learning_rate": 3.3424475524475524e-06, - "loss": 0.4066, - "step": 9910 - }, - { - "epoch": 8.6, - "learning_rate": 3.341748251748252e-06, - "loss": 0.3828, - "step": 9920 - }, - { - "epoch": 8.6, - "learning_rate": 3.341048951048951e-06, - "loss": 0.4135, - "step": 9930 - }, - { - "epoch": 8.61, - "learning_rate": 3.34034965034965e-06, - "loss": 0.4386, - "step": 9940 - }, - { - "epoch": 8.62, - "learning_rate": 3.3396503496503495e-06, - "loss": 0.3895, - "step": 9950 - }, - { - "epoch": 8.63, - "learning_rate": 3.3389510489510486e-06, - "loss": 0.3449, - "step": 9960 - }, - { - "epoch": 8.64, - "learning_rate": 3.338251748251748e-06, - "loss": 0.3914, - "step": 9970 - }, - { - "epoch": 8.65, - "learning_rate": 3.3375524475524476e-06, - "loss": 0.4172, - "step": 9980 - }, - { - "epoch": 8.66, - "learning_rate": 3.336853146853147e-06, - "loss": 0.3624, - "step": 9990 - }, - { - "epoch": 8.67, - "learning_rate": 3.3361538461538457e-06, - "loss": 0.3909, - "step": 10000 - }, - { - "epoch": 8.67, - "learning_rate": 3.3354545454545452e-06, - "loss": 0.4117, - "step": 10010 - }, - { - "epoch": 8.68, - "learning_rate": 3.3347552447552447e-06, - "loss": 0.3968, - "step": 10020 - }, - { - "epoch": 8.69, - "learning_rate": 3.334055944055944e-06, - "loss": 0.4085, - "step": 10030 - }, - { - "epoch": 8.7, - "learning_rate": 3.3333566433566433e-06, - "loss": 0.4649, - "step": 10040 - }, - { - "epoch": 8.71, - "learning_rate": 3.3326573426573424e-06, - "loss": 0.4003, - "step": 10050 - }, - { - "epoch": 8.72, - "learning_rate": 3.331958041958042e-06, - "loss": 0.3796, - "step": 10060 - }, - { - "epoch": 8.73, - "learning_rate": 3.331258741258741e-06, - "loss": 0.4687, - "step": 10070 - }, - { - "epoch": 8.73, - "learning_rate": 3.3305594405594405e-06, - "loss": 0.4325, - "step": 10080 - }, - { - "epoch": 8.74, - "learning_rate": 3.32986013986014e-06, - "loss": 0.4062, - "step": 10090 - }, - { - "epoch": 8.75, - "learning_rate": 3.329160839160839e-06, - "loss": 0.3887, - "step": 10100 - }, - { - "epoch": 8.76, - "learning_rate": 3.328461538461538e-06, - "loss": 0.3791, - "step": 10110 - }, - { - "epoch": 8.77, - "learning_rate": 3.3277622377622376e-06, - "loss": 0.4117, - "step": 10120 - }, - { - "epoch": 8.78, - "learning_rate": 3.327062937062937e-06, - "loss": 0.4206, - "step": 10130 - }, - { - "epoch": 8.79, - "learning_rate": 3.326363636363636e-06, - "loss": 0.4569, - "step": 10140 - }, - { - "epoch": 8.8, - "learning_rate": 3.3256643356643357e-06, - "loss": 0.3759, - "step": 10150 - }, - { - "epoch": 8.8, - "learning_rate": 3.3249650349650347e-06, - "loss": 0.414, - "step": 10160 - }, - { - "epoch": 8.81, - "learning_rate": 3.3242657342657342e-06, - "loss": 0.3948, - "step": 10170 - }, - { - "epoch": 8.82, - "learning_rate": 3.3235664335664333e-06, - "loss": 0.426, - "step": 10180 - }, - { - "epoch": 8.83, - "learning_rate": 3.322867132867133e-06, - "loss": 0.4246, - "step": 10190 - }, - { - "epoch": 8.84, - "learning_rate": 3.3221678321678323e-06, - "loss": 0.4605, - "step": 10200 - }, - { - "epoch": 8.85, - "learning_rate": 3.321468531468531e-06, - "loss": 0.4355, - "step": 10210 - }, - { - "epoch": 8.86, - "learning_rate": 3.3207692307692304e-06, - "loss": 0.4407, - "step": 10220 - }, - { - "epoch": 8.86, - "learning_rate": 3.32006993006993e-06, - "loss": 0.4483, - "step": 10230 - }, - { - "epoch": 8.87, - "learning_rate": 3.3193706293706294e-06, - "loss": 0.3864, - "step": 10240 - }, - { - "epoch": 8.88, - "learning_rate": 3.3186713286713285e-06, - "loss": 0.4614, - "step": 10250 - }, - { - "epoch": 8.89, - "learning_rate": 3.317972027972028e-06, - "loss": 0.3972, - "step": 10260 - }, - { - "epoch": 8.9, - "learning_rate": 3.317272727272727e-06, - "loss": 0.4305, - "step": 10270 - }, - { - "epoch": 8.91, - "learning_rate": 3.316573426573426e-06, - "loss": 0.3863, - "step": 10280 - }, - { - "epoch": 8.92, - "learning_rate": 3.3158741258741257e-06, - "loss": 0.4265, - "step": 10290 - }, - { - "epoch": 8.93, - "learning_rate": 3.315174825174825e-06, - "loss": 0.3841, - "step": 10300 - }, - { - "epoch": 8.93, - "learning_rate": 3.3144755244755246e-06, - "loss": 0.3922, - "step": 10310 - }, - { - "epoch": 8.94, - "learning_rate": 3.3137762237762233e-06, - "loss": 0.3994, - "step": 10320 - }, - { - "epoch": 8.95, - "learning_rate": 3.313076923076923e-06, - "loss": 0.4247, - "step": 10330 - }, - { - "epoch": 8.96, - "learning_rate": 3.3123776223776223e-06, - "loss": 0.4377, - "step": 10340 - }, - { - "epoch": 8.97, - "learning_rate": 3.3116783216783218e-06, - "loss": 0.3737, - "step": 10350 - }, - { - "epoch": 8.98, - "learning_rate": 3.310979020979021e-06, - "loss": 0.3754, - "step": 10360 - }, - { - "epoch": 8.99, - "learning_rate": 3.31027972027972e-06, - "loss": 0.4627, - "step": 10370 - }, - { - "epoch": 8.99, - "learning_rate": 3.3095804195804194e-06, - "loss": 0.3965, - "step": 10380 - }, - { - "epoch": 9.0, - "eval_loss": 0.560581386089325, - "eval_runtime": 133.9098, - "eval_samples_per_second": 3.973, - "eval_steps_per_second": 1.986, - "eval_wer": 0.26014012984508583, - "step": 10386 - }, - { - "epoch": 9.0, - "learning_rate": 3.3088811188811185e-06, - "loss": 0.4449, - "step": 10390 - }, - { - "epoch": 9.01, - "learning_rate": 3.308181818181818e-06, - "loss": 0.4246, - "step": 10400 - }, - { - "epoch": 9.02, - "learning_rate": 3.3074825174825175e-06, - "loss": 0.4037, - "step": 10410 - }, - { - "epoch": 9.03, - "learning_rate": 3.306783216783217e-06, - "loss": 0.3731, - "step": 10420 - }, - { - "epoch": 9.04, - "learning_rate": 3.3060839160839156e-06, - "loss": 0.4149, - "step": 10430 - }, - { - "epoch": 9.05, - "learning_rate": 3.305384615384615e-06, - "loss": 0.4062, - "step": 10440 - }, - { - "epoch": 9.06, - "learning_rate": 3.3046853146853146e-06, - "loss": 0.4265, - "step": 10450 - }, - { - "epoch": 9.06, - "learning_rate": 3.3039860139860137e-06, - "loss": 0.3848, - "step": 10460 - }, - { - "epoch": 9.07, - "learning_rate": 3.303286713286713e-06, - "loss": 0.3891, - "step": 10470 - }, - { - "epoch": 9.08, - "learning_rate": 3.3025874125874123e-06, - "loss": 0.4249, - "step": 10480 - }, - { - "epoch": 9.09, - "learning_rate": 3.3018881118881118e-06, - "loss": 0.404, - "step": 10490 - }, - { - "epoch": 9.1, - "learning_rate": 3.301188811188811e-06, - "loss": 0.4211, - "step": 10500 - }, - { - "epoch": 9.11, - "learning_rate": 3.3004895104895104e-06, - "loss": 0.3693, - "step": 10510 - }, - { - "epoch": 9.12, - "learning_rate": 3.29979020979021e-06, - "loss": 0.4231, - "step": 10520 - }, - { - "epoch": 9.12, - "learning_rate": 3.2990909090909093e-06, - "loss": 0.379, - "step": 10530 - }, - { - "epoch": 9.13, - "learning_rate": 3.298391608391608e-06, - "loss": 0.3743, - "step": 10540 - }, - { - "epoch": 9.14, - "learning_rate": 3.2976923076923075e-06, - "loss": 0.3608, - "step": 10550 - }, - { - "epoch": 9.15, - "learning_rate": 3.296993006993007e-06, - "loss": 0.3752, - "step": 10560 - }, - { - "epoch": 9.16, - "learning_rate": 3.296293706293706e-06, - "loss": 0.4375, - "step": 10570 - }, - { - "epoch": 9.17, - "learning_rate": 3.2955944055944056e-06, - "loss": 0.4091, - "step": 10580 - }, - { - "epoch": 9.18, - "learning_rate": 3.2948951048951046e-06, - "loss": 0.4659, - "step": 10590 - }, - { - "epoch": 9.19, - "learning_rate": 3.294195804195804e-06, - "loss": 0.4305, - "step": 10600 - }, - { - "epoch": 9.19, - "learning_rate": 3.293496503496503e-06, - "loss": 0.3882, - "step": 10610 - }, - { - "epoch": 9.2, - "learning_rate": 3.2927972027972027e-06, - "loss": 0.3877, - "step": 10620 - }, - { - "epoch": 9.21, - "learning_rate": 3.292097902097902e-06, - "loss": 0.4133, - "step": 10630 - }, - { - "epoch": 9.22, - "learning_rate": 3.291398601398601e-06, - "loss": 0.4197, - "step": 10640 - }, - { - "epoch": 9.23, - "learning_rate": 3.2906993006993003e-06, - "loss": 0.3962, - "step": 10650 - }, - { - "epoch": 9.24, - "learning_rate": 3.29e-06, - "loss": 0.4339, - "step": 10660 - }, - { - "epoch": 9.25, - "learning_rate": 3.2893006993006993e-06, - "loss": 0.405, - "step": 10670 - }, - { - "epoch": 9.25, - "learning_rate": 3.2886013986013984e-06, - "loss": 0.411, - "step": 10680 - }, - { - "epoch": 9.26, - "learning_rate": 3.287902097902098e-06, - "loss": 0.4084, - "step": 10690 - }, - { - "epoch": 9.27, - "learning_rate": 3.287202797202797e-06, - "loss": 0.4886, - "step": 10700 - }, - { - "epoch": 9.28, - "learning_rate": 3.2865034965034965e-06, - "loss": 0.4184, - "step": 10710 - }, - { - "epoch": 9.29, - "learning_rate": 3.2858041958041956e-06, - "loss": 0.407, - "step": 10720 - }, - { - "epoch": 9.3, - "learning_rate": 3.285104895104895e-06, - "loss": 0.4283, - "step": 10730 - }, - { - "epoch": 9.31, - "learning_rate": 3.2844055944055945e-06, - "loss": 0.3711, - "step": 10740 - }, - { - "epoch": 9.32, - "learning_rate": 3.283706293706293e-06, - "loss": 0.4128, - "step": 10750 - }, - { - "epoch": 9.32, - "learning_rate": 3.2830069930069927e-06, - "loss": 0.3888, - "step": 10760 - }, - { - "epoch": 9.33, - "learning_rate": 3.282307692307692e-06, - "loss": 0.4046, - "step": 10770 - }, - { - "epoch": 9.34, - "learning_rate": 3.2816083916083917e-06, - "loss": 0.4792, - "step": 10780 - }, - { - "epoch": 9.35, - "learning_rate": 3.2809090909090908e-06, - "loss": 0.3611, - "step": 10790 - }, - { - "epoch": 9.36, - "learning_rate": 3.2802097902097903e-06, - "loss": 0.4009, - "step": 10800 - }, - { - "epoch": 9.37, - "learning_rate": 3.2795104895104893e-06, - "loss": 0.3805, - "step": 10810 - }, - { - "epoch": 9.38, - "learning_rate": 3.2788111888111884e-06, - "loss": 0.3642, - "step": 10820 - }, - { - "epoch": 9.38, - "learning_rate": 3.278111888111888e-06, - "loss": 0.3998, - "step": 10830 - }, - { - "epoch": 9.39, - "learning_rate": 3.2774125874125874e-06, - "loss": 0.4431, - "step": 10840 - }, - { - "epoch": 9.4, - "learning_rate": 3.276713286713287e-06, - "loss": 0.4207, - "step": 10850 - }, - { - "epoch": 9.41, - "learning_rate": 3.2760139860139855e-06, - "loss": 0.392, - "step": 10860 - }, - { - "epoch": 9.42, - "learning_rate": 3.275314685314685e-06, - "loss": 0.3769, - "step": 10870 - }, - { - "epoch": 9.43, - "learning_rate": 3.2746153846153845e-06, - "loss": 0.4146, - "step": 10880 - }, - { - "epoch": 9.44, - "learning_rate": 3.273916083916084e-06, - "loss": 0.4471, - "step": 10890 - }, - { - "epoch": 9.45, - "learning_rate": 3.273216783216783e-06, - "loss": 0.4716, - "step": 10900 - }, - { - "epoch": 9.45, - "learning_rate": 3.272517482517482e-06, - "loss": 0.3586, - "step": 10910 - }, - { - "epoch": 9.46, - "learning_rate": 3.2718181818181817e-06, - "loss": 0.4394, - "step": 10920 - }, - { - "epoch": 9.47, - "learning_rate": 3.2711188811188808e-06, - "loss": 0.4323, - "step": 10930 - }, - { - "epoch": 9.48, - "learning_rate": 3.2704195804195802e-06, - "loss": 0.4524, - "step": 10940 - }, - { - "epoch": 9.49, - "learning_rate": 3.2697202797202797e-06, - "loss": 0.512, - "step": 10950 - }, - { - "epoch": 9.5, - "learning_rate": 3.2690209790209792e-06, - "loss": 0.3513, - "step": 10960 - }, - { - "epoch": 9.51, - "learning_rate": 3.268321678321678e-06, - "loss": 0.4046, - "step": 10970 - }, - { - "epoch": 9.51, - "learning_rate": 3.2676223776223774e-06, - "loss": 0.3967, - "step": 10980 - }, - { - "epoch": 9.52, - "learning_rate": 3.266923076923077e-06, - "loss": 0.4133, - "step": 10990 - }, - { - "epoch": 9.53, - "learning_rate": 3.266223776223776e-06, - "loss": 0.4759, - "step": 11000 - }, - { - "epoch": 9.54, - "learning_rate": 3.2655244755244755e-06, - "loss": 0.3668, - "step": 11010 - }, - { - "epoch": 9.55, - "learning_rate": 3.2648251748251745e-06, - "loss": 0.4029, - "step": 11020 - }, - { - "epoch": 9.56, - "learning_rate": 3.264125874125874e-06, - "loss": 0.4852, - "step": 11030 - }, - { - "epoch": 9.57, - "learning_rate": 3.263426573426573e-06, - "loss": 0.4197, - "step": 11040 - }, - { - "epoch": 9.58, - "learning_rate": 3.2627272727272726e-06, - "loss": 0.4511, - "step": 11050 - }, - { - "epoch": 9.58, - "learning_rate": 3.262027972027972e-06, - "loss": 0.4441, - "step": 11060 - }, - { - "epoch": 9.59, - "learning_rate": 3.2613286713286716e-06, - "loss": 0.4381, - "step": 11070 - }, - { - "epoch": 9.6, - "learning_rate": 3.2606293706293702e-06, - "loss": 0.3922, - "step": 11080 - }, - { - "epoch": 9.61, - "learning_rate": 3.2599300699300697e-06, - "loss": 0.4215, - "step": 11090 - }, - { - "epoch": 9.62, - "learning_rate": 3.2592307692307692e-06, - "loss": 0.3579, - "step": 11100 - }, - { - "epoch": 9.63, - "learning_rate": 3.2585314685314683e-06, - "loss": 0.4254, - "step": 11110 - }, - { - "epoch": 9.64, - "learning_rate": 3.257832167832168e-06, - "loss": 0.3891, - "step": 11120 - }, - { - "epoch": 9.64, - "learning_rate": 3.257132867132867e-06, - "loss": 0.404, - "step": 11130 - }, - { - "epoch": 9.65, - "learning_rate": 3.2564335664335664e-06, - "loss": 0.4374, - "step": 11140 - }, - { - "epoch": 9.66, - "learning_rate": 3.2557342657342654e-06, - "loss": 0.3818, - "step": 11150 - }, - { - "epoch": 9.67, - "learning_rate": 3.255034965034965e-06, - "loss": 0.3742, - "step": 11160 - }, - { - "epoch": 9.68, - "learning_rate": 3.2543356643356644e-06, - "loss": 0.43, - "step": 11170 - }, - { - "epoch": 9.69, - "learning_rate": 3.253636363636363e-06, - "loss": 0.4267, - "step": 11180 - }, - { - "epoch": 9.7, - "learning_rate": 3.2529370629370626e-06, - "loss": 0.4361, - "step": 11190 - }, - { - "epoch": 9.71, - "learning_rate": 3.252237762237762e-06, - "loss": 0.4058, - "step": 11200 - }, - { - "epoch": 9.71, - "learning_rate": 3.2515384615384616e-06, - "loss": 0.3672, - "step": 11210 - }, - { - "epoch": 9.72, - "learning_rate": 3.2508391608391607e-06, - "loss": 0.3858, - "step": 11220 - }, - { - "epoch": 9.73, - "learning_rate": 3.25013986013986e-06, - "loss": 0.3885, - "step": 11230 - }, - { - "epoch": 9.74, - "learning_rate": 3.2494405594405592e-06, - "loss": 0.3776, - "step": 11240 - }, - { - "epoch": 9.75, - "learning_rate": 3.2487412587412583e-06, - "loss": 0.4401, - "step": 11250 - }, - { - "epoch": 9.76, - "learning_rate": 3.248041958041958e-06, - "loss": 0.4318, - "step": 11260 - }, - { - "epoch": 9.77, - "learning_rate": 3.2473426573426573e-06, - "loss": 0.4234, - "step": 11270 - }, - { - "epoch": 9.77, - "learning_rate": 3.246643356643357e-06, - "loss": 0.436, - "step": 11280 - }, - { - "epoch": 9.78, - "learning_rate": 3.2459440559440554e-06, - "loss": 0.4338, - "step": 11290 - }, - { - "epoch": 9.79, - "learning_rate": 3.245244755244755e-06, - "loss": 0.4059, - "step": 11300 - }, - { - "epoch": 9.8, - "learning_rate": 3.2445454545454544e-06, - "loss": 0.4006, - "step": 11310 - }, - { - "epoch": 9.81, - "learning_rate": 3.243916083916084e-06, - "loss": 0.417, - "step": 11320 - }, - { - "epoch": 9.82, - "learning_rate": 3.243216783216783e-06, - "loss": 0.4349, - "step": 11330 - }, - { - "epoch": 9.83, - "learning_rate": 3.2425174825174825e-06, - "loss": 0.4421, - "step": 11340 - }, - { - "epoch": 9.83, - "learning_rate": 3.2418181818181815e-06, - "loss": 0.4203, - "step": 11350 - }, - { - "epoch": 9.84, - "learning_rate": 3.241118881118881e-06, - "loss": 0.3779, - "step": 11360 - }, - { - "epoch": 9.85, - "learning_rate": 3.2404195804195805e-06, - "loss": 0.4028, - "step": 11370 - }, - { - "epoch": 9.86, - "learning_rate": 3.239720279720279e-06, - "loss": 0.3965, - "step": 11380 - }, - { - "epoch": 9.87, - "learning_rate": 3.2390209790209787e-06, - "loss": 0.3674, - "step": 11390 - }, - { - "epoch": 9.88, - "learning_rate": 3.238321678321678e-06, - "loss": 0.3918, - "step": 11400 - }, - { - "epoch": 9.89, - "learning_rate": 3.2376223776223777e-06, - "loss": 0.4187, - "step": 11410 - }, - { - "epoch": 9.9, - "learning_rate": 3.2369230769230768e-06, - "loss": 0.3845, - "step": 11420 - }, - { - "epoch": 9.9, - "learning_rate": 3.2362237762237762e-06, - "loss": 0.4286, - "step": 11430 - }, - { - "epoch": 9.91, - "learning_rate": 3.2355244755244753e-06, - "loss": 0.448, - "step": 11440 - }, - { - "epoch": 9.92, - "learning_rate": 3.2348251748251744e-06, - "loss": 0.4251, - "step": 11450 - }, - { - "epoch": 9.93, - "learning_rate": 3.234125874125874e-06, - "loss": 0.4281, - "step": 11460 - }, - { - "epoch": 9.94, - "learning_rate": 3.2334265734265734e-06, - "loss": 0.4495, - "step": 11470 - }, - { - "epoch": 9.95, - "learning_rate": 3.232727272727273e-06, - "loss": 0.3919, - "step": 11480 - }, - { - "epoch": 9.96, - "learning_rate": 3.2320279720279715e-06, - "loss": 0.4116, - "step": 11490 - }, - { - "epoch": 9.96, - "learning_rate": 3.231328671328671e-06, - "loss": 0.3788, - "step": 11500 - }, - { - "epoch": 9.97, - "learning_rate": 3.2306293706293705e-06, - "loss": 0.3904, - "step": 11510 - }, - { - "epoch": 9.98, - "learning_rate": 3.22993006993007e-06, - "loss": 0.412, - "step": 11520 - }, - { - "epoch": 9.99, - "learning_rate": 3.229230769230769e-06, - "loss": 0.3909, - "step": 11530 - }, - { - "epoch": 10.0, - "learning_rate": 3.2285314685314686e-06, - "loss": 0.4383, - "step": 11540 - }, - { - "epoch": 10.0, - "eval_loss": 0.5629733204841614, - "eval_runtime": 133.284, - "eval_samples_per_second": 3.991, - "eval_steps_per_second": 1.996, - "eval_wer": 0.2606543678087035, - "step": 11540 - }, - { - "epoch": 10.01, - "learning_rate": 3.2278321678321677e-06, - "loss": 0.422, - "step": 11550 - }, - { - "epoch": 10.02, - "learning_rate": 3.2271328671328667e-06, - "loss": 0.4198, - "step": 11560 - }, - { - "epoch": 10.03, - "learning_rate": 3.2264335664335662e-06, - "loss": 0.3768, - "step": 11570 - }, - { - "epoch": 10.03, - "learning_rate": 3.2257342657342657e-06, - "loss": 0.4059, - "step": 11580 - }, - { - "epoch": 10.04, - "learning_rate": 3.2250349650349652e-06, - "loss": 0.4248, - "step": 11590 - }, - { - "epoch": 10.05, - "learning_rate": 3.224335664335664e-06, - "loss": 0.3902, - "step": 11600 - }, - { - "epoch": 10.06, - "learning_rate": 3.2236363636363634e-06, - "loss": 0.383, - "step": 11610 - }, - { - "epoch": 10.07, - "learning_rate": 3.222937062937063e-06, - "loss": 0.3833, - "step": 11620 - }, - { - "epoch": 10.08, - "learning_rate": 3.222237762237762e-06, - "loss": 0.4813, - "step": 11630 - }, - { - "epoch": 10.09, - "learning_rate": 3.2215384615384614e-06, - "loss": 0.3924, - "step": 11640 - }, - { - "epoch": 10.1, - "learning_rate": 3.220839160839161e-06, - "loss": 0.3906, - "step": 11650 - }, - { - "epoch": 10.1, - "learning_rate": 3.22013986013986e-06, - "loss": 0.3665, - "step": 11660 - }, - { - "epoch": 10.11, - "learning_rate": 3.219440559440559e-06, - "loss": 0.3477, - "step": 11670 - }, - { - "epoch": 10.12, - "learning_rate": 3.2187412587412586e-06, - "loss": 0.4091, - "step": 11680 - }, - { - "epoch": 10.13, - "learning_rate": 3.218041958041958e-06, - "loss": 0.3921, - "step": 11690 - }, - { - "epoch": 10.14, - "learning_rate": 3.2173426573426576e-06, - "loss": 0.3875, - "step": 11700 - }, - { - "epoch": 10.15, - "learning_rate": 3.2166433566433562e-06, - "loss": 0.4104, - "step": 11710 - }, - { - "epoch": 10.16, - "learning_rate": 3.2159440559440557e-06, - "loss": 0.3885, - "step": 11720 - }, - { - "epoch": 10.16, - "learning_rate": 3.2152447552447552e-06, - "loss": 0.3613, - "step": 11730 - }, - { - "epoch": 10.17, - "learning_rate": 3.2145454545454543e-06, - "loss": 0.471, - "step": 11740 - }, - { - "epoch": 10.18, - "learning_rate": 3.213846153846154e-06, - "loss": 0.4413, - "step": 11750 - }, - { - "epoch": 10.19, - "learning_rate": 3.213146853146853e-06, - "loss": 0.3643, - "step": 11760 - }, - { - "epoch": 10.2, - "learning_rate": 3.2124475524475524e-06, - "loss": 0.3322, - "step": 11770 - }, - { - "epoch": 10.21, - "learning_rate": 3.2117482517482514e-06, - "loss": 0.3777, - "step": 11780 - }, - { - "epoch": 10.22, - "learning_rate": 3.211048951048951e-06, - "loss": 0.4579, - "step": 11790 - }, - { - "epoch": 10.23, - "learning_rate": 3.2103496503496504e-06, - "loss": 0.3609, - "step": 11800 - }, - { - "epoch": 10.23, - "learning_rate": 3.2096503496503495e-06, - "loss": 0.4145, - "step": 11810 - }, - { - "epoch": 10.24, - "learning_rate": 3.2089510489510486e-06, - "loss": 0.4498, - "step": 11820 - }, - { - "epoch": 10.25, - "learning_rate": 3.208251748251748e-06, - "loss": 0.4212, - "step": 11830 - }, - { - "epoch": 10.26, - "learning_rate": 3.2075524475524476e-06, - "loss": 0.4339, - "step": 11840 - }, - { - "epoch": 10.27, - "learning_rate": 3.2068531468531466e-06, - "loss": 0.4033, - "step": 11850 - }, - { - "epoch": 10.28, - "learning_rate": 3.206153846153846e-06, - "loss": 0.3386, - "step": 11860 - }, - { - "epoch": 10.29, - "learning_rate": 3.2054545454545452e-06, - "loss": 0.3892, - "step": 11870 - }, - { - "epoch": 10.29, - "learning_rate": 3.2047552447552443e-06, - "loss": 0.3798, - "step": 11880 - }, - { - "epoch": 10.3, - "learning_rate": 3.204055944055944e-06, - "loss": 0.4161, - "step": 11890 - }, - { - "epoch": 10.31, - "learning_rate": 3.2033566433566433e-06, - "loss": 0.3388, - "step": 11900 - }, - { - "epoch": 10.32, - "learning_rate": 3.2026573426573428e-06, - "loss": 0.3871, - "step": 11910 - }, - { - "epoch": 10.33, - "learning_rate": 3.2019580419580414e-06, - "loss": 0.4393, - "step": 11920 - }, - { - "epoch": 10.34, - "learning_rate": 3.201258741258741e-06, - "loss": 0.4055, - "step": 11930 - }, - { - "epoch": 10.35, - "learning_rate": 3.2005594405594404e-06, - "loss": 0.434, - "step": 11940 - }, - { - "epoch": 10.36, - "learning_rate": 3.19986013986014e-06, - "loss": 0.4293, - "step": 11950 - }, - { - "epoch": 10.36, - "learning_rate": 3.199160839160839e-06, - "loss": 0.3783, - "step": 11960 - }, - { - "epoch": 10.37, - "learning_rate": 3.1984615384615385e-06, - "loss": 0.4578, - "step": 11970 - }, - { - "epoch": 10.38, - "learning_rate": 3.1977622377622376e-06, - "loss": 0.3943, - "step": 11980 - }, - { - "epoch": 10.39, - "learning_rate": 3.1970629370629366e-06, - "loss": 0.4987, - "step": 11990 - }, - { - "epoch": 10.4, - "learning_rate": 3.196363636363636e-06, - "loss": 0.4265, - "step": 12000 - }, - { - "epoch": 10.41, - "learning_rate": 3.1956643356643356e-06, - "loss": 0.3909, - "step": 12010 - }, - { - "epoch": 10.42, - "learning_rate": 3.194965034965035e-06, - "loss": 0.3212, - "step": 12020 - }, - { - "epoch": 10.42, - "learning_rate": 3.1942657342657338e-06, - "loss": 0.5361, - "step": 12030 - }, - { - "epoch": 10.43, - "learning_rate": 3.1935664335664333e-06, - "loss": 0.374, - "step": 12040 - }, - { - "epoch": 10.44, - "learning_rate": 3.1928671328671328e-06, - "loss": 0.4897, - "step": 12050 - }, - { - "epoch": 10.45, - "learning_rate": 3.192167832167832e-06, - "loss": 0.4381, - "step": 12060 - }, - { - "epoch": 10.46, - "learning_rate": 3.1914685314685313e-06, - "loss": 0.4138, - "step": 12070 - }, - { - "epoch": 10.47, - "learning_rate": 3.190769230769231e-06, - "loss": 0.4278, - "step": 12080 - }, - { - "epoch": 10.48, - "learning_rate": 3.19006993006993e-06, - "loss": 0.4777, - "step": 12090 - }, - { - "epoch": 10.49, - "learning_rate": 3.189370629370629e-06, - "loss": 0.3806, - "step": 12100 - }, - { - "epoch": 10.49, - "learning_rate": 3.1886713286713285e-06, - "loss": 0.4316, - "step": 12110 - }, - { - "epoch": 10.5, - "learning_rate": 3.187972027972028e-06, - "loss": 0.359, - "step": 12120 - }, - { - "epoch": 10.51, - "learning_rate": 3.1872727272727275e-06, - "loss": 0.4141, - "step": 12130 - }, - { - "epoch": 10.52, - "learning_rate": 3.186573426573426e-06, - "loss": 0.4678, - "step": 12140 - }, - { - "epoch": 10.53, - "learning_rate": 3.1858741258741256e-06, - "loss": 0.5613, - "step": 12150 - }, - { - "epoch": 10.54, - "learning_rate": 3.185174825174825e-06, - "loss": 0.4073, - "step": 12160 - }, - { - "epoch": 10.55, - "learning_rate": 3.184475524475524e-06, - "loss": 0.3658, - "step": 12170 - }, - { - "epoch": 10.55, - "learning_rate": 3.1837762237762237e-06, - "loss": 0.4292, - "step": 12180 - }, - { - "epoch": 10.56, - "learning_rate": 3.183076923076923e-06, - "loss": 0.3994, - "step": 12190 - }, - { - "epoch": 10.57, - "learning_rate": 3.1823776223776223e-06, - "loss": 0.3395, - "step": 12200 - }, - { - "epoch": 10.58, - "learning_rate": 3.1816783216783213e-06, - "loss": 0.3992, - "step": 12210 - }, - { - "epoch": 10.59, - "learning_rate": 3.180979020979021e-06, - "loss": 0.382, - "step": 12220 - }, - { - "epoch": 10.6, - "learning_rate": 3.1802797202797203e-06, - "loss": 0.4397, - "step": 12230 - }, - { - "epoch": 10.61, - "learning_rate": 3.1795804195804194e-06, - "loss": 0.4188, - "step": 12240 - }, - { - "epoch": 10.61, - "learning_rate": 3.1788811188811185e-06, - "loss": 0.3643, - "step": 12250 - }, - { - "epoch": 10.62, - "learning_rate": 3.178181818181818e-06, - "loss": 0.4586, - "step": 12260 - }, - { - "epoch": 10.63, - "learning_rate": 3.1774825174825175e-06, - "loss": 0.3905, - "step": 12270 - }, - { - "epoch": 10.64, - "learning_rate": 3.1767832167832165e-06, - "loss": 0.4422, - "step": 12280 - }, - { - "epoch": 10.65, - "learning_rate": 3.176083916083916e-06, - "loss": 0.3952, - "step": 12290 - }, - { - "epoch": 10.66, - "learning_rate": 3.175384615384615e-06, - "loss": 0.4059, - "step": 12300 - }, - { - "epoch": 10.67, - "learning_rate": 3.1746853146853146e-06, - "loss": 0.4235, - "step": 12310 - }, - { - "epoch": 10.68, - "learning_rate": 3.1739860139860137e-06, - "loss": 0.408, - "step": 12320 - }, - { - "epoch": 10.68, - "learning_rate": 3.173286713286713e-06, - "loss": 0.3726, - "step": 12330 - }, - { - "epoch": 10.69, - "learning_rate": 3.1725874125874127e-06, - "loss": 0.4191, - "step": 12340 - }, - { - "epoch": 10.7, - "learning_rate": 3.1718881118881118e-06, - "loss": 0.3919, - "step": 12350 - }, - { - "epoch": 10.71, - "learning_rate": 3.171188811188811e-06, - "loss": 0.4135, - "step": 12360 - }, - { - "epoch": 10.72, - "learning_rate": 3.1704895104895103e-06, - "loss": 0.449, - "step": 12370 - }, - { - "epoch": 10.73, - "learning_rate": 3.16979020979021e-06, - "loss": 0.4839, - "step": 12380 - }, - { - "epoch": 10.74, - "learning_rate": 3.169090909090909e-06, - "loss": 0.3793, - "step": 12390 - }, - { - "epoch": 10.74, - "learning_rate": 3.1683916083916084e-06, - "loss": 0.4173, - "step": 12400 - }, - { - "epoch": 10.75, - "learning_rate": 3.1676923076923075e-06, - "loss": 0.3964, - "step": 12410 - }, - { - "epoch": 10.76, - "learning_rate": 3.1669930069930065e-06, - "loss": 0.4478, - "step": 12420 - }, - { - "epoch": 10.77, - "learning_rate": 3.166293706293706e-06, - "loss": 0.4247, - "step": 12430 - }, - { - "epoch": 10.78, - "learning_rate": 3.1655944055944055e-06, - "loss": 0.4806, - "step": 12440 - }, - { - "epoch": 10.79, - "learning_rate": 3.164895104895105e-06, - "loss": 0.4104, - "step": 12450 - }, - { - "epoch": 10.8, - "learning_rate": 3.164195804195804e-06, - "loss": 0.4602, - "step": 12460 - }, - { - "epoch": 10.81, - "learning_rate": 3.163496503496503e-06, - "loss": 0.3707, - "step": 12470 - }, - { - "epoch": 10.81, - "learning_rate": 3.1627972027972027e-06, - "loss": 0.3626, - "step": 12480 - }, - { - "epoch": 10.82, - "learning_rate": 3.162097902097902e-06, - "loss": 0.4234, - "step": 12490 - }, - { - "epoch": 10.83, - "learning_rate": 3.1613986013986012e-06, - "loss": 0.37, - "step": 12500 - }, - { - "epoch": 10.84, - "learning_rate": 3.1606993006993007e-06, - "loss": 0.3754, - "step": 12510 - }, - { - "epoch": 10.85, - "learning_rate": 3.16e-06, - "loss": 0.4232, - "step": 12520 - }, - { - "epoch": 10.86, - "learning_rate": 3.159300699300699e-06, - "loss": 0.4205, - "step": 12530 - }, - { - "epoch": 10.87, - "learning_rate": 3.1586013986013984e-06, - "loss": 0.3652, - "step": 12540 - }, - { - "epoch": 10.87, - "learning_rate": 3.157902097902098e-06, - "loss": 0.4103, - "step": 12550 - }, - { - "epoch": 10.88, - "learning_rate": 3.1572027972027974e-06, - "loss": 0.4234, - "step": 12560 - }, - { - "epoch": 10.89, - "learning_rate": 3.156503496503496e-06, - "loss": 0.356, - "step": 12570 - }, - { - "epoch": 10.9, - "learning_rate": 3.1558041958041955e-06, - "loss": 0.4116, - "step": 12580 - }, - { - "epoch": 10.91, - "learning_rate": 3.155104895104895e-06, - "loss": 0.4963, - "step": 12590 - }, - { - "epoch": 10.92, - "learning_rate": 3.154405594405594e-06, - "loss": 0.4658, - "step": 12600 - }, - { - "epoch": 10.93, - "learning_rate": 3.1537062937062936e-06, - "loss": 0.4356, - "step": 12610 - }, - { - "epoch": 10.94, - "learning_rate": 3.153006993006993e-06, - "loss": 0.4288, - "step": 12620 - }, - { - "epoch": 10.94, - "learning_rate": 3.152307692307692e-06, - "loss": 0.3944, - "step": 12630 - }, - { - "epoch": 10.95, - "learning_rate": 3.1516083916083912e-06, - "loss": 0.4145, - "step": 12640 - }, - { - "epoch": 10.96, - "learning_rate": 3.1509090909090907e-06, - "loss": 0.4038, - "step": 12650 - }, - { - "epoch": 10.97, - "learning_rate": 3.1502097902097902e-06, - "loss": 0.4021, - "step": 12660 - }, - { - "epoch": 10.98, - "learning_rate": 3.1495104895104897e-06, - "loss": 0.377, - "step": 12670 - }, - { - "epoch": 10.99, - "learning_rate": 3.1488111888111884e-06, - "loss": 0.3921, - "step": 12680 - }, - { - "epoch": 11.0, - "learning_rate": 3.148111888111888e-06, - "loss": 0.4245, - "step": 12690 - }, - { - "epoch": 11.0, - "eval_loss": 0.5647190809249878, - "eval_runtime": 134.3558, - "eval_samples_per_second": 3.96, - "eval_steps_per_second": 1.98, - "eval_wer": 0.2560905058815967, - "step": 12694 - }, - { - "epoch": 11.01, - "learning_rate": 3.1474125874125874e-06, - "loss": 0.3689, - "step": 12700 - }, - { - "epoch": 11.01, - "learning_rate": 3.1467132867132864e-06, - "loss": 0.3827, - "step": 12710 - }, - { - "epoch": 11.02, - "learning_rate": 3.146013986013986e-06, - "loss": 0.3676, - "step": 12720 - }, - { - "epoch": 11.03, - "learning_rate": 3.1453146853146854e-06, - "loss": 0.4533, - "step": 12730 - }, - { - "epoch": 11.04, - "learning_rate": 3.1446153846153845e-06, - "loss": 0.4324, - "step": 12740 - }, - { - "epoch": 11.05, - "learning_rate": 3.1439160839160836e-06, - "loss": 0.442, - "step": 12750 - }, - { - "epoch": 11.06, - "learning_rate": 3.143216783216783e-06, - "loss": 0.3553, - "step": 12760 - }, - { - "epoch": 11.07, - "learning_rate": 3.1425174825174826e-06, - "loss": 0.4051, - "step": 12770 - }, - { - "epoch": 11.07, - "learning_rate": 3.1418181818181817e-06, - "loss": 0.4422, - "step": 12780 - }, - { - "epoch": 11.08, - "learning_rate": 3.1411188811188807e-06, - "loss": 0.4083, - "step": 12790 - }, - { - "epoch": 11.09, - "learning_rate": 3.1404195804195802e-06, - "loss": 0.3878, - "step": 12800 - }, - { - "epoch": 11.1, - "learning_rate": 3.1397202797202797e-06, - "loss": 0.4111, - "step": 12810 - }, - { - "epoch": 11.11, - "learning_rate": 3.139020979020979e-06, - "loss": 0.4363, - "step": 12820 - }, - { - "epoch": 11.12, - "learning_rate": 3.1383216783216783e-06, - "loss": 0.4326, - "step": 12830 - }, - { - "epoch": 11.13, - "learning_rate": 3.1376223776223778e-06, - "loss": 0.393, - "step": 12840 - }, - { - "epoch": 11.14, - "learning_rate": 3.1369230769230764e-06, - "loss": 0.4463, - "step": 12850 - }, - { - "epoch": 11.14, - "learning_rate": 3.136223776223776e-06, - "loss": 0.4079, - "step": 12860 - }, - { - "epoch": 11.15, - "learning_rate": 3.1355244755244754e-06, - "loss": 0.4008, - "step": 12870 - }, - { - "epoch": 11.16, - "learning_rate": 3.134825174825175e-06, - "loss": 0.4737, - "step": 12880 - }, - { - "epoch": 11.17, - "learning_rate": 3.134125874125874e-06, - "loss": 0.4459, - "step": 12890 - }, - { - "epoch": 11.18, - "learning_rate": 3.133426573426573e-06, - "loss": 0.4121, - "step": 12900 - }, - { - "epoch": 11.19, - "learning_rate": 3.1327272727272726e-06, - "loss": 0.4312, - "step": 12910 - }, - { - "epoch": 11.2, - "learning_rate": 3.132027972027972e-06, - "loss": 0.3916, - "step": 12920 - }, - { - "epoch": 11.2, - "learning_rate": 3.131328671328671e-06, - "loss": 0.3627, - "step": 12930 - }, - { - "epoch": 11.21, - "learning_rate": 3.1306293706293706e-06, - "loss": 0.4057, - "step": 12940 - }, - { - "epoch": 11.22, - "learning_rate": 3.1299300699300697e-06, - "loss": 0.3761, - "step": 12950 - }, - { - "epoch": 11.23, - "learning_rate": 3.1292307692307688e-06, - "loss": 0.4694, - "step": 12960 - }, - { - "epoch": 11.24, - "learning_rate": 3.1285314685314683e-06, - "loss": 0.3899, - "step": 12970 - }, - { - "epoch": 11.25, - "learning_rate": 3.1278321678321678e-06, - "loss": 0.3499, - "step": 12980 - }, - { - "epoch": 11.26, - "learning_rate": 3.1271328671328673e-06, - "loss": 0.4372, - "step": 12990 - }, - { - "epoch": 11.27, - "learning_rate": 3.1264335664335664e-06, - "loss": 0.4522, - "step": 13000 - }, - { - "epoch": 11.27, - "learning_rate": 3.1257342657342654e-06, - "loss": 0.3943, - "step": 13010 - }, - { - "epoch": 11.28, - "learning_rate": 3.125034965034965e-06, - "loss": 0.3741, - "step": 13020 - }, - { - "epoch": 11.29, - "learning_rate": 3.124335664335664e-06, - "loss": 0.3595, - "step": 13030 - }, - { - "epoch": 11.3, - "learning_rate": 3.1236363636363635e-06, - "loss": 0.4889, - "step": 13040 - }, - { - "epoch": 11.31, - "learning_rate": 3.122937062937063e-06, - "loss": 0.3744, - "step": 13050 - }, - { - "epoch": 11.32, - "learning_rate": 3.122237762237762e-06, - "loss": 0.4061, - "step": 13060 - }, - { - "epoch": 11.33, - "learning_rate": 3.121538461538461e-06, - "loss": 0.4333, - "step": 13070 - }, - { - "epoch": 11.33, - "learning_rate": 3.1208391608391606e-06, - "loss": 0.3838, - "step": 13080 - }, - { - "epoch": 11.34, - "learning_rate": 3.12013986013986e-06, - "loss": 0.4064, - "step": 13090 - }, - { - "epoch": 11.35, - "learning_rate": 3.1194405594405596e-06, - "loss": 0.4572, - "step": 13100 - }, - { - "epoch": 11.36, - "learning_rate": 3.1187412587412583e-06, - "loss": 0.3864, - "step": 13110 - }, - { - "epoch": 11.37, - "learning_rate": 3.1180419580419578e-06, - "loss": 0.4353, - "step": 13120 - }, - { - "epoch": 11.38, - "learning_rate": 3.1173426573426573e-06, - "loss": 0.4305, - "step": 13130 - }, - { - "epoch": 11.39, - "learning_rate": 3.1166433566433563e-06, - "loss": 0.4294, - "step": 13140 - }, - { - "epoch": 11.39, - "learning_rate": 3.115944055944056e-06, - "loss": 0.3242, - "step": 13150 - }, - { - "epoch": 11.4, - "learning_rate": 3.1152447552447553e-06, - "loss": 0.3815, - "step": 13160 - }, - { - "epoch": 11.41, - "learning_rate": 3.1145454545454544e-06, - "loss": 0.3437, - "step": 13170 - }, - { - "epoch": 11.42, - "learning_rate": 3.1138461538461535e-06, - "loss": 0.4029, - "step": 13180 - }, - { - "epoch": 11.43, - "learning_rate": 3.113146853146853e-06, - "loss": 0.4357, - "step": 13190 - }, - { - "epoch": 11.44, - "learning_rate": 3.1124475524475525e-06, - "loss": 0.4073, - "step": 13200 - }, - { - "epoch": 11.45, - "learning_rate": 3.1117482517482516e-06, - "loss": 0.3962, - "step": 13210 - }, - { - "epoch": 11.46, - "learning_rate": 3.1110489510489506e-06, - "loss": 0.3896, - "step": 13220 - }, - { - "epoch": 11.46, - "learning_rate": 3.11034965034965e-06, - "loss": 0.422, - "step": 13230 - }, - { - "epoch": 11.47, - "learning_rate": 3.1096503496503496e-06, - "loss": 0.3918, - "step": 13240 - }, - { - "epoch": 11.48, - "learning_rate": 3.1089510489510487e-06, - "loss": 0.3884, - "step": 13250 - }, - { - "epoch": 11.49, - "learning_rate": 3.108251748251748e-06, - "loss": 0.4256, - "step": 13260 - }, - { - "epoch": 11.5, - "learning_rate": 3.1075524475524477e-06, - "loss": 0.4003, - "step": 13270 - }, - { - "epoch": 11.51, - "learning_rate": 3.1068531468531468e-06, - "loss": 0.3744, - "step": 13280 - }, - { - "epoch": 11.52, - "learning_rate": 3.106153846153846e-06, - "loss": 0.4673, - "step": 13290 - }, - { - "epoch": 11.52, - "learning_rate": 3.1054545454545453e-06, - "loss": 0.473, - "step": 13300 - }, - { - "epoch": 11.53, - "learning_rate": 3.104755244755245e-06, - "loss": 0.3683, - "step": 13310 - }, - { - "epoch": 11.54, - "learning_rate": 3.104055944055944e-06, - "loss": 0.3906, - "step": 13320 - }, - { - "epoch": 11.55, - "learning_rate": 3.103356643356643e-06, - "loss": 0.4705, - "step": 13330 - }, - { - "epoch": 11.56, - "learning_rate": 3.1026573426573425e-06, - "loss": 0.4346, - "step": 13340 - }, - { - "epoch": 11.57, - "learning_rate": 3.101958041958042e-06, - "loss": 0.3415, - "step": 13350 - }, - { - "epoch": 11.58, - "learning_rate": 3.101258741258741e-06, - "loss": 0.3599, - "step": 13360 - }, - { - "epoch": 11.59, - "learning_rate": 3.1005594405594405e-06, - "loss": 0.3877, - "step": 13370 - }, - { - "epoch": 11.59, - "learning_rate": 3.09986013986014e-06, - "loss": 0.4167, - "step": 13380 - }, - { - "epoch": 11.6, - "learning_rate": 3.0991608391608387e-06, - "loss": 0.4292, - "step": 13390 - }, - { - "epoch": 11.61, - "learning_rate": 3.098461538461538e-06, - "loss": 0.4469, - "step": 13400 - }, - { - "epoch": 11.62, - "learning_rate": 3.0977622377622377e-06, - "loss": 0.4273, - "step": 13410 - }, - { - "epoch": 11.63, - "learning_rate": 3.097062937062937e-06, - "loss": 0.3338, - "step": 13420 - }, - { - "epoch": 11.64, - "learning_rate": 3.0963636363636362e-06, - "loss": 0.422, - "step": 13430 - }, - { - "epoch": 11.65, - "learning_rate": 3.0956643356643353e-06, - "loss": 0.4025, - "step": 13440 - }, - { - "epoch": 11.65, - "learning_rate": 3.094965034965035e-06, - "loss": 0.4044, - "step": 13450 - }, - { - "epoch": 11.66, - "learning_rate": 3.0942657342657343e-06, - "loss": 0.4187, - "step": 13460 - }, - { - "epoch": 11.67, - "learning_rate": 3.0935664335664334e-06, - "loss": 0.3947, - "step": 13470 - }, - { - "epoch": 11.68, - "learning_rate": 3.092867132867133e-06, - "loss": 0.3553, - "step": 13480 - }, - { - "epoch": 11.69, - "learning_rate": 3.092167832167832e-06, - "loss": 0.4187, - "step": 13490 - }, - { - "epoch": 11.7, - "learning_rate": 3.091468531468531e-06, - "loss": 0.4666, - "step": 13500 - }, - { - "epoch": 11.71, - "learning_rate": 3.0907692307692305e-06, - "loss": 0.4248, - "step": 13510 - }, - { - "epoch": 11.72, - "learning_rate": 3.09006993006993e-06, - "loss": 0.362, - "step": 13520 - }, - { - "epoch": 11.72, - "learning_rate": 3.0893706293706295e-06, - "loss": 0.4296, - "step": 13530 - }, - { - "epoch": 11.73, - "learning_rate": 3.0886713286713286e-06, - "loss": 0.3882, - "step": 13540 - }, - { - "epoch": 11.74, - "learning_rate": 3.0879720279720277e-06, - "loss": 0.3709, - "step": 13550 - }, - { - "epoch": 11.75, - "learning_rate": 3.087272727272727e-06, - "loss": 0.3679, - "step": 13560 - }, - { - "epoch": 11.76, - "learning_rate": 3.0865734265734262e-06, - "loss": 0.4126, - "step": 13570 - }, - { - "epoch": 11.77, - "learning_rate": 3.0858741258741257e-06, - "loss": 0.4288, - "step": 13580 - }, - { - "epoch": 11.78, - "learning_rate": 3.0851748251748252e-06, - "loss": 0.3786, - "step": 13590 - }, - { - "epoch": 11.78, - "learning_rate": 3.0844755244755243e-06, - "loss": 0.381, - "step": 13600 - }, - { - "epoch": 11.79, - "learning_rate": 3.0837762237762234e-06, - "loss": 0.4091, - "step": 13610 - }, - { - "epoch": 11.8, - "learning_rate": 3.083076923076923e-06, - "loss": 0.3875, - "step": 13620 - }, - { - "epoch": 11.81, - "learning_rate": 3.0823776223776224e-06, - "loss": 0.3907, - "step": 13630 - }, - { - "epoch": 11.82, - "learning_rate": 3.081678321678322e-06, - "loss": 0.3664, - "step": 13640 - }, - { - "epoch": 11.83, - "learning_rate": 3.080979020979021e-06, - "loss": 0.3494, - "step": 13650 - }, - { - "epoch": 11.84, - "learning_rate": 3.08027972027972e-06, - "loss": 0.3899, - "step": 13660 - }, - { - "epoch": 11.85, - "learning_rate": 3.0795804195804195e-06, - "loss": 0.4002, - "step": 13670 - }, - { - "epoch": 11.85, - "learning_rate": 3.0788811188811186e-06, - "loss": 0.5063, - "step": 13680 - }, - { - "epoch": 11.86, - "learning_rate": 3.078181818181818e-06, - "loss": 0.4773, - "step": 13690 - }, - { - "epoch": 11.87, - "learning_rate": 3.0774825174825176e-06, - "loss": 0.3547, - "step": 13700 - }, - { - "epoch": 11.88, - "learning_rate": 3.0767832167832167e-06, - "loss": 0.3995, - "step": 13710 - }, - { - "epoch": 11.89, - "learning_rate": 3.0760839160839157e-06, - "loss": 0.4126, - "step": 13720 - }, - { - "epoch": 11.9, - "learning_rate": 3.0753846153846152e-06, - "loss": 0.3785, - "step": 13730 - }, - { - "epoch": 11.91, - "learning_rate": 3.0746853146853147e-06, - "loss": 0.4024, - "step": 13740 - }, - { - "epoch": 11.91, - "learning_rate": 3.073986013986014e-06, - "loss": 0.3838, - "step": 13750 - }, - { - "epoch": 11.92, - "learning_rate": 3.073286713286713e-06, - "loss": 0.4221, - "step": 13760 - }, - { - "epoch": 11.93, - "learning_rate": 3.0725874125874124e-06, - "loss": 0.4061, - "step": 13770 - }, - { - "epoch": 11.94, - "learning_rate": 3.071888111888112e-06, - "loss": 0.4233, - "step": 13780 - }, - { - "epoch": 11.95, - "learning_rate": 3.071188811188811e-06, - "loss": 0.3744, - "step": 13790 - }, - { - "epoch": 11.96, - "learning_rate": 3.0704895104895104e-06, - "loss": 0.409, - "step": 13800 - }, - { - "epoch": 11.97, - "learning_rate": 3.06979020979021e-06, - "loss": 0.4319, - "step": 13810 - }, - { - "epoch": 11.98, - "learning_rate": 3.0690909090909086e-06, - "loss": 0.4032, - "step": 13820 - }, - { - "epoch": 11.98, - "learning_rate": 3.068391608391608e-06, - "loss": 0.4338, - "step": 13830 - }, - { - "epoch": 11.99, - "learning_rate": 3.0676923076923076e-06, - "loss": 0.3946, - "step": 13840 - }, - { - "epoch": 12.0, - "eval_loss": 0.5525963306427002, - "eval_runtime": 133.5393, - "eval_samples_per_second": 3.984, - "eval_steps_per_second": 1.992, - "eval_wer": 0.26348267660860064, - "step": 13848 - }, - { - "epoch": 12.0, - "learning_rate": 3.066993006993007e-06, - "loss": 0.3896, - "step": 13850 - }, - { - "epoch": 12.01, - "learning_rate": 3.066293706293706e-06, - "loss": 0.4106, - "step": 13860 - }, - { - "epoch": 12.02, - "learning_rate": 3.0655944055944052e-06, - "loss": 0.4001, - "step": 13870 - }, - { - "epoch": 12.03, - "learning_rate": 3.0648951048951047e-06, - "loss": 0.3334, - "step": 13880 - }, - { - "epoch": 12.04, - "learning_rate": 3.0641958041958042e-06, - "loss": 0.3551, - "step": 13890 - }, - { - "epoch": 12.05, - "learning_rate": 3.0634965034965033e-06, - "loss": 0.4169, - "step": 13900 - }, - { - "epoch": 12.05, - "learning_rate": 3.0627972027972028e-06, - "loss": 0.3991, - "step": 13910 - }, - { - "epoch": 12.06, - "learning_rate": 3.0620979020979023e-06, - "loss": 0.4, - "step": 13920 - }, - { - "epoch": 12.07, - "learning_rate": 3.061398601398601e-06, - "loss": 0.4013, - "step": 13930 - }, - { - "epoch": 12.08, - "learning_rate": 3.0606993006993004e-06, - "loss": 0.3758, - "step": 13940 - }, - { - "epoch": 12.09, - "learning_rate": 3.06e-06, - "loss": 0.4109, - "step": 13950 - }, - { - "epoch": 12.1, - "learning_rate": 3.0593006993006994e-06, - "loss": 0.4589, - "step": 13960 - }, - { - "epoch": 12.11, - "learning_rate": 3.0586713286713285e-06, - "loss": 0.4093, - "step": 13970 - }, - { - "epoch": 12.11, - "learning_rate": 3.057972027972028e-06, - "loss": 0.422, - "step": 13980 - }, - { - "epoch": 12.12, - "learning_rate": 3.057272727272727e-06, - "loss": 0.4142, - "step": 13990 - }, - { - "epoch": 12.13, - "learning_rate": 3.0565734265734265e-06, - "loss": 0.394, - "step": 14000 - }, - { - "epoch": 12.14, - "learning_rate": 3.055874125874126e-06, - "loss": 0.4007, - "step": 14010 - }, - { - "epoch": 12.15, - "learning_rate": 3.0551748251748247e-06, - "loss": 0.3457, - "step": 14020 - }, - { - "epoch": 12.16, - "learning_rate": 3.054475524475524e-06, - "loss": 0.3427, - "step": 14030 - }, - { - "epoch": 12.17, - "learning_rate": 3.0537762237762237e-06, - "loss": 0.4197, - "step": 14040 - }, - { - "epoch": 12.17, - "learning_rate": 3.053076923076923e-06, - "loss": 0.3985, - "step": 14050 - }, - { - "epoch": 12.18, - "learning_rate": 3.0523776223776222e-06, - "loss": 0.3557, - "step": 14060 - }, - { - "epoch": 12.19, - "learning_rate": 3.0516783216783213e-06, - "loss": 0.389, - "step": 14070 - }, - { - "epoch": 12.2, - "learning_rate": 3.050979020979021e-06, - "loss": 0.4019, - "step": 14080 - }, - { - "epoch": 12.21, - "learning_rate": 3.0502797202797203e-06, - "loss": 0.3896, - "step": 14090 - }, - { - "epoch": 12.22, - "learning_rate": 3.0495804195804194e-06, - "loss": 0.3969, - "step": 14100 - }, - { - "epoch": 12.23, - "learning_rate": 3.048881118881119e-06, - "loss": 0.3983, - "step": 14110 - }, - { - "epoch": 12.24, - "learning_rate": 3.0481818181818184e-06, - "loss": 0.3853, - "step": 14120 - }, - { - "epoch": 12.24, - "learning_rate": 3.047482517482517e-06, - "loss": 0.405, - "step": 14130 - }, - { - "epoch": 12.25, - "learning_rate": 3.0467832167832165e-06, - "loss": 0.4416, - "step": 14140 - }, - { - "epoch": 12.26, - "learning_rate": 3.046083916083916e-06, - "loss": 0.4443, - "step": 14150 - }, - { - "epoch": 12.27, - "learning_rate": 3.0453846153846155e-06, - "loss": 0.4276, - "step": 14160 - }, - { - "epoch": 12.28, - "learning_rate": 3.0446853146853146e-06, - "loss": 0.3815, - "step": 14170 - }, - { - "epoch": 12.29, - "learning_rate": 3.0439860139860137e-06, - "loss": 0.3975, - "step": 14180 - }, - { - "epoch": 12.3, - "learning_rate": 3.043286713286713e-06, - "loss": 0.4268, - "step": 14190 - }, - { - "epoch": 12.3, - "learning_rate": 3.0425874125874122e-06, - "loss": 0.3851, - "step": 14200 - }, - { - "epoch": 12.31, - "learning_rate": 3.0418881118881117e-06, - "loss": 0.4057, - "step": 14210 - }, - { - "epoch": 12.32, - "learning_rate": 3.0411888111888112e-06, - "loss": 0.407, - "step": 14220 - }, - { - "epoch": 12.33, - "learning_rate": 3.0404895104895107e-06, - "loss": 0.4224, - "step": 14230 - }, - { - "epoch": 12.34, - "learning_rate": 3.0397902097902094e-06, - "loss": 0.4311, - "step": 14240 - }, - { - "epoch": 12.35, - "learning_rate": 3.039090909090909e-06, - "loss": 0.4162, - "step": 14250 - }, - { - "epoch": 12.36, - "learning_rate": 3.0383916083916084e-06, - "loss": 0.4437, - "step": 14260 - }, - { - "epoch": 12.37, - "learning_rate": 3.037692307692308e-06, - "loss": 0.4052, - "step": 14270 - }, - { - "epoch": 12.37, - "learning_rate": 3.036993006993007e-06, - "loss": 0.3864, - "step": 14280 - }, - { - "epoch": 12.38, - "learning_rate": 3.036293706293706e-06, - "loss": 0.4052, - "step": 14290 - }, - { - "epoch": 12.39, - "learning_rate": 3.0355944055944055e-06, - "loss": 0.3948, - "step": 14300 - }, - { - "epoch": 12.4, - "learning_rate": 3.0348951048951046e-06, - "loss": 0.4039, - "step": 14310 - }, - { - "epoch": 12.41, - "learning_rate": 3.034195804195804e-06, - "loss": 0.3865, - "step": 14320 - }, - { - "epoch": 12.42, - "learning_rate": 3.0334965034965036e-06, - "loss": 0.3794, - "step": 14330 - }, - { - "epoch": 12.43, - "learning_rate": 3.0327972027972026e-06, - "loss": 0.4173, - "step": 14340 - }, - { - "epoch": 12.43, - "learning_rate": 3.0320979020979017e-06, - "loss": 0.4037, - "step": 14350 - }, - { - "epoch": 12.44, - "learning_rate": 3.0313986013986012e-06, - "loss": 0.4497, - "step": 14360 - }, - { - "epoch": 12.45, - "learning_rate": 3.0306993006993007e-06, - "loss": 0.4244, - "step": 14370 - }, - { - "epoch": 12.46, - "learning_rate": 3.03e-06, - "loss": 0.3988, - "step": 14380 - }, - { - "epoch": 12.47, - "learning_rate": 3.0293006993006993e-06, - "loss": 0.4545, - "step": 14390 - }, - { - "epoch": 12.48, - "learning_rate": 3.0286013986013984e-06, - "loss": 0.5355, - "step": 14400 - }, - { - "epoch": 12.49, - "learning_rate": 3.027902097902098e-06, - "loss": 0.3757, - "step": 14410 - }, - { - "epoch": 12.5, - "learning_rate": 3.027202797202797e-06, - "loss": 0.3856, - "step": 14420 - }, - { - "epoch": 12.5, - "learning_rate": 3.0265034965034964e-06, - "loss": 0.4305, - "step": 14430 - }, - { - "epoch": 12.51, - "learning_rate": 3.025804195804196e-06, - "loss": 0.4123, - "step": 14440 - }, - { - "epoch": 12.52, - "learning_rate": 3.0251048951048946e-06, - "loss": 0.3745, - "step": 14450 - }, - { - "epoch": 12.53, - "learning_rate": 3.024405594405594e-06, - "loss": 0.357, - "step": 14460 - }, - { - "epoch": 12.54, - "learning_rate": 3.0237062937062936e-06, - "loss": 0.3626, - "step": 14470 - }, - { - "epoch": 12.55, - "learning_rate": 3.023006993006993e-06, - "loss": 0.3647, - "step": 14480 - }, - { - "epoch": 12.56, - "learning_rate": 3.022307692307692e-06, - "loss": 0.3769, - "step": 14490 - }, - { - "epoch": 12.56, - "learning_rate": 3.0216083916083916e-06, - "loss": 0.4741, - "step": 14500 - }, - { - "epoch": 12.57, - "learning_rate": 3.0209090909090907e-06, - "loss": 0.3898, - "step": 14510 - }, - { - "epoch": 12.58, - "learning_rate": 3.02020979020979e-06, - "loss": 0.3792, - "step": 14520 - }, - { - "epoch": 12.59, - "learning_rate": 3.0195104895104893e-06, - "loss": 0.3776, - "step": 14530 - }, - { - "epoch": 12.6, - "learning_rate": 3.0188111888111888e-06, - "loss": 0.4141, - "step": 14540 - }, - { - "epoch": 12.61, - "learning_rate": 3.0181118881118883e-06, - "loss": 0.3948, - "step": 14550 - }, - { - "epoch": 12.62, - "learning_rate": 3.017412587412587e-06, - "loss": 0.3601, - "step": 14560 - }, - { - "epoch": 12.63, - "learning_rate": 3.0167132867132864e-06, - "loss": 0.4267, - "step": 14570 - }, - { - "epoch": 12.63, - "learning_rate": 3.016013986013986e-06, - "loss": 0.4611, - "step": 14580 - }, - { - "epoch": 12.64, - "learning_rate": 3.0153146853146854e-06, - "loss": 0.4253, - "step": 14590 - }, - { - "epoch": 12.65, - "learning_rate": 3.0146153846153845e-06, - "loss": 0.4089, - "step": 14600 - }, - { - "epoch": 12.66, - "learning_rate": 3.0139160839160836e-06, - "loss": 0.3613, - "step": 14610 - }, - { - "epoch": 12.67, - "learning_rate": 3.013216783216783e-06, - "loss": 0.3582, - "step": 14620 - }, - { - "epoch": 12.68, - "learning_rate": 3.012517482517482e-06, - "loss": 0.3913, - "step": 14630 - }, - { - "epoch": 12.69, - "learning_rate": 3.0118181818181816e-06, - "loss": 0.4095, - "step": 14640 - }, - { - "epoch": 12.69, - "learning_rate": 3.011118881118881e-06, - "loss": 0.3807, - "step": 14650 - }, - { - "epoch": 12.7, - "learning_rate": 3.0104195804195806e-06, - "loss": 0.4255, - "step": 14660 - }, - { - "epoch": 12.71, - "learning_rate": 3.0097202797202793e-06, - "loss": 0.385, - "step": 14670 - }, - { - "epoch": 12.72, - "learning_rate": 3.0090209790209788e-06, - "loss": 0.3581, - "step": 14680 - }, - { - "epoch": 12.73, - "learning_rate": 3.0083216783216783e-06, - "loss": 0.407, - "step": 14690 - }, - { - "epoch": 12.74, - "learning_rate": 3.0076223776223778e-06, - "loss": 0.4068, - "step": 14700 - }, - { - "epoch": 12.75, - "learning_rate": 3.006923076923077e-06, - "loss": 0.4436, - "step": 14710 - }, - { - "epoch": 12.76, - "learning_rate": 3.006223776223776e-06, - "loss": 0.3818, - "step": 14720 - }, - { - "epoch": 12.76, - "learning_rate": 3.0055244755244754e-06, - "loss": 0.3307, - "step": 14730 - }, - { - "epoch": 12.77, - "learning_rate": 3.0048251748251745e-06, - "loss": 0.4024, - "step": 14740 - }, - { - "epoch": 12.78, - "learning_rate": 3.004125874125874e-06, - "loss": 0.4657, - "step": 14750 - }, - { - "epoch": 12.79, - "learning_rate": 3.0034265734265735e-06, - "loss": 0.4503, - "step": 14760 - }, - { - "epoch": 12.8, - "learning_rate": 3.002727272727273e-06, - "loss": 0.3551, - "step": 14770 - }, - { - "epoch": 12.81, - "learning_rate": 3.0020279720279716e-06, - "loss": 0.4221, - "step": 14780 - }, - { - "epoch": 12.82, - "learning_rate": 3.001328671328671e-06, - "loss": 0.3889, - "step": 14790 - }, - { - "epoch": 12.82, - "learning_rate": 3.0006293706293706e-06, - "loss": 0.3709, - "step": 14800 - }, - { - "epoch": 12.83, - "learning_rate": 2.9999300699300697e-06, - "loss": 0.4108, - "step": 14810 - }, - { - "epoch": 12.84, - "learning_rate": 2.999230769230769e-06, - "loss": 0.402, - "step": 14820 - }, - { - "epoch": 12.85, - "learning_rate": 2.9985314685314683e-06, - "loss": 0.3713, - "step": 14830 - }, - { - "epoch": 12.86, - "learning_rate": 2.9978321678321678e-06, - "loss": 0.4058, - "step": 14840 - }, - { - "epoch": 12.87, - "learning_rate": 2.997132867132867e-06, - "loss": 0.3828, - "step": 14850 - }, - { - "epoch": 12.88, - "learning_rate": 2.9964335664335663e-06, - "loss": 0.3566, - "step": 14860 - }, - { - "epoch": 12.89, - "learning_rate": 2.995734265734266e-06, - "loss": 0.3908, - "step": 14870 - }, - { - "epoch": 12.89, - "learning_rate": 2.9950349650349653e-06, - "loss": 0.4369, - "step": 14880 - }, - { - "epoch": 12.9, - "learning_rate": 2.994335664335664e-06, - "loss": 0.4022, - "step": 14890 - }, - { - "epoch": 12.91, - "learning_rate": 2.9936363636363635e-06, - "loss": 0.4866, - "step": 14900 - }, - { - "epoch": 12.92, - "learning_rate": 2.992937062937063e-06, - "loss": 0.4089, - "step": 14910 - }, - { - "epoch": 12.93, - "learning_rate": 2.992237762237762e-06, - "loss": 0.3921, - "step": 14920 - }, - { - "epoch": 12.94, - "learning_rate": 2.9915384615384615e-06, - "loss": 0.4111, - "step": 14930 - }, - { - "epoch": 12.95, - "learning_rate": 2.9908391608391606e-06, - "loss": 0.3707, - "step": 14940 - }, - { - "epoch": 12.95, - "learning_rate": 2.99013986013986e-06, - "loss": 0.5013, - "step": 14950 - }, - { - "epoch": 12.96, - "learning_rate": 2.989440559440559e-06, - "loss": 0.4334, - "step": 14960 - }, - { - "epoch": 12.97, - "learning_rate": 2.9887412587412587e-06, - "loss": 0.4315, - "step": 14970 - }, - { - "epoch": 12.98, - "learning_rate": 2.988041958041958e-06, - "loss": 0.382, - "step": 14980 - }, - { - "epoch": 12.99, - "learning_rate": 2.987342657342657e-06, - "loss": 0.3887, - "step": 14990 - }, - { - "epoch": 13.0, - "learning_rate": 2.9866433566433563e-06, - "loss": 0.3722, - "step": 15000 - }, - { - "epoch": 13.0, - "eval_loss": 0.5786426663398743, - "eval_runtime": 133.9404, - "eval_samples_per_second": 3.972, - "eval_steps_per_second": 1.986, - "eval_wer": 0.25654046409976217, - "step": 15002 - }, - { - "epoch": 13.01, - "learning_rate": 2.985944055944056e-06, - "loss": 0.3685, - "step": 15010 - }, - { - "epoch": 13.02, - "learning_rate": 2.9852447552447553e-06, - "loss": 0.3702, - "step": 15020 - }, - { - "epoch": 13.02, - "learning_rate": 2.9845454545454544e-06, - "loss": 0.3794, - "step": 15030 - }, - { - "epoch": 13.03, - "learning_rate": 2.983846153846154e-06, - "loss": 0.3762, - "step": 15040 - }, - { - "epoch": 13.04, - "learning_rate": 2.983146853146853e-06, - "loss": 0.4761, - "step": 15050 - }, - { - "epoch": 13.05, - "learning_rate": 2.9824475524475525e-06, - "loss": 0.401, - "step": 15060 - }, - { - "epoch": 13.06, - "learning_rate": 2.9817482517482515e-06, - "loss": 0.4142, - "step": 15070 - }, - { - "epoch": 13.07, - "learning_rate": 2.981048951048951e-06, - "loss": 0.3326, - "step": 15080 - }, - { - "epoch": 13.08, - "learning_rate": 2.9803496503496505e-06, - "loss": 0.3793, - "step": 15090 - }, - { - "epoch": 13.08, - "learning_rate": 2.979650349650349e-06, - "loss": 0.3986, - "step": 15100 - }, - { - "epoch": 13.09, - "learning_rate": 2.9789510489510487e-06, - "loss": 0.3771, - "step": 15110 - }, - { - "epoch": 13.1, - "learning_rate": 2.978251748251748e-06, - "loss": 0.3902, - "step": 15120 - }, - { - "epoch": 13.11, - "learning_rate": 2.9775524475524477e-06, - "loss": 0.3795, - "step": 15130 - }, - { - "epoch": 13.12, - "learning_rate": 2.9768531468531467e-06, - "loss": 0.4201, - "step": 15140 - }, - { - "epoch": 13.13, - "learning_rate": 2.976153846153846e-06, - "loss": 0.409, - "step": 15150 - }, - { - "epoch": 13.14, - "learning_rate": 2.9754545454545453e-06, - "loss": 0.4454, - "step": 15160 - }, - { - "epoch": 13.15, - "learning_rate": 2.9747552447552444e-06, - "loss": 0.44, - "step": 15170 - }, - { - "epoch": 13.15, - "learning_rate": 2.974055944055944e-06, - "loss": 0.413, - "step": 15180 - }, - { - "epoch": 13.16, - "learning_rate": 2.9733566433566434e-06, - "loss": 0.3937, - "step": 15190 - }, - { - "epoch": 13.17, - "learning_rate": 2.972657342657343e-06, - "loss": 0.3827, - "step": 15200 - }, - { - "epoch": 13.18, - "learning_rate": 2.9719580419580415e-06, - "loss": 0.3791, - "step": 15210 - }, - { - "epoch": 13.19, - "learning_rate": 2.971258741258741e-06, - "loss": 0.3759, - "step": 15220 - }, - { - "epoch": 13.2, - "learning_rate": 2.9705594405594405e-06, - "loss": 0.3828, - "step": 15230 - }, - { - "epoch": 13.21, - "learning_rate": 2.96986013986014e-06, - "loss": 0.3988, - "step": 15240 - }, - { - "epoch": 13.21, - "learning_rate": 2.969160839160839e-06, - "loss": 0.4248, - "step": 15250 - }, - { - "epoch": 13.22, - "learning_rate": 2.968461538461538e-06, - "loss": 0.472, - "step": 15260 - }, - { - "epoch": 13.23, - "learning_rate": 2.9677622377622377e-06, - "loss": 0.3754, - "step": 15270 - }, - { - "epoch": 13.24, - "learning_rate": 2.9670629370629367e-06, - "loss": 0.3814, - "step": 15280 - }, - { - "epoch": 13.25, - "learning_rate": 2.9663636363636362e-06, - "loss": 0.4308, - "step": 15290 - }, - { - "epoch": 13.26, - "learning_rate": 2.9656643356643357e-06, - "loss": 0.3784, - "step": 15300 - }, - { - "epoch": 13.27, - "learning_rate": 2.9649650349650352e-06, - "loss": 0.435, - "step": 15310 - }, - { - "epoch": 13.28, - "learning_rate": 2.964265734265734e-06, - "loss": 0.4053, - "step": 15320 - }, - { - "epoch": 13.28, - "learning_rate": 2.9635664335664334e-06, - "loss": 0.4048, - "step": 15330 - }, - { - "epoch": 13.29, - "learning_rate": 2.962867132867133e-06, - "loss": 0.4112, - "step": 15340 - }, - { - "epoch": 13.3, - "learning_rate": 2.962167832167832e-06, - "loss": 0.3558, - "step": 15350 - }, - { - "epoch": 13.31, - "learning_rate": 2.9614685314685314e-06, - "loss": 0.4515, - "step": 15360 - }, - { - "epoch": 13.32, - "learning_rate": 2.9607692307692305e-06, - "loss": 0.3856, - "step": 15370 - }, - { - "epoch": 13.33, - "learning_rate": 2.96006993006993e-06, - "loss": 0.3782, - "step": 15380 - }, - { - "epoch": 13.34, - "learning_rate": 2.959370629370629e-06, - "loss": 0.4126, - "step": 15390 - }, - { - "epoch": 13.34, - "learning_rate": 2.9586713286713286e-06, - "loss": 0.3945, - "step": 15400 - }, - { - "epoch": 13.35, - "learning_rate": 2.957972027972028e-06, - "loss": 0.4101, - "step": 15410 - }, - { - "epoch": 13.36, - "learning_rate": 2.9572727272727267e-06, - "loss": 0.4763, - "step": 15420 - }, - { - "epoch": 13.37, - "learning_rate": 2.9565734265734262e-06, - "loss": 0.3442, - "step": 15430 - }, - { - "epoch": 13.38, - "learning_rate": 2.9558741258741257e-06, - "loss": 0.3997, - "step": 15440 - }, - { - "epoch": 13.39, - "learning_rate": 2.955174825174825e-06, - "loss": 0.4133, - "step": 15450 - }, - { - "epoch": 13.4, - "learning_rate": 2.9544755244755243e-06, - "loss": 0.4239, - "step": 15460 - }, - { - "epoch": 13.41, - "learning_rate": 2.9537762237762238e-06, - "loss": 0.4066, - "step": 15470 - }, - { - "epoch": 13.41, - "learning_rate": 2.953076923076923e-06, - "loss": 0.3706, - "step": 15480 - }, - { - "epoch": 13.42, - "learning_rate": 2.9523776223776223e-06, - "loss": 0.3928, - "step": 15490 - }, - { - "epoch": 13.43, - "learning_rate": 2.9516783216783214e-06, - "loss": 0.4208, - "step": 15500 - }, - { - "epoch": 13.44, - "learning_rate": 2.950979020979021e-06, - "loss": 0.4563, - "step": 15510 - }, - { - "epoch": 13.45, - "learning_rate": 2.9502797202797204e-06, - "loss": 0.4204, - "step": 15520 - }, - { - "epoch": 13.46, - "learning_rate": 2.949580419580419e-06, - "loss": 0.3688, - "step": 15530 - }, - { - "epoch": 13.47, - "learning_rate": 2.9488811188811186e-06, - "loss": 0.478, - "step": 15540 - }, - { - "epoch": 13.47, - "learning_rate": 2.948181818181818e-06, - "loss": 0.4186, - "step": 15550 - }, - { - "epoch": 13.48, - "learning_rate": 2.9474825174825176e-06, - "loss": 0.3855, - "step": 15560 - }, - { - "epoch": 13.49, - "learning_rate": 2.9467832167832166e-06, - "loss": 0.4161, - "step": 15570 - }, - { - "epoch": 13.5, - "learning_rate": 2.946083916083916e-06, - "loss": 0.3894, - "step": 15580 - }, - { - "epoch": 13.51, - "learning_rate": 2.945384615384615e-06, - "loss": 0.4233, - "step": 15590 - }, - { - "epoch": 13.52, - "learning_rate": 2.9446853146853143e-06, - "loss": 0.504, - "step": 15600 - }, - { - "epoch": 13.53, - "learning_rate": 2.9439860139860138e-06, - "loss": 0.4012, - "step": 15610 - }, - { - "epoch": 13.54, - "learning_rate": 2.9432867132867133e-06, - "loss": 0.3991, - "step": 15620 - }, - { - "epoch": 13.54, - "learning_rate": 2.9425874125874128e-06, - "loss": 0.4202, - "step": 15630 - }, - { - "epoch": 13.55, - "learning_rate": 2.9418881118881114e-06, - "loss": 0.4122, - "step": 15640 - }, - { - "epoch": 13.56, - "learning_rate": 2.941188811188811e-06, - "loss": 0.4015, - "step": 15650 - }, - { - "epoch": 13.57, - "learning_rate": 2.9404895104895104e-06, - "loss": 0.4611, - "step": 15660 - }, - { - "epoch": 13.58, - "learning_rate": 2.93979020979021e-06, - "loss": 0.3858, - "step": 15670 - }, - { - "epoch": 13.59, - "learning_rate": 2.939090909090909e-06, - "loss": 0.3611, - "step": 15680 - }, - { - "epoch": 13.6, - "learning_rate": 2.9383916083916085e-06, - "loss": 0.4195, - "step": 15690 - }, - { - "epoch": 13.6, - "learning_rate": 2.9376923076923076e-06, - "loss": 0.4241, - "step": 15700 - }, - { - "epoch": 13.61, - "learning_rate": 2.9369930069930066e-06, - "loss": 0.3334, - "step": 15710 - }, - { - "epoch": 13.62, - "learning_rate": 2.936293706293706e-06, - "loss": 0.3701, - "step": 15720 - }, - { - "epoch": 13.63, - "learning_rate": 2.9355944055944056e-06, - "loss": 0.4322, - "step": 15730 - }, - { - "epoch": 13.64, - "learning_rate": 2.934895104895105e-06, - "loss": 0.4141, - "step": 15740 - }, - { - "epoch": 13.65, - "learning_rate": 2.9341958041958038e-06, - "loss": 0.3971, - "step": 15750 - }, - { - "epoch": 13.66, - "learning_rate": 2.9334965034965033e-06, - "loss": 0.368, - "step": 15760 - }, - { - "epoch": 13.67, - "learning_rate": 2.9327972027972028e-06, - "loss": 0.328, - "step": 15770 - }, - { - "epoch": 13.67, - "learning_rate": 2.932097902097902e-06, - "loss": 0.3849, - "step": 15780 - }, - { - "epoch": 13.68, - "learning_rate": 2.9313986013986013e-06, - "loss": 0.4378, - "step": 15790 - }, - { - "epoch": 13.69, - "learning_rate": 2.9306993006993004e-06, - "loss": 0.3931, - "step": 15800 - }, - { - "epoch": 13.7, - "learning_rate": 2.93e-06, - "loss": 0.3739, - "step": 15810 - }, - { - "epoch": 13.71, - "learning_rate": 2.929300699300699e-06, - "loss": 0.3899, - "step": 15820 - }, - { - "epoch": 13.72, - "learning_rate": 2.9286013986013985e-06, - "loss": 0.4047, - "step": 15830 - }, - { - "epoch": 13.73, - "learning_rate": 2.927902097902098e-06, - "loss": 0.4169, - "step": 15840 - }, - { - "epoch": 13.73, - "learning_rate": 2.9272027972027975e-06, - "loss": 0.4546, - "step": 15850 - }, - { - "epoch": 13.74, - "learning_rate": 2.926503496503496e-06, - "loss": 0.3633, - "step": 15860 - }, - { - "epoch": 13.75, - "learning_rate": 2.9258041958041956e-06, - "loss": 0.4205, - "step": 15870 - }, - { - "epoch": 13.76, - "learning_rate": 2.925104895104895e-06, - "loss": 0.4143, - "step": 15880 - }, - { - "epoch": 13.77, - "learning_rate": 2.924405594405594e-06, - "loss": 0.3766, - "step": 15890 - }, - { - "epoch": 13.78, - "learning_rate": 2.9237062937062937e-06, - "loss": 0.4132, - "step": 15900 - }, - { - "epoch": 13.79, - "learning_rate": 2.9230069930069928e-06, - "loss": 0.4101, - "step": 15910 - }, - { - "epoch": 13.8, - "learning_rate": 2.9223076923076922e-06, - "loss": 0.4221, - "step": 15920 - }, - { - "epoch": 13.8, - "learning_rate": 2.9216083916083913e-06, - "loss": 0.3648, - "step": 15930 - }, - { - "epoch": 13.81, - "learning_rate": 2.920909090909091e-06, - "loss": 0.4157, - "step": 15940 - }, - { - "epoch": 13.82, - "learning_rate": 2.9202097902097903e-06, - "loss": 0.4349, - "step": 15950 - }, - { - "epoch": 13.83, - "learning_rate": 2.919510489510489e-06, - "loss": 0.4585, - "step": 15960 - }, - { - "epoch": 13.84, - "learning_rate": 2.9188111888111885e-06, - "loss": 0.4467, - "step": 15970 - }, - { - "epoch": 13.85, - "learning_rate": 2.918111888111888e-06, - "loss": 0.3707, - "step": 15980 - }, - { - "epoch": 13.86, - "learning_rate": 2.9174125874125875e-06, - "loss": 0.4144, - "step": 15990 - }, - { - "epoch": 13.86, - "learning_rate": 2.9167132867132865e-06, - "loss": 0.4674, - "step": 16000 - }, - { - "epoch": 13.87, - "learning_rate": 2.916013986013986e-06, - "loss": 0.4244, - "step": 16010 - }, - { - "epoch": 13.88, - "learning_rate": 2.915314685314685e-06, - "loss": 0.3754, - "step": 16020 - }, - { - "epoch": 13.89, - "learning_rate": 2.9146153846153846e-06, - "loss": 0.3857, - "step": 16030 - }, - { - "epoch": 13.9, - "learning_rate": 2.9139160839160837e-06, - "loss": 0.3695, - "step": 16040 - }, - { - "epoch": 13.91, - "learning_rate": 2.913216783216783e-06, - "loss": 0.4657, - "step": 16050 - }, - { - "epoch": 13.92, - "learning_rate": 2.9125174825174827e-06, - "loss": 0.4059, - "step": 16060 - }, - { - "epoch": 13.93, - "learning_rate": 2.9118181818181813e-06, - "loss": 0.442, - "step": 16070 - }, - { - "epoch": 13.93, - "learning_rate": 2.911118881118881e-06, - "loss": 0.3858, - "step": 16080 - }, - { - "epoch": 13.94, - "learning_rate": 2.9104195804195803e-06, - "loss": 0.4101, - "step": 16090 - }, - { - "epoch": 13.95, - "learning_rate": 2.90972027972028e-06, - "loss": 0.4026, - "step": 16100 - }, - { - "epoch": 13.96, - "learning_rate": 2.909020979020979e-06, - "loss": 0.3701, - "step": 16110 - }, - { - "epoch": 13.97, - "learning_rate": 2.9083216783216784e-06, - "loss": 0.4064, - "step": 16120 - }, - { - "epoch": 13.98, - "learning_rate": 2.9076223776223774e-06, - "loss": 0.4078, - "step": 16130 - }, - { - "epoch": 13.99, - "learning_rate": 2.9069230769230765e-06, - "loss": 0.3893, - "step": 16140 - }, - { - "epoch": 13.99, - "learning_rate": 2.906223776223776e-06, - "loss": 0.3558, - "step": 16150 - }, - { - "epoch": 14.0, - "eval_loss": 0.5589486360549927, - "eval_runtime": 132.8357, - "eval_samples_per_second": 4.005, - "eval_steps_per_second": 2.002, - "eval_wer": 0.26380407533586164, - "step": 16156 - }, - { - "epoch": 14.0, - "learning_rate": 2.9055244755244755e-06, - "loss": 0.4281, - "step": 16160 - }, - { - "epoch": 14.01, - "learning_rate": 2.904825174825175e-06, - "loss": 0.4123, - "step": 16170 - }, - { - "epoch": 14.02, - "learning_rate": 2.9041258741258737e-06, - "loss": 0.3568, - "step": 16180 - }, - { - "epoch": 14.03, - "learning_rate": 2.903426573426573e-06, - "loss": 0.3891, - "step": 16190 - }, - { - "epoch": 14.04, - "learning_rate": 2.9027272727272727e-06, - "loss": 0.4301, - "step": 16200 - }, - { - "epoch": 14.05, - "learning_rate": 2.902027972027972e-06, - "loss": 0.4633, - "step": 16210 - }, - { - "epoch": 14.06, - "learning_rate": 2.9013286713286712e-06, - "loss": 0.3918, - "step": 16220 - }, - { - "epoch": 14.06, - "learning_rate": 2.9006293706293707e-06, - "loss": 0.3432, - "step": 16230 - }, - { - "epoch": 14.07, - "learning_rate": 2.89993006993007e-06, - "loss": 0.4055, - "step": 16240 - }, - { - "epoch": 14.08, - "learning_rate": 2.899230769230769e-06, - "loss": 0.3804, - "step": 16250 - }, - { - "epoch": 14.09, - "learning_rate": 2.8985314685314684e-06, - "loss": 0.4274, - "step": 16260 - }, - { - "epoch": 14.1, - "learning_rate": 2.897832167832168e-06, - "loss": 0.4067, - "step": 16270 - }, - { - "epoch": 14.11, - "learning_rate": 2.8971328671328674e-06, - "loss": 0.3626, - "step": 16280 - }, - { - "epoch": 14.12, - "learning_rate": 2.896433566433566e-06, - "loss": 0.3951, - "step": 16290 - }, - { - "epoch": 14.12, - "learning_rate": 2.8957342657342655e-06, - "loss": 0.401, - "step": 16300 - }, - { - "epoch": 14.13, - "learning_rate": 2.895034965034965e-06, - "loss": 0.4691, - "step": 16310 - }, - { - "epoch": 14.14, - "learning_rate": 2.894335664335664e-06, - "loss": 0.3822, - "step": 16320 - }, - { - "epoch": 14.15, - "learning_rate": 2.8936363636363636e-06, - "loss": 0.4677, - "step": 16330 - }, - { - "epoch": 14.16, - "learning_rate": 2.8929370629370626e-06, - "loss": 0.3749, - "step": 16340 - }, - { - "epoch": 14.17, - "learning_rate": 2.892237762237762e-06, - "loss": 0.3705, - "step": 16350 - }, - { - "epoch": 14.18, - "learning_rate": 2.8915384615384612e-06, - "loss": 0.4783, - "step": 16360 - }, - { - "epoch": 14.19, - "learning_rate": 2.8908391608391607e-06, - "loss": 0.4133, - "step": 16370 - }, - { - "epoch": 14.19, - "learning_rate": 2.8901398601398602e-06, - "loss": 0.4054, - "step": 16380 - }, - { - "epoch": 14.2, - "learning_rate": 2.8894405594405593e-06, - "loss": 0.4013, - "step": 16390 - }, - { - "epoch": 14.21, - "learning_rate": 2.8887412587412584e-06, - "loss": 0.4116, - "step": 16400 - }, - { - "epoch": 14.22, - "learning_rate": 2.888041958041958e-06, - "loss": 0.3836, - "step": 16410 - }, - { - "epoch": 14.23, - "learning_rate": 2.8873426573426574e-06, - "loss": 0.372, - "step": 16420 - }, - { - "epoch": 14.24, - "learning_rate": 2.8866433566433564e-06, - "loss": 0.3784, - "step": 16430 - }, - { - "epoch": 14.25, - "learning_rate": 2.885944055944056e-06, - "loss": 0.36, - "step": 16440 - }, - { - "epoch": 14.25, - "learning_rate": 2.885244755244755e-06, - "loss": 0.3712, - "step": 16450 - }, - { - "epoch": 14.26, - "learning_rate": 2.8845454545454545e-06, - "loss": 0.4185, - "step": 16460 - }, - { - "epoch": 14.27, - "learning_rate": 2.8838461538461536e-06, - "loss": 0.4046, - "step": 16470 - }, - { - "epoch": 14.28, - "learning_rate": 2.883146853146853e-06, - "loss": 0.3876, - "step": 16480 - }, - { - "epoch": 14.29, - "learning_rate": 2.8824475524475526e-06, - "loss": 0.4056, - "step": 16490 - }, - { - "epoch": 14.3, - "learning_rate": 2.8817482517482516e-06, - "loss": 0.3989, - "step": 16500 - }, - { - "epoch": 14.31, - "learning_rate": 2.8810489510489507e-06, - "loss": 0.3513, - "step": 16510 - }, - { - "epoch": 14.32, - "learning_rate": 2.88034965034965e-06, - "loss": 0.3871, - "step": 16520 - }, - { - "epoch": 14.32, - "learning_rate": 2.8796503496503497e-06, - "loss": 0.4363, - "step": 16530 - }, - { - "epoch": 14.33, - "learning_rate": 2.8789510489510488e-06, - "loss": 0.4149, - "step": 16540 - }, - { - "epoch": 14.34, - "learning_rate": 2.8782517482517483e-06, - "loss": 0.3772, - "step": 16550 - }, - { - "epoch": 14.35, - "learning_rate": 2.8775524475524473e-06, - "loss": 0.4088, - "step": 16560 - }, - { - "epoch": 14.36, - "learning_rate": 2.8768531468531464e-06, - "loss": 0.3692, - "step": 16570 - }, - { - "epoch": 14.37, - "learning_rate": 2.876153846153846e-06, - "loss": 0.4181, - "step": 16580 - }, - { - "epoch": 14.38, - "learning_rate": 2.8754545454545454e-06, - "loss": 0.4705, - "step": 16590 - }, - { - "epoch": 14.38, - "learning_rate": 2.874755244755245e-06, - "loss": 0.3912, - "step": 16600 - }, - { - "epoch": 14.39, - "learning_rate": 2.8740559440559436e-06, - "loss": 0.3983, - "step": 16610 - }, - { - "epoch": 14.4, - "learning_rate": 2.873356643356643e-06, - "loss": 0.4027, - "step": 16620 - }, - { - "epoch": 14.41, - "learning_rate": 2.8726573426573426e-06, - "loss": 0.3157, - "step": 16630 - }, - { - "epoch": 14.42, - "learning_rate": 2.871958041958042e-06, - "loss": 0.4119, - "step": 16640 - }, - { - "epoch": 14.43, - "learning_rate": 2.871258741258741e-06, - "loss": 0.3853, - "step": 16650 - }, - { - "epoch": 14.44, - "learning_rate": 2.8705594405594406e-06, - "loss": 0.3858, - "step": 16660 - }, - { - "epoch": 14.45, - "learning_rate": 2.8698601398601397e-06, - "loss": 0.3623, - "step": 16670 - }, - { - "epoch": 14.45, - "learning_rate": 2.8691608391608388e-06, - "loss": 0.3513, - "step": 16680 - }, - { - "epoch": 14.46, - "learning_rate": 2.8684615384615383e-06, - "loss": 0.3665, - "step": 16690 - }, - { - "epoch": 14.47, - "learning_rate": 2.8677622377622378e-06, - "loss": 0.3952, - "step": 16700 - }, - { - "epoch": 14.48, - "learning_rate": 2.8670629370629373e-06, - "loss": 0.4067, - "step": 16710 - }, - { - "epoch": 14.49, - "learning_rate": 2.866363636363636e-06, - "loss": 0.4177, - "step": 16720 - }, - { - "epoch": 14.5, - "learning_rate": 2.8656643356643354e-06, - "loss": 0.3951, - "step": 16730 - }, - { - "epoch": 14.51, - "learning_rate": 2.864965034965035e-06, - "loss": 0.4074, - "step": 16740 - }, - { - "epoch": 14.51, - "learning_rate": 2.864265734265734e-06, - "loss": 0.4256, - "step": 16750 - }, - { - "epoch": 14.52, - "learning_rate": 2.8635664335664335e-06, - "loss": 0.3896, - "step": 16760 - }, - { - "epoch": 14.53, - "learning_rate": 2.862867132867133e-06, - "loss": 0.4105, - "step": 16770 - }, - { - "epoch": 14.54, - "learning_rate": 2.862167832167832e-06, - "loss": 0.3995, - "step": 16780 - }, - { - "epoch": 14.55, - "learning_rate": 2.861468531468531e-06, - "loss": 0.4183, - "step": 16790 - }, - { - "epoch": 14.56, - "learning_rate": 2.8607692307692306e-06, - "loss": 0.4463, - "step": 16800 - }, - { - "epoch": 14.57, - "learning_rate": 2.86006993006993e-06, - "loss": 0.4485, - "step": 16810 - }, - { - "epoch": 14.58, - "learning_rate": 2.8593706293706296e-06, - "loss": 0.4317, - "step": 16820 - }, - { - "epoch": 14.58, - "learning_rate": 2.8586713286713283e-06, - "loss": 0.3431, - "step": 16830 - }, - { - "epoch": 14.59, - "learning_rate": 2.8579720279720278e-06, - "loss": 0.4122, - "step": 16840 - }, - { - "epoch": 14.6, - "learning_rate": 2.8572727272727273e-06, - "loss": 0.4, - "step": 16850 - }, - { - "epoch": 14.61, - "learning_rate": 2.8565734265734263e-06, - "loss": 0.3648, - "step": 16860 - }, - { - "epoch": 14.62, - "learning_rate": 2.855874125874126e-06, - "loss": 0.4101, - "step": 16870 - }, - { - "epoch": 14.63, - "learning_rate": 2.8551748251748253e-06, - "loss": 0.3953, - "step": 16880 - }, - { - "epoch": 14.64, - "learning_rate": 2.8544755244755244e-06, - "loss": 0.3571, - "step": 16890 - }, - { - "epoch": 14.64, - "learning_rate": 2.8537762237762235e-06, - "loss": 0.4135, - "step": 16900 - }, - { - "epoch": 14.65, - "learning_rate": 2.853076923076923e-06, - "loss": 0.3993, - "step": 16910 - }, - { - "epoch": 14.66, - "learning_rate": 2.8523776223776225e-06, - "loss": 0.4097, - "step": 16920 - }, - { - "epoch": 14.67, - "learning_rate": 2.8516783216783215e-06, - "loss": 0.4438, - "step": 16930 - }, - { - "epoch": 14.68, - "learning_rate": 2.8509790209790206e-06, - "loss": 0.4313, - "step": 16940 - }, - { - "epoch": 14.69, - "learning_rate": 2.85027972027972e-06, - "loss": 0.4028, - "step": 16950 - }, - { - "epoch": 14.7, - "learning_rate": 2.8495804195804196e-06, - "loss": 0.441, - "step": 16960 - }, - { - "epoch": 14.71, - "learning_rate": 2.8488811188811187e-06, - "loss": 0.4112, - "step": 16970 - }, - { - "epoch": 14.71, - "learning_rate": 2.848181818181818e-06, - "loss": 0.399, - "step": 16980 - }, - { - "epoch": 14.72, - "learning_rate": 2.8474825174825172e-06, - "loss": 0.3647, - "step": 16990 - }, - { - "epoch": 14.73, - "learning_rate": 2.8467832167832167e-06, - "loss": 0.3807, - "step": 17000 - }, - { - "epoch": 14.74, - "learning_rate": 2.846083916083916e-06, - "loss": 0.4839, - "step": 17010 - }, - { - "epoch": 14.75, - "learning_rate": 2.8453846153846153e-06, - "loss": 0.4013, - "step": 17020 - }, - { - "epoch": 14.76, - "learning_rate": 2.844685314685315e-06, - "loss": 0.3263, - "step": 17030 - }, - { - "epoch": 14.77, - "learning_rate": 2.843986013986014e-06, - "loss": 0.3927, - "step": 17040 - }, - { - "epoch": 14.77, - "learning_rate": 2.843286713286713e-06, - "loss": 0.3766, - "step": 17050 - }, - { - "epoch": 14.78, - "learning_rate": 2.8425874125874125e-06, - "loss": 0.4393, - "step": 17060 - }, - { - "epoch": 14.79, - "learning_rate": 2.841888111888112e-06, - "loss": 0.409, - "step": 17070 - }, - { - "epoch": 14.8, - "learning_rate": 2.841188811188811e-06, - "loss": 0.3585, - "step": 17080 - }, - { - "epoch": 14.81, - "learning_rate": 2.8404895104895105e-06, - "loss": 0.392, - "step": 17090 - }, - { - "epoch": 14.82, - "learning_rate": 2.8397902097902096e-06, - "loss": 0.417, - "step": 17100 - }, - { - "epoch": 14.83, - "learning_rate": 2.8390909090909087e-06, - "loss": 0.4063, - "step": 17110 - }, - { - "epoch": 14.83, - "learning_rate": 2.838391608391608e-06, - "loss": 0.3751, - "step": 17120 - }, - { - "epoch": 14.84, - "learning_rate": 2.8376923076923077e-06, - "loss": 0.3907, - "step": 17130 - }, - { - "epoch": 14.85, - "learning_rate": 2.836993006993007e-06, - "loss": 0.4433, - "step": 17140 - }, - { - "epoch": 14.86, - "learning_rate": 2.836293706293706e-06, - "loss": 0.4271, - "step": 17150 - }, - { - "epoch": 14.87, - "learning_rate": 2.8355944055944053e-06, - "loss": 0.4155, - "step": 17160 - }, - { - "epoch": 14.88, - "learning_rate": 2.834895104895105e-06, - "loss": 0.3911, - "step": 17170 - }, - { - "epoch": 14.89, - "learning_rate": 2.8341958041958043e-06, - "loss": 0.3268, - "step": 17180 - }, - { - "epoch": 14.9, - "learning_rate": 2.8334965034965034e-06, - "loss": 0.3477, - "step": 17190 - }, - { - "epoch": 14.9, - "learning_rate": 2.832797202797203e-06, - "loss": 0.4478, - "step": 17200 - }, - { - "epoch": 14.91, - "learning_rate": 2.832097902097902e-06, - "loss": 0.4441, - "step": 17210 - }, - { - "epoch": 14.92, - "learning_rate": 2.831398601398601e-06, - "loss": 0.4519, - "step": 17220 - }, - { - "epoch": 14.93, - "learning_rate": 2.8306993006993005e-06, - "loss": 0.4354, - "step": 17230 - }, - { - "epoch": 14.94, - "learning_rate": 2.83e-06, - "loss": 0.3698, - "step": 17240 - }, - { - "epoch": 14.95, - "learning_rate": 2.8293006993006995e-06, - "loss": 0.4287, - "step": 17250 - }, - { - "epoch": 14.96, - "learning_rate": 2.828601398601398e-06, - "loss": 0.4025, - "step": 17260 - }, - { - "epoch": 14.96, - "learning_rate": 2.8279020979020977e-06, - "loss": 0.4039, - "step": 17270 - }, - { - "epoch": 14.97, - "learning_rate": 2.827202797202797e-06, - "loss": 0.3422, - "step": 17280 - }, - { - "epoch": 14.98, - "learning_rate": 2.8265034965034962e-06, - "loss": 0.3912, - "step": 17290 - }, - { - "epoch": 14.99, - "learning_rate": 2.8258041958041957e-06, - "loss": 0.4358, - "step": 17300 - }, - { - "epoch": 15.0, - "learning_rate": 2.8251048951048952e-06, - "loss": 0.392, - "step": 17310 - }, - { - "epoch": 15.0, - "eval_loss": 0.5580989122390747, - "eval_runtime": 134.5878, - "eval_samples_per_second": 3.953, - "eval_steps_per_second": 1.976, - "eval_wer": 0.2593044931542071, - "step": 17310 - }, - { - "epoch": 15.01, - "learning_rate": 2.8244055944055943e-06, - "loss": 0.4794, - "step": 17320 - }, - { - "epoch": 15.02, - "learning_rate": 2.8237062937062934e-06, - "loss": 0.3538, - "step": 17330 - }, - { - "epoch": 15.03, - "learning_rate": 2.823006993006993e-06, - "loss": 0.432, - "step": 17340 - }, - { - "epoch": 15.03, - "learning_rate": 2.8223076923076924e-06, - "loss": 0.3713, - "step": 17350 - }, - { - "epoch": 15.04, - "learning_rate": 2.821608391608392e-06, - "loss": 0.4383, - "step": 17360 - }, - { - "epoch": 15.05, - "learning_rate": 2.8209090909090905e-06, - "loss": 0.4064, - "step": 17370 - }, - { - "epoch": 15.06, - "learning_rate": 2.82020979020979e-06, - "loss": 0.4444, - "step": 17380 - }, - { - "epoch": 15.07, - "learning_rate": 2.8195104895104895e-06, - "loss": 0.383, - "step": 17390 - }, - { - "epoch": 15.08, - "learning_rate": 2.8188111888111886e-06, - "loss": 0.413, - "step": 17400 - }, - { - "epoch": 15.09, - "learning_rate": 2.818111888111888e-06, - "loss": 0.4161, - "step": 17410 - }, - { - "epoch": 15.1, - "learning_rate": 2.8174125874125876e-06, - "loss": 0.3648, - "step": 17420 - }, - { - "epoch": 15.1, - "learning_rate": 2.8167132867132866e-06, - "loss": 0.3707, - "step": 17430 - }, - { - "epoch": 15.11, - "learning_rate": 2.8160139860139857e-06, - "loss": 0.3794, - "step": 17440 - }, - { - "epoch": 15.12, - "learning_rate": 2.815314685314685e-06, - "loss": 0.4292, - "step": 17450 - }, - { - "epoch": 15.13, - "learning_rate": 2.8146153846153847e-06, - "loss": 0.468, - "step": 17460 - }, - { - "epoch": 15.14, - "learning_rate": 2.8139160839160838e-06, - "loss": 0.3645, - "step": 17470 - }, - { - "epoch": 15.15, - "learning_rate": 2.813216783216783e-06, - "loss": 0.4114, - "step": 17480 - }, - { - "epoch": 15.16, - "learning_rate": 2.8125174825174824e-06, - "loss": 0.4202, - "step": 17490 - }, - { - "epoch": 15.16, - "learning_rate": 2.811818181818182e-06, - "loss": 0.4196, - "step": 17500 - }, - { - "epoch": 15.17, - "learning_rate": 2.811118881118881e-06, - "loss": 0.3847, - "step": 17510 - }, - { - "epoch": 15.18, - "learning_rate": 2.8104195804195804e-06, - "loss": 0.4578, - "step": 17520 - }, - { - "epoch": 15.19, - "learning_rate": 2.8097202797202795e-06, - "loss": 0.3375, - "step": 17530 - }, - { - "epoch": 15.2, - "learning_rate": 2.8090209790209786e-06, - "loss": 0.3479, - "step": 17540 - }, - { - "epoch": 15.21, - "learning_rate": 2.808321678321678e-06, - "loss": 0.3807, - "step": 17550 - }, - { - "epoch": 15.22, - "learning_rate": 2.8076223776223776e-06, - "loss": 0.4187, - "step": 17560 - }, - { - "epoch": 15.23, - "learning_rate": 2.806923076923077e-06, - "loss": 0.3555, - "step": 17570 - }, - { - "epoch": 15.23, - "learning_rate": 2.806223776223776e-06, - "loss": 0.403, - "step": 17580 - }, - { - "epoch": 15.24, - "learning_rate": 2.805524475524475e-06, - "loss": 0.3263, - "step": 17590 - }, - { - "epoch": 15.25, - "learning_rate": 2.8048251748251747e-06, - "loss": 0.3526, - "step": 17600 - }, - { - "epoch": 15.26, - "learning_rate": 2.804125874125874e-06, - "loss": 0.3838, - "step": 17610 - }, - { - "epoch": 15.27, - "learning_rate": 2.8034265734265733e-06, - "loss": 0.4049, - "step": 17620 - }, - { - "epoch": 15.28, - "learning_rate": 2.8027272727272728e-06, - "loss": 0.4254, - "step": 17630 - }, - { - "epoch": 15.29, - "learning_rate": 2.802027972027972e-06, - "loss": 0.3857, - "step": 17640 - }, - { - "epoch": 15.29, - "learning_rate": 2.801328671328671e-06, - "loss": 0.3738, - "step": 17650 - }, - { - "epoch": 15.3, - "learning_rate": 2.8006293706293704e-06, - "loss": 0.389, - "step": 17660 - }, - { - "epoch": 15.31, - "learning_rate": 2.79993006993007e-06, - "loss": 0.4428, - "step": 17670 - }, - { - "epoch": 15.32, - "learning_rate": 2.7992307692307694e-06, - "loss": 0.36, - "step": 17680 - }, - { - "epoch": 15.33, - "learning_rate": 2.798531468531468e-06, - "loss": 0.3858, - "step": 17690 - }, - { - "epoch": 15.34, - "learning_rate": 2.7978321678321676e-06, - "loss": 0.4003, - "step": 17700 - }, - { - "epoch": 15.35, - "learning_rate": 2.797132867132867e-06, - "loss": 0.4563, - "step": 17710 - }, - { - "epoch": 15.36, - "learning_rate": 2.796433566433566e-06, - "loss": 0.3905, - "step": 17720 - }, - { - "epoch": 15.36, - "learning_rate": 2.7957342657342656e-06, - "loss": 0.3633, - "step": 17730 - }, - { - "epoch": 15.37, - "learning_rate": 2.795034965034965e-06, - "loss": 0.3883, - "step": 17740 - }, - { - "epoch": 15.38, - "learning_rate": 2.794335664335664e-06, - "loss": 0.3688, - "step": 17750 - }, - { - "epoch": 15.39, - "learning_rate": 2.7936363636363633e-06, - "loss": 0.4025, - "step": 17760 - }, - { - "epoch": 15.4, - "learning_rate": 2.7929370629370628e-06, - "loss": 0.3778, - "step": 17770 - }, - { - "epoch": 15.41, - "learning_rate": 2.7922377622377623e-06, - "loss": 0.4241, - "step": 17780 - }, - { - "epoch": 15.42, - "learning_rate": 2.7915384615384618e-06, - "loss": 0.3872, - "step": 17790 - }, - { - "epoch": 15.42, - "learning_rate": 2.7908391608391604e-06, - "loss": 0.3909, - "step": 17800 - }, - { - "epoch": 15.43, - "learning_rate": 2.79013986013986e-06, - "loss": 0.3407, - "step": 17810 - }, - { - "epoch": 15.44, - "learning_rate": 2.7894405594405594e-06, - "loss": 0.3655, - "step": 17820 - }, - { - "epoch": 15.45, - "learning_rate": 2.7887412587412585e-06, - "loss": 0.3589, - "step": 17830 - }, - { - "epoch": 15.46, - "learning_rate": 2.788041958041958e-06, - "loss": 0.4076, - "step": 17840 - }, - { - "epoch": 15.47, - "learning_rate": 2.7873426573426575e-06, - "loss": 0.4224, - "step": 17850 - }, - { - "epoch": 15.48, - "learning_rate": 2.7866433566433565e-06, - "loss": 0.3787, - "step": 17860 - }, - { - "epoch": 15.49, - "learning_rate": 2.7859440559440556e-06, - "loss": 0.4452, - "step": 17870 - }, - { - "epoch": 15.49, - "learning_rate": 2.785244755244755e-06, - "loss": 0.37, - "step": 17880 - }, - { - "epoch": 15.5, - "learning_rate": 2.7845454545454546e-06, - "loss": 0.3824, - "step": 17890 - }, - { - "epoch": 15.51, - "learning_rate": 2.7838461538461537e-06, - "loss": 0.3833, - "step": 17900 - }, - { - "epoch": 15.52, - "learning_rate": 2.7831468531468528e-06, - "loss": 0.4135, - "step": 17910 - }, - { - "epoch": 15.53, - "learning_rate": 2.7824475524475522e-06, - "loss": 0.4404, - "step": 17920 - }, - { - "epoch": 15.54, - "learning_rate": 2.7817482517482517e-06, - "loss": 0.362, - "step": 17930 - }, - { - "epoch": 15.55, - "learning_rate": 2.781048951048951e-06, - "loss": 0.421, - "step": 17940 - }, - { - "epoch": 15.55, - "learning_rate": 2.7803496503496503e-06, - "loss": 0.4144, - "step": 17950 - }, - { - "epoch": 15.56, - "learning_rate": 2.77965034965035e-06, - "loss": 0.4041, - "step": 17960 - }, - { - "epoch": 15.57, - "learning_rate": 2.778951048951049e-06, - "loss": 0.3806, - "step": 17970 - }, - { - "epoch": 15.58, - "learning_rate": 2.778251748251748e-06, - "loss": 0.4288, - "step": 17980 - }, - { - "epoch": 15.59, - "learning_rate": 2.7775524475524475e-06, - "loss": 0.3813, - "step": 17990 - }, - { - "epoch": 15.6, - "learning_rate": 2.776853146853147e-06, - "loss": 0.3247, - "step": 18000 - }, - { - "epoch": 15.61, - "learning_rate": 2.776153846153846e-06, - "loss": 0.3454, - "step": 18010 - }, - { - "epoch": 15.61, - "learning_rate": 2.775454545454545e-06, - "loss": 0.3573, - "step": 18020 - }, - { - "epoch": 15.62, - "learning_rate": 2.7747552447552446e-06, - "loss": 0.4104, - "step": 18030 - }, - { - "epoch": 15.63, - "learning_rate": 2.774055944055944e-06, - "loss": 0.36, - "step": 18040 - }, - { - "epoch": 15.64, - "learning_rate": 2.773356643356643e-06, - "loss": 0.3871, - "step": 18050 - }, - { - "epoch": 15.65, - "learning_rate": 2.7726573426573427e-06, - "loss": 0.3662, - "step": 18060 - }, - { - "epoch": 15.66, - "learning_rate": 2.7719580419580417e-06, - "loss": 0.3593, - "step": 18070 - }, - { - "epoch": 15.67, - "learning_rate": 2.771258741258741e-06, - "loss": 0.3884, - "step": 18080 - }, - { - "epoch": 15.68, - "learning_rate": 2.7705594405594403e-06, - "loss": 0.3671, - "step": 18090 - }, - { - "epoch": 15.68, - "learning_rate": 2.76986013986014e-06, - "loss": 0.3949, - "step": 18100 - }, - { - "epoch": 15.69, - "learning_rate": 2.7691608391608393e-06, - "loss": 0.3839, - "step": 18110 - }, - { - "epoch": 15.7, - "learning_rate": 2.7684615384615384e-06, - "loss": 0.4158, - "step": 18120 - }, - { - "epoch": 15.71, - "learning_rate": 2.7677622377622374e-06, - "loss": 0.3239, - "step": 18130 - }, - { - "epoch": 15.72, - "learning_rate": 2.767062937062937e-06, - "loss": 0.3464, - "step": 18140 - }, - { - "epoch": 15.73, - "learning_rate": 2.7663636363636364e-06, - "loss": 0.3884, - "step": 18150 - }, - { - "epoch": 15.74, - "learning_rate": 2.7656643356643355e-06, - "loss": 0.4807, - "step": 18160 - }, - { - "epoch": 15.74, - "learning_rate": 2.764965034965035e-06, - "loss": 0.3784, - "step": 18170 - }, - { - "epoch": 15.75, - "learning_rate": 2.764265734265734e-06, - "loss": 0.3405, - "step": 18180 - }, - { - "epoch": 15.76, - "learning_rate": 2.763566433566433e-06, - "loss": 0.4299, - "step": 18190 - }, - { - "epoch": 15.77, - "learning_rate": 2.7628671328671327e-06, - "loss": 0.4014, - "step": 18200 - }, - { - "epoch": 15.78, - "learning_rate": 2.762167832167832e-06, - "loss": 0.4313, - "step": 18210 - }, - { - "epoch": 15.79, - "learning_rate": 2.7614685314685317e-06, - "loss": 0.4522, - "step": 18220 - }, - { - "epoch": 15.8, - "learning_rate": 2.7607692307692307e-06, - "loss": 0.4019, - "step": 18230 - }, - { - "epoch": 15.81, - "learning_rate": 2.76006993006993e-06, - "loss": 0.4175, - "step": 18240 - }, - { - "epoch": 15.81, - "learning_rate": 2.7593706293706293e-06, - "loss": 0.3939, - "step": 18250 - }, - { - "epoch": 15.82, - "learning_rate": 2.7586713286713284e-06, - "loss": 0.4423, - "step": 18260 - }, - { - "epoch": 15.83, - "learning_rate": 2.757972027972028e-06, - "loss": 0.414, - "step": 18270 - }, - { - "epoch": 15.84, - "learning_rate": 2.7572727272727274e-06, - "loss": 0.3687, - "step": 18280 - }, - { - "epoch": 15.85, - "learning_rate": 2.7565734265734264e-06, - "loss": 0.3526, - "step": 18290 - }, - { - "epoch": 15.86, - "learning_rate": 2.7558741258741255e-06, - "loss": 0.389, - "step": 18300 - }, - { - "epoch": 15.87, - "learning_rate": 2.755174825174825e-06, - "loss": 0.4634, - "step": 18310 - }, - { - "epoch": 15.87, - "learning_rate": 2.7544755244755245e-06, - "loss": 0.3854, - "step": 18320 - }, - { - "epoch": 15.88, - "learning_rate": 2.7538461538461535e-06, - "loss": 0.4101, - "step": 18330 - }, - { - "epoch": 15.89, - "learning_rate": 2.753146853146853e-06, - "loss": 0.4215, - "step": 18340 - }, - { - "epoch": 15.9, - "learning_rate": 2.752447552447552e-06, - "loss": 0.4324, - "step": 18350 - }, - { - "epoch": 15.91, - "learning_rate": 2.7517482517482516e-06, - "loss": 0.3848, - "step": 18360 - }, - { - "epoch": 15.92, - "learning_rate": 2.751048951048951e-06, - "loss": 0.3643, - "step": 18370 - }, - { - "epoch": 15.93, - "learning_rate": 2.75034965034965e-06, - "loss": 0.4236, - "step": 18380 - }, - { - "epoch": 15.94, - "learning_rate": 2.7496503496503493e-06, - "loss": 0.3534, - "step": 18390 - }, - { - "epoch": 15.94, - "learning_rate": 2.7489510489510488e-06, - "loss": 0.4274, - "step": 18400 - }, - { - "epoch": 15.95, - "learning_rate": 2.7482517482517482e-06, - "loss": 0.4021, - "step": 18410 - }, - { - "epoch": 15.96, - "learning_rate": 2.7476223776223773e-06, - "loss": 0.3989, - "step": 18420 - }, - { - "epoch": 15.97, - "learning_rate": 2.7469230769230768e-06, - "loss": 0.3813, - "step": 18430 - }, - { - "epoch": 15.98, - "learning_rate": 2.746223776223776e-06, - "loss": 0.382, - "step": 18440 - }, - { - "epoch": 15.99, - "learning_rate": 2.7455244755244754e-06, - "loss": 0.4029, - "step": 18450 - }, - { - "epoch": 16.0, - "learning_rate": 2.744825174825175e-06, - "loss": 0.401, - "step": 18460 - }, - { - "epoch": 16.0, - "eval_loss": 0.5527588725090027, - "eval_runtime": 134.4619, - "eval_samples_per_second": 3.957, - "eval_steps_per_second": 1.978, - "eval_wer": 0.25660474384521437, - "step": 18464 - }, - { - "epoch": 16.01, - "learning_rate": 2.7441258741258743e-06, - "loss": 0.3866, - "step": 18470 - }, - { - "epoch": 16.01, - "learning_rate": 2.743426573426573e-06, - "loss": 0.408, - "step": 18480 - }, - { - "epoch": 16.02, - "learning_rate": 2.7427272727272725e-06, - "loss": 0.3622, - "step": 18490 - }, - { - "epoch": 16.03, - "learning_rate": 2.742027972027972e-06, - "loss": 0.3686, - "step": 18500 - }, - { - "epoch": 16.04, - "learning_rate": 2.7413286713286715e-06, - "loss": 0.451, - "step": 18510 - }, - { - "epoch": 16.05, - "learning_rate": 2.7406293706293706e-06, - "loss": 0.3892, - "step": 18520 - }, - { - "epoch": 16.06, - "learning_rate": 2.7399300699300696e-06, - "loss": 0.3524, - "step": 18530 - }, - { - "epoch": 16.07, - "learning_rate": 2.739230769230769e-06, - "loss": 0.4344, - "step": 18540 - }, - { - "epoch": 16.07, - "learning_rate": 2.738531468531468e-06, - "loss": 0.3783, - "step": 18550 - }, - { - "epoch": 16.08, - "learning_rate": 2.7378321678321677e-06, - "loss": 0.3873, - "step": 18560 - }, - { - "epoch": 16.09, - "learning_rate": 2.737132867132867e-06, - "loss": 0.3959, - "step": 18570 - }, - { - "epoch": 16.1, - "learning_rate": 2.7364335664335667e-06, - "loss": 0.4067, - "step": 18580 - }, - { - "epoch": 16.11, - "learning_rate": 2.7357342657342653e-06, - "loss": 0.3906, - "step": 18590 - }, - { - "epoch": 16.12, - "learning_rate": 2.735034965034965e-06, - "loss": 0.4194, - "step": 18600 - }, - { - "epoch": 16.13, - "learning_rate": 2.7343356643356643e-06, - "loss": 0.4019, - "step": 18610 - }, - { - "epoch": 16.14, - "learning_rate": 2.7336363636363634e-06, - "loss": 0.4133, - "step": 18620 - }, - { - "epoch": 16.14, - "learning_rate": 2.732937062937063e-06, - "loss": 0.3734, - "step": 18630 - }, - { - "epoch": 16.15, - "learning_rate": 2.732237762237762e-06, - "loss": 0.3443, - "step": 18640 - }, - { - "epoch": 16.16, - "learning_rate": 2.7315384615384615e-06, - "loss": 0.4262, - "step": 18650 - }, - { - "epoch": 16.17, - "learning_rate": 2.7308391608391606e-06, - "loss": 0.4021, - "step": 18660 - }, - { - "epoch": 16.18, - "learning_rate": 2.73013986013986e-06, - "loss": 0.3941, - "step": 18670 - }, - { - "epoch": 16.19, - "learning_rate": 2.7294405594405595e-06, - "loss": 0.4043, - "step": 18680 - }, - { - "epoch": 16.2, - "learning_rate": 2.7287412587412586e-06, - "loss": 0.3946, - "step": 18690 - }, - { - "epoch": 16.2, - "learning_rate": 2.7280419580419577e-06, - "loss": 0.3554, - "step": 18700 - }, - { - "epoch": 16.21, - "learning_rate": 2.727342657342657e-06, - "loss": 0.3961, - "step": 18710 - }, - { - "epoch": 16.22, - "learning_rate": 2.7266433566433567e-06, - "loss": 0.4002, - "step": 18720 - }, - { - "epoch": 16.23, - "learning_rate": 2.7259440559440558e-06, - "loss": 0.3996, - "step": 18730 - }, - { - "epoch": 16.24, - "learning_rate": 2.7252447552447553e-06, - "loss": 0.3419, - "step": 18740 - }, - { - "epoch": 16.25, - "learning_rate": 2.7245454545454543e-06, - "loss": 0.3855, - "step": 18750 - }, - { - "epoch": 16.26, - "learning_rate": 2.723846153846154e-06, - "loss": 0.454, - "step": 18760 - }, - { - "epoch": 16.27, - "learning_rate": 2.723146853146853e-06, - "loss": 0.3747, - "step": 18770 - }, - { - "epoch": 16.27, - "learning_rate": 2.7224475524475524e-06, - "loss": 0.366, - "step": 18780 - }, - { - "epoch": 16.28, - "learning_rate": 2.721748251748252e-06, - "loss": 0.4218, - "step": 18790 - }, - { - "epoch": 16.29, - "learning_rate": 2.7210489510489505e-06, - "loss": 0.3791, - "step": 18800 - }, - { - "epoch": 16.3, - "learning_rate": 2.72034965034965e-06, - "loss": 0.4636, - "step": 18810 - }, - { - "epoch": 16.31, - "learning_rate": 2.7196503496503495e-06, - "loss": 0.3836, - "step": 18820 - }, - { - "epoch": 16.32, - "learning_rate": 2.718951048951049e-06, - "loss": 0.4457, - "step": 18830 - }, - { - "epoch": 16.33, - "learning_rate": 2.718251748251748e-06, - "loss": 0.3602, - "step": 18840 - }, - { - "epoch": 16.33, - "learning_rate": 2.717552447552447e-06, - "loss": 0.4125, - "step": 18850 - }, - { - "epoch": 16.34, - "learning_rate": 2.7168531468531467e-06, - "loss": 0.4183, - "step": 18860 - }, - { - "epoch": 16.35, - "learning_rate": 2.716153846153846e-06, - "loss": 0.3852, - "step": 18870 - }, - { - "epoch": 16.36, - "learning_rate": 2.7154545454545453e-06, - "loss": 0.427, - "step": 18880 - }, - { - "epoch": 16.37, - "learning_rate": 2.7147552447552447e-06, - "loss": 0.3541, - "step": 18890 - }, - { - "epoch": 16.38, - "learning_rate": 2.7140559440559442e-06, - "loss": 0.3876, - "step": 18900 - }, - { - "epoch": 16.39, - "learning_rate": 2.713356643356643e-06, - "loss": 0.4169, - "step": 18910 - }, - { - "epoch": 16.39, - "learning_rate": 2.7126573426573424e-06, - "loss": 0.3701, - "step": 18920 - }, - { - "epoch": 16.4, - "learning_rate": 2.711958041958042e-06, - "loss": 0.418, - "step": 18930 - }, - { - "epoch": 16.41, - "learning_rate": 2.7112587412587414e-06, - "loss": 0.3641, - "step": 18940 - }, - { - "epoch": 16.42, - "learning_rate": 2.7105594405594405e-06, - "loss": 0.3692, - "step": 18950 - }, - { - "epoch": 16.43, - "learning_rate": 2.7098601398601395e-06, - "loss": 0.4281, - "step": 18960 - }, - { - "epoch": 16.44, - "learning_rate": 2.709160839160839e-06, - "loss": 0.3755, - "step": 18970 - }, - { - "epoch": 16.45, - "learning_rate": 2.708461538461538e-06, - "loss": 0.3857, - "step": 18980 - }, - { - "epoch": 16.46, - "learning_rate": 2.7077622377622376e-06, - "loss": 0.4253, - "step": 18990 - }, - { - "epoch": 16.46, - "learning_rate": 2.707062937062937e-06, - "loss": 0.3912, - "step": 19000 - }, - { - "epoch": 16.47, - "learning_rate": 2.7063636363636366e-06, - "loss": 0.429, - "step": 19010 - }, - { - "epoch": 16.48, - "learning_rate": 2.7056643356643352e-06, - "loss": 0.4558, - "step": 19020 - }, - { - "epoch": 16.49, - "learning_rate": 2.7049650349650347e-06, - "loss": 0.4172, - "step": 19030 - }, - { - "epoch": 16.5, - "learning_rate": 2.7042657342657342e-06, - "loss": 0.4004, - "step": 19040 - }, - { - "epoch": 16.51, - "learning_rate": 2.7035664335664337e-06, - "loss": 0.4207, - "step": 19050 - }, - { - "epoch": 16.52, - "learning_rate": 2.702867132867133e-06, - "loss": 0.4373, - "step": 19060 - }, - { - "epoch": 16.52, - "learning_rate": 2.702167832167832e-06, - "loss": 0.4508, - "step": 19070 - }, - { - "epoch": 16.53, - "learning_rate": 2.7014685314685314e-06, - "loss": 0.4109, - "step": 19080 - }, - { - "epoch": 16.54, - "learning_rate": 2.7007692307692305e-06, - "loss": 0.4186, - "step": 19090 - }, - { - "epoch": 16.55, - "learning_rate": 2.70006993006993e-06, - "loss": 0.3652, - "step": 19100 - }, - { - "epoch": 16.56, - "learning_rate": 2.6993706293706294e-06, - "loss": 0.4016, - "step": 19110 - }, - { - "epoch": 16.57, - "learning_rate": 2.698671328671329e-06, - "loss": 0.4264, - "step": 19120 - }, - { - "epoch": 16.58, - "learning_rate": 2.6979720279720276e-06, - "loss": 0.3732, - "step": 19130 - }, - { - "epoch": 16.59, - "learning_rate": 2.697272727272727e-06, - "loss": 0.3571, - "step": 19140 - }, - { - "epoch": 16.59, - "learning_rate": 2.6965734265734266e-06, - "loss": 0.4206, - "step": 19150 - }, - { - "epoch": 16.6, - "learning_rate": 2.6958741258741257e-06, - "loss": 0.3823, - "step": 19160 - }, - { - "epoch": 16.61, - "learning_rate": 2.695174825174825e-06, - "loss": 0.3829, - "step": 19170 - }, - { - "epoch": 16.62, - "learning_rate": 2.6944755244755242e-06, - "loss": 0.392, - "step": 19180 - }, - { - "epoch": 16.63, - "learning_rate": 2.6937762237762237e-06, - "loss": 0.3682, - "step": 19190 - }, - { - "epoch": 16.64, - "learning_rate": 2.693076923076923e-06, - "loss": 0.4124, - "step": 19200 - }, - { - "epoch": 16.65, - "learning_rate": 2.6923776223776223e-06, - "loss": 0.3521, - "step": 19210 - }, - { - "epoch": 16.65, - "learning_rate": 2.691678321678322e-06, - "loss": 0.3398, - "step": 19220 - }, - { - "epoch": 16.66, - "learning_rate": 2.690979020979021e-06, - "loss": 0.3953, - "step": 19230 - }, - { - "epoch": 16.67, - "learning_rate": 2.69027972027972e-06, - "loss": 0.3081, - "step": 19240 - }, - { - "epoch": 16.68, - "learning_rate": 2.6895804195804194e-06, - "loss": 0.3745, - "step": 19250 - }, - { - "epoch": 16.69, - "learning_rate": 2.688881118881119e-06, - "loss": 0.3325, - "step": 19260 - }, - { - "epoch": 16.7, - "learning_rate": 2.688181818181818e-06, - "loss": 0.3733, - "step": 19270 - }, - { - "epoch": 16.71, - "learning_rate": 2.6874825174825175e-06, - "loss": 0.5077, - "step": 19280 - }, - { - "epoch": 16.72, - "learning_rate": 2.6867832167832166e-06, - "loss": 0.384, - "step": 19290 - }, - { - "epoch": 16.72, - "learning_rate": 2.686083916083916e-06, - "loss": 0.3758, - "step": 19300 - }, - { - "epoch": 16.73, - "learning_rate": 2.685384615384615e-06, - "loss": 0.359, - "step": 19310 - }, - { - "epoch": 16.74, - "learning_rate": 2.6846853146853146e-06, - "loss": 0.4364, - "step": 19320 - }, - { - "epoch": 16.75, - "learning_rate": 2.683986013986014e-06, - "loss": 0.4155, - "step": 19330 - }, - { - "epoch": 16.76, - "learning_rate": 2.683286713286713e-06, - "loss": 0.3362, - "step": 19340 - }, - { - "epoch": 16.77, - "learning_rate": 2.6825874125874123e-06, - "loss": 0.3266, - "step": 19350 - }, - { - "epoch": 16.78, - "learning_rate": 2.6818881118881118e-06, - "loss": 0.396, - "step": 19360 - }, - { - "epoch": 16.78, - "learning_rate": 2.6811888111888113e-06, - "loss": 0.4046, - "step": 19370 - }, - { - "epoch": 16.79, - "learning_rate": 2.6804895104895104e-06, - "loss": 0.3826, - "step": 19380 - }, - { - "epoch": 16.8, - "learning_rate": 2.67979020979021e-06, - "loss": 0.4214, - "step": 19390 - }, - { - "epoch": 16.81, - "learning_rate": 2.679090909090909e-06, - "loss": 0.4371, - "step": 19400 - }, - { - "epoch": 16.82, - "learning_rate": 2.678391608391608e-06, - "loss": 0.4201, - "step": 19410 - }, - { - "epoch": 16.83, - "learning_rate": 2.6776923076923075e-06, - "loss": 0.4438, - "step": 19420 - }, - { - "epoch": 16.84, - "learning_rate": 2.676993006993007e-06, - "loss": 0.404, - "step": 19430 - }, - { - "epoch": 16.85, - "learning_rate": 2.6762937062937065e-06, - "loss": 0.3562, - "step": 19440 - }, - { - "epoch": 16.85, - "learning_rate": 2.675594405594405e-06, - "loss": 0.4756, - "step": 19450 - }, - { - "epoch": 16.86, - "learning_rate": 2.6748951048951046e-06, - "loss": 0.407, - "step": 19460 - }, - { - "epoch": 16.87, - "learning_rate": 2.674195804195804e-06, - "loss": 0.4391, - "step": 19470 - }, - { - "epoch": 16.88, - "learning_rate": 2.6734965034965036e-06, - "loss": 0.3603, - "step": 19480 - }, - { - "epoch": 16.89, - "learning_rate": 2.6727972027972027e-06, - "loss": 0.3468, - "step": 19490 - }, - { - "epoch": 16.9, - "learning_rate": 2.6720979020979018e-06, - "loss": 0.3874, - "step": 19500 - }, - { - "epoch": 16.91, - "learning_rate": 2.6713986013986013e-06, - "loss": 0.4372, - "step": 19510 - }, - { - "epoch": 16.91, - "learning_rate": 2.6706993006993004e-06, - "loss": 0.3371, - "step": 19520 - }, - { - "epoch": 16.92, - "learning_rate": 2.67e-06, - "loss": 0.351, - "step": 19530 - }, - { - "epoch": 16.93, - "learning_rate": 2.6693006993006993e-06, - "loss": 0.3351, - "step": 19540 - }, - { - "epoch": 16.94, - "learning_rate": 2.668601398601399e-06, - "loss": 0.3939, - "step": 19550 - }, - { - "epoch": 16.95, - "learning_rate": 2.6679020979020975e-06, - "loss": 0.3767, - "step": 19560 - }, - { - "epoch": 16.96, - "learning_rate": 2.667202797202797e-06, - "loss": 0.4356, - "step": 19570 - }, - { - "epoch": 16.97, - "learning_rate": 2.6665034965034965e-06, - "loss": 0.4077, - "step": 19580 - }, - { - "epoch": 16.98, - "learning_rate": 2.6658041958041956e-06, - "loss": 0.3415, - "step": 19590 - }, - { - "epoch": 16.98, - "learning_rate": 2.665104895104895e-06, - "loss": 0.3812, - "step": 19600 - }, - { - "epoch": 16.99, - "learning_rate": 2.664405594405594e-06, - "loss": 0.4391, - "step": 19610 - }, - { - "epoch": 17.0, - "eval_loss": 0.5583595633506775, - "eval_runtime": 135.8775, - "eval_samples_per_second": 3.915, - "eval_steps_per_second": 1.958, - "eval_wer": 0.25544770842707465, - "step": 19618 - }, - { - "epoch": 17.0, - "learning_rate": 2.6637062937062936e-06, - "loss": 0.4462, - "step": 19620 - }, - { - "epoch": 17.01, - "learning_rate": 2.6630069930069927e-06, - "loss": 0.4311, - "step": 19630 - }, - { - "epoch": 17.02, - "learning_rate": 2.662307692307692e-06, - "loss": 0.3632, - "step": 19640 - }, - { - "epoch": 17.03, - "learning_rate": 2.6616083916083917e-06, - "loss": 0.3747, - "step": 19650 - }, - { - "epoch": 17.04, - "learning_rate": 2.660909090909091e-06, - "loss": 0.3097, - "step": 19660 - }, - { - "epoch": 17.05, - "learning_rate": 2.66020979020979e-06, - "loss": 0.4059, - "step": 19670 - }, - { - "epoch": 17.05, - "learning_rate": 2.6595104895104893e-06, - "loss": 0.3929, - "step": 19680 - }, - { - "epoch": 17.06, - "learning_rate": 2.658811188811189e-06, - "loss": 0.4335, - "step": 19690 - }, - { - "epoch": 17.07, - "learning_rate": 2.658111888111888e-06, - "loss": 0.3721, - "step": 19700 - }, - { - "epoch": 17.08, - "learning_rate": 2.6574125874125874e-06, - "loss": 0.3538, - "step": 19710 - }, - { - "epoch": 17.09, - "learning_rate": 2.6567132867132865e-06, - "loss": 0.3729, - "step": 19720 - }, - { - "epoch": 17.1, - "learning_rate": 2.656013986013986e-06, - "loss": 0.413, - "step": 19730 - }, - { - "epoch": 17.11, - "learning_rate": 2.655314685314685e-06, - "loss": 0.3944, - "step": 19740 - }, - { - "epoch": 17.11, - "learning_rate": 2.6546153846153845e-06, - "loss": 0.3932, - "step": 19750 - }, - { - "epoch": 17.12, - "learning_rate": 2.653916083916084e-06, - "loss": 0.3938, - "step": 19760 - }, - { - "epoch": 17.13, - "learning_rate": 2.6532167832167827e-06, - "loss": 0.3072, - "step": 19770 - }, - { - "epoch": 17.14, - "learning_rate": 2.652517482517482e-06, - "loss": 0.3738, - "step": 19780 - }, - { - "epoch": 17.15, - "learning_rate": 2.6518181818181817e-06, - "loss": 0.3518, - "step": 19790 - }, - { - "epoch": 17.16, - "learning_rate": 2.651118881118881e-06, - "loss": 0.3591, - "step": 19800 - }, - { - "epoch": 17.17, - "learning_rate": 2.6504195804195803e-06, - "loss": 0.4291, - "step": 19810 - }, - { - "epoch": 17.17, - "learning_rate": 2.6497202797202798e-06, - "loss": 0.4052, - "step": 19820 - }, - { - "epoch": 17.18, - "learning_rate": 2.649020979020979e-06, - "loss": 0.3796, - "step": 19830 - }, - { - "epoch": 17.19, - "learning_rate": 2.6483216783216783e-06, - "loss": 0.3255, - "step": 19840 - }, - { - "epoch": 17.2, - "learning_rate": 2.6476223776223774e-06, - "loss": 0.3811, - "step": 19850 - }, - { - "epoch": 17.21, - "learning_rate": 2.646923076923077e-06, - "loss": 0.4578, - "step": 19860 - }, - { - "epoch": 17.22, - "learning_rate": 2.6462237762237764e-06, - "loss": 0.4539, - "step": 19870 - }, - { - "epoch": 17.23, - "learning_rate": 2.645524475524475e-06, - "loss": 0.3946, - "step": 19880 - }, - { - "epoch": 17.24, - "learning_rate": 2.6448251748251745e-06, - "loss": 0.4328, - "step": 19890 - }, - { - "epoch": 17.24, - "learning_rate": 2.644125874125874e-06, - "loss": 0.4009, - "step": 19900 - }, - { - "epoch": 17.25, - "learning_rate": 2.6434265734265735e-06, - "loss": 0.373, - "step": 19910 - }, - { - "epoch": 17.26, - "learning_rate": 2.6427272727272726e-06, - "loss": 0.3561, - "step": 19920 - }, - { - "epoch": 17.27, - "learning_rate": 2.642027972027972e-06, - "loss": 0.3972, - "step": 19930 - }, - { - "epoch": 17.28, - "learning_rate": 2.641328671328671e-06, - "loss": 0.3716, - "step": 19940 - }, - { - "epoch": 17.29, - "learning_rate": 2.6406293706293702e-06, - "loss": 0.3482, - "step": 19950 - }, - { - "epoch": 17.3, - "learning_rate": 2.6399300699300697e-06, - "loss": 0.3972, - "step": 19960 - }, - { - "epoch": 17.3, - "learning_rate": 2.6392307692307692e-06, - "loss": 0.4394, - "step": 19970 - }, - { - "epoch": 17.31, - "learning_rate": 2.6385314685314687e-06, - "loss": 0.4083, - "step": 19980 - }, - { - "epoch": 17.32, - "learning_rate": 2.6378321678321674e-06, - "loss": 0.3908, - "step": 19990 - }, - { - "epoch": 17.33, - "learning_rate": 2.637132867132867e-06, - "loss": 0.4101, - "step": 20000 - }, - { - "epoch": 17.34, - "learning_rate": 2.6364335664335664e-06, - "loss": 0.3879, - "step": 20010 - }, - { - "epoch": 17.35, - "learning_rate": 2.635734265734266e-06, - "loss": 0.4163, - "step": 20020 - }, - { - "epoch": 17.36, - "learning_rate": 2.635034965034965e-06, - "loss": 0.3777, - "step": 20030 - }, - { - "epoch": 17.37, - "learning_rate": 2.634335664335664e-06, - "loss": 0.3931, - "step": 20040 - }, - { - "epoch": 17.37, - "learning_rate": 2.6336363636363635e-06, - "loss": 0.374, - "step": 20050 - }, - { - "epoch": 17.38, - "learning_rate": 2.6329370629370626e-06, - "loss": 0.4067, - "step": 20060 - }, - { - "epoch": 17.39, - "learning_rate": 2.632237762237762e-06, - "loss": 0.3838, - "step": 20070 - }, - { - "epoch": 17.4, - "learning_rate": 2.6315384615384616e-06, - "loss": 0.4246, - "step": 20080 - }, - { - "epoch": 17.41, - "learning_rate": 2.630839160839161e-06, - "loss": 0.395, - "step": 20090 - }, - { - "epoch": 17.42, - "learning_rate": 2.6301398601398597e-06, - "loss": 0.3462, - "step": 20100 - }, - { - "epoch": 17.43, - "learning_rate": 2.6294405594405592e-06, - "loss": 0.4599, - "step": 20110 - }, - { - "epoch": 17.43, - "learning_rate": 2.6287412587412587e-06, - "loss": 0.3861, - "step": 20120 - }, - { - "epoch": 17.44, - "learning_rate": 2.628041958041958e-06, - "loss": 0.3687, - "step": 20130 - }, - { - "epoch": 17.45, - "learning_rate": 2.6273426573426573e-06, - "loss": 0.4269, - "step": 20140 - }, - { - "epoch": 17.46, - "learning_rate": 2.6266433566433564e-06, - "loss": 0.4417, - "step": 20150 - }, - { - "epoch": 17.47, - "learning_rate": 2.625944055944056e-06, - "loss": 0.4375, - "step": 20160 - }, - { - "epoch": 17.48, - "learning_rate": 2.625244755244755e-06, - "loss": 0.3211, - "step": 20170 - }, - { - "epoch": 17.49, - "learning_rate": 2.6245454545454544e-06, - "loss": 0.3927, - "step": 20180 - }, - { - "epoch": 17.5, - "learning_rate": 2.623846153846154e-06, - "loss": 0.3841, - "step": 20190 - }, - { - "epoch": 17.5, - "learning_rate": 2.6231468531468534e-06, - "loss": 0.3553, - "step": 20200 - }, - { - "epoch": 17.51, - "learning_rate": 2.622447552447552e-06, - "loss": 0.4109, - "step": 20210 - }, - { - "epoch": 17.52, - "learning_rate": 2.6217482517482516e-06, - "loss": 0.4795, - "step": 20220 - }, - { - "epoch": 17.53, - "learning_rate": 2.621048951048951e-06, - "loss": 0.3969, - "step": 20230 - }, - { - "epoch": 17.54, - "learning_rate": 2.62034965034965e-06, - "loss": 0.3544, - "step": 20240 - }, - { - "epoch": 17.55, - "learning_rate": 2.6196503496503497e-06, - "loss": 0.4274, - "step": 20250 - }, - { - "epoch": 17.56, - "learning_rate": 2.6189510489510487e-06, - "loss": 0.4053, - "step": 20260 - }, - { - "epoch": 17.56, - "learning_rate": 2.6182517482517482e-06, - "loss": 0.4198, - "step": 20270 - }, - { - "epoch": 17.57, - "learning_rate": 2.6175524475524473e-06, - "loss": 0.4458, - "step": 20280 - }, - { - "epoch": 17.58, - "learning_rate": 2.616853146853147e-06, - "loss": 0.3737, - "step": 20290 - }, - { - "epoch": 17.59, - "learning_rate": 2.6161538461538463e-06, - "loss": 0.385, - "step": 20300 - }, - { - "epoch": 17.6, - "learning_rate": 2.615454545454545e-06, - "loss": 0.3633, - "step": 20310 - }, - { - "epoch": 17.61, - "learning_rate": 2.6147552447552444e-06, - "loss": 0.3667, - "step": 20320 - }, - { - "epoch": 17.62, - "learning_rate": 2.614055944055944e-06, - "loss": 0.3878, - "step": 20330 - }, - { - "epoch": 17.63, - "learning_rate": 2.6133566433566434e-06, - "loss": 0.3853, - "step": 20340 - }, - { - "epoch": 17.63, - "learning_rate": 2.6126573426573425e-06, - "loss": 0.3476, - "step": 20350 - }, - { - "epoch": 17.64, - "learning_rate": 2.611958041958042e-06, - "loss": 0.3953, - "step": 20360 - }, - { - "epoch": 17.65, - "learning_rate": 2.611258741258741e-06, - "loss": 0.4068, - "step": 20370 - }, - { - "epoch": 17.66, - "learning_rate": 2.6105594405594406e-06, - "loss": 0.4064, - "step": 20380 - }, - { - "epoch": 17.67, - "learning_rate": 2.6098601398601396e-06, - "loss": 0.3617, - "step": 20390 - }, - { - "epoch": 17.68, - "learning_rate": 2.609160839160839e-06, - "loss": 0.376, - "step": 20400 - }, - { - "epoch": 17.69, - "learning_rate": 2.6084615384615386e-06, - "loss": 0.4201, - "step": 20410 - }, - { - "epoch": 17.69, - "learning_rate": 2.6077622377622373e-06, - "loss": 0.4321, - "step": 20420 - }, - { - "epoch": 17.7, - "learning_rate": 2.6070629370629368e-06, - "loss": 0.3209, - "step": 20430 - }, - { - "epoch": 17.71, - "learning_rate": 2.6063636363636363e-06, - "loss": 0.3947, - "step": 20440 - }, - { - "epoch": 17.72, - "learning_rate": 2.6056643356643358e-06, - "loss": 0.4086, - "step": 20450 - }, - { - "epoch": 17.73, - "learning_rate": 2.604965034965035e-06, - "loss": 0.4005, - "step": 20460 - }, - { - "epoch": 17.74, - "learning_rate": 2.6042657342657343e-06, - "loss": 0.4692, - "step": 20470 - }, - { - "epoch": 17.75, - "learning_rate": 2.6035664335664334e-06, - "loss": 0.3993, - "step": 20480 - }, - { - "epoch": 17.76, - "learning_rate": 2.6028671328671325e-06, - "loss": 0.3955, - "step": 20490 - }, - { - "epoch": 17.76, - "learning_rate": 2.602167832167832e-06, - "loss": 0.3767, - "step": 20500 - }, - { - "epoch": 17.77, - "learning_rate": 2.6014685314685315e-06, - "loss": 0.3714, - "step": 20510 - }, - { - "epoch": 17.78, - "learning_rate": 2.600769230769231e-06, - "loss": 0.4252, - "step": 20520 - }, - { - "epoch": 17.79, - "learning_rate": 2.6000699300699296e-06, - "loss": 0.3484, - "step": 20530 - }, - { - "epoch": 17.8, - "learning_rate": 2.599370629370629e-06, - "loss": 0.4087, - "step": 20540 - }, - { - "epoch": 17.81, - "learning_rate": 2.5986713286713286e-06, - "loss": 0.4252, - "step": 20550 - }, - { - "epoch": 17.82, - "learning_rate": 2.5979720279720277e-06, - "loss": 0.427, - "step": 20560 - }, - { - "epoch": 17.82, - "learning_rate": 2.597272727272727e-06, - "loss": 0.3832, - "step": 20570 - }, - { - "epoch": 17.83, - "learning_rate": 2.5965734265734263e-06, - "loss": 0.4301, - "step": 20580 - }, - { - "epoch": 17.84, - "learning_rate": 2.5958741258741258e-06, - "loss": 0.4196, - "step": 20590 - }, - { - "epoch": 17.85, - "learning_rate": 2.595174825174825e-06, - "loss": 0.3853, - "step": 20600 - }, - { - "epoch": 17.86, - "learning_rate": 2.5944755244755243e-06, - "loss": 0.4572, - "step": 20610 - }, - { - "epoch": 17.87, - "learning_rate": 2.593776223776224e-06, - "loss": 0.4236, - "step": 20620 - }, - { - "epoch": 17.88, - "learning_rate": 2.5930769230769233e-06, - "loss": 0.3852, - "step": 20630 - }, - { - "epoch": 17.89, - "learning_rate": 2.592377622377622e-06, - "loss": 0.3795, - "step": 20640 - }, - { - "epoch": 17.89, - "learning_rate": 2.5916783216783215e-06, - "loss": 0.4265, - "step": 20650 - }, - { - "epoch": 17.9, - "learning_rate": 2.590979020979021e-06, - "loss": 0.4455, - "step": 20660 - }, - { - "epoch": 17.91, - "learning_rate": 2.59027972027972e-06, - "loss": 0.4368, - "step": 20670 - }, - { - "epoch": 17.92, - "learning_rate": 2.5895804195804195e-06, - "loss": 0.4364, - "step": 20680 - }, - { - "epoch": 17.93, - "learning_rate": 2.5888811188811186e-06, - "loss": 0.4531, - "step": 20690 - }, - { - "epoch": 17.94, - "learning_rate": 2.588181818181818e-06, - "loss": 0.39, - "step": 20700 - }, - { - "epoch": 17.95, - "learning_rate": 2.587482517482517e-06, - "loss": 0.3788, - "step": 20710 - }, - { - "epoch": 17.95, - "learning_rate": 2.5867832167832167e-06, - "loss": 0.3861, - "step": 20720 - }, - { - "epoch": 17.96, - "learning_rate": 2.586083916083916e-06, - "loss": 0.385, - "step": 20730 - }, - { - "epoch": 17.97, - "learning_rate": 2.5853846153846153e-06, - "loss": 0.369, - "step": 20740 - }, - { - "epoch": 17.98, - "learning_rate": 2.5846853146853143e-06, - "loss": 0.4202, - "step": 20750 - }, - { - "epoch": 17.99, - "learning_rate": 2.583986013986014e-06, - "loss": 0.3634, - "step": 20760 - }, - { - "epoch": 18.0, - "learning_rate": 2.5832867132867133e-06, - "loss": 0.4082, - "step": 20770 - }, - { - "epoch": 18.0, - "eval_loss": 0.560993492603302, - "eval_runtime": 134.8261, - "eval_samples_per_second": 3.946, - "eval_steps_per_second": 1.973, - "eval_wer": 0.2528122388635341, - "step": 20772 - }, - { - "epoch": 18.01, - "learning_rate": 2.5825874125874124e-06, - "loss": 0.427, - "step": 20780 - }, - { - "epoch": 18.02, - "learning_rate": 2.581888111888112e-06, - "loss": 0.3963, - "step": 20790 - }, - { - "epoch": 18.02, - "learning_rate": 2.581188811188811e-06, - "loss": 0.3682, - "step": 20800 - }, - { - "epoch": 18.03, - "learning_rate": 2.5804895104895105e-06, - "loss": 0.4136, - "step": 20810 - }, - { - "epoch": 18.04, - "learning_rate": 2.5797902097902095e-06, - "loss": 0.4609, - "step": 20820 - }, - { - "epoch": 18.05, - "learning_rate": 2.579090909090909e-06, - "loss": 0.3814, - "step": 20830 - }, - { - "epoch": 18.06, - "learning_rate": 2.5783916083916085e-06, - "loss": 0.3502, - "step": 20840 - }, - { - "epoch": 18.07, - "learning_rate": 2.577692307692307e-06, - "loss": 0.4283, - "step": 20850 - }, - { - "epoch": 18.08, - "learning_rate": 2.5769930069930067e-06, - "loss": 0.3669, - "step": 20860 - }, - { - "epoch": 18.08, - "learning_rate": 2.576293706293706e-06, - "loss": 0.4066, - "step": 20870 - }, - { - "epoch": 18.09, - "learning_rate": 2.5755944055944057e-06, - "loss": 0.4107, - "step": 20880 - }, - { - "epoch": 18.1, - "learning_rate": 2.5748951048951047e-06, - "loss": 0.3645, - "step": 20890 - }, - { - "epoch": 18.11, - "learning_rate": 2.5741958041958042e-06, - "loss": 0.3502, - "step": 20900 - }, - { - "epoch": 18.12, - "learning_rate": 2.5734965034965033e-06, - "loss": 0.4241, - "step": 20910 - }, - { - "epoch": 18.13, - "learning_rate": 2.5727972027972024e-06, - "loss": 0.3582, - "step": 20920 - }, - { - "epoch": 18.14, - "learning_rate": 2.572097902097902e-06, - "loss": 0.3864, - "step": 20930 - }, - { - "epoch": 18.15, - "learning_rate": 2.5713986013986014e-06, - "loss": 0.3675, - "step": 20940 - }, - { - "epoch": 18.15, - "learning_rate": 2.570699300699301e-06, - "loss": 0.3774, - "step": 20950 - }, - { - "epoch": 18.16, - "learning_rate": 2.5699999999999995e-06, - "loss": 0.4393, - "step": 20960 - }, - { - "epoch": 18.17, - "learning_rate": 2.569300699300699e-06, - "loss": 0.4115, - "step": 20970 - }, - { - "epoch": 18.18, - "learning_rate": 2.5686013986013985e-06, - "loss": 0.3484, - "step": 20980 - }, - { - "epoch": 18.19, - "learning_rate": 2.567902097902098e-06, - "loss": 0.3803, - "step": 20990 - }, - { - "epoch": 18.2, - "learning_rate": 2.567202797202797e-06, - "loss": 0.3447, - "step": 21000 - }, - { - "epoch": 18.21, - "learning_rate": 2.5665034965034966e-06, - "loss": 0.4175, - "step": 21010 - }, - { - "epoch": 18.21, - "learning_rate": 2.5658041958041957e-06, - "loss": 0.4695, - "step": 21020 - }, - { - "epoch": 18.22, - "learning_rate": 2.5651048951048947e-06, - "loss": 0.4124, - "step": 21030 - }, - { - "epoch": 18.23, - "learning_rate": 2.5644055944055942e-06, - "loss": 0.3712, - "step": 21040 - }, - { - "epoch": 18.24, - "learning_rate": 2.5637062937062937e-06, - "loss": 0.5031, - "step": 21050 - }, - { - "epoch": 18.25, - "learning_rate": 2.5630069930069932e-06, - "loss": 0.3665, - "step": 21060 - }, - { - "epoch": 18.26, - "learning_rate": 2.562307692307692e-06, - "loss": 0.3783, - "step": 21070 - }, - { - "epoch": 18.27, - "learning_rate": 2.5616083916083914e-06, - "loss": 0.4238, - "step": 21080 - }, - { - "epoch": 18.28, - "learning_rate": 2.560909090909091e-06, - "loss": 0.3632, - "step": 21090 - }, - { - "epoch": 18.28, - "learning_rate": 2.56020979020979e-06, - "loss": 0.4002, - "step": 21100 - }, - { - "epoch": 18.29, - "learning_rate": 2.5595104895104894e-06, - "loss": 0.3893, - "step": 21110 - }, - { - "epoch": 18.3, - "learning_rate": 2.558811188811189e-06, - "loss": 0.4453, - "step": 21120 - }, - { - "epoch": 18.31, - "learning_rate": 2.558111888111888e-06, - "loss": 0.3853, - "step": 21130 - }, - { - "epoch": 18.32, - "learning_rate": 2.557412587412587e-06, - "loss": 0.4136, - "step": 21140 - }, - { - "epoch": 18.33, - "learning_rate": 2.5567132867132866e-06, - "loss": 0.3396, - "step": 21150 - }, - { - "epoch": 18.34, - "learning_rate": 2.556013986013986e-06, - "loss": 0.373, - "step": 21160 - }, - { - "epoch": 18.34, - "learning_rate": 2.5553146853146856e-06, - "loss": 0.4376, - "step": 21170 - }, - { - "epoch": 18.35, - "learning_rate": 2.5546153846153842e-06, - "loss": 0.3995, - "step": 21180 - }, - { - "epoch": 18.36, - "learning_rate": 2.5539160839160837e-06, - "loss": 0.3925, - "step": 21190 - }, - { - "epoch": 18.37, - "learning_rate": 2.5532167832167832e-06, - "loss": 0.3515, - "step": 21200 - }, - { - "epoch": 18.38, - "learning_rate": 2.5525174825174823e-06, - "loss": 0.4145, - "step": 21210 - }, - { - "epoch": 18.39, - "learning_rate": 2.551818181818182e-06, - "loss": 0.3953, - "step": 21220 - }, - { - "epoch": 18.4, - "learning_rate": 2.551118881118881e-06, - "loss": 0.4111, - "step": 21230 - }, - { - "epoch": 18.41, - "learning_rate": 2.5504195804195804e-06, - "loss": 0.3434, - "step": 21240 - }, - { - "epoch": 18.41, - "learning_rate": 2.5497202797202794e-06, - "loss": 0.4359, - "step": 21250 - }, - { - "epoch": 18.42, - "learning_rate": 2.549020979020979e-06, - "loss": 0.3937, - "step": 21260 - }, - { - "epoch": 18.43, - "learning_rate": 2.5483216783216784e-06, - "loss": 0.3623, - "step": 21270 - }, - { - "epoch": 18.44, - "learning_rate": 2.5476223776223775e-06, - "loss": 0.3874, - "step": 21280 - }, - { - "epoch": 18.45, - "learning_rate": 2.5469230769230766e-06, - "loss": 0.4689, - "step": 21290 - }, - { - "epoch": 18.46, - "learning_rate": 2.546223776223776e-06, - "loss": 0.3915, - "step": 21300 - }, - { - "epoch": 18.47, - "learning_rate": 2.5455244755244756e-06, - "loss": 0.411, - "step": 21310 - }, - { - "epoch": 18.47, - "learning_rate": 2.5448251748251746e-06, - "loss": 0.4007, - "step": 21320 - }, - { - "epoch": 18.48, - "learning_rate": 2.544125874125874e-06, - "loss": 0.362, - "step": 21330 - }, - { - "epoch": 18.49, - "learning_rate": 2.5434265734265732e-06, - "loss": 0.4242, - "step": 21340 - }, - { - "epoch": 18.5, - "learning_rate": 2.5427272727272727e-06, - "loss": 0.3352, - "step": 21350 - }, - { - "epoch": 18.51, - "learning_rate": 2.542027972027972e-06, - "loss": 0.3417, - "step": 21360 - }, - { - "epoch": 18.52, - "learning_rate": 2.5413286713286713e-06, - "loss": 0.3786, - "step": 21370 - }, - { - "epoch": 18.53, - "learning_rate": 2.5406293706293708e-06, - "loss": 0.3854, - "step": 21380 - }, - { - "epoch": 18.54, - "learning_rate": 2.5399300699300694e-06, - "loss": 0.4607, - "step": 21390 - }, - { - "epoch": 18.54, - "learning_rate": 2.539230769230769e-06, - "loss": 0.345, - "step": 21400 - }, - { - "epoch": 18.55, - "learning_rate": 2.5385314685314684e-06, - "loss": 0.3871, - "step": 21410 - }, - { - "epoch": 18.56, - "learning_rate": 2.537832167832168e-06, - "loss": 0.4067, - "step": 21420 - }, - { - "epoch": 18.57, - "learning_rate": 2.537132867132867e-06, - "loss": 0.3858, - "step": 21430 - }, - { - "epoch": 18.58, - "learning_rate": 2.5364335664335665e-06, - "loss": 0.4136, - "step": 21440 - }, - { - "epoch": 18.59, - "learning_rate": 2.5357342657342656e-06, - "loss": 0.3779, - "step": 21450 - }, - { - "epoch": 18.6, - "learning_rate": 2.5350349650349646e-06, - "loss": 0.3737, - "step": 21460 - }, - { - "epoch": 18.6, - "learning_rate": 2.534335664335664e-06, - "loss": 0.4113, - "step": 21470 - }, - { - "epoch": 18.61, - "learning_rate": 2.5336363636363636e-06, - "loss": 0.354, - "step": 21480 - }, - { - "epoch": 18.62, - "learning_rate": 2.532937062937063e-06, - "loss": 0.383, - "step": 21490 - }, - { - "epoch": 18.63, - "learning_rate": 2.5322377622377618e-06, - "loss": 0.3859, - "step": 21500 - }, - { - "epoch": 18.64, - "learning_rate": 2.5315384615384613e-06, - "loss": 0.3904, - "step": 21510 - }, - { - "epoch": 18.65, - "learning_rate": 2.5308391608391608e-06, - "loss": 0.381, - "step": 21520 - }, - { - "epoch": 18.66, - "learning_rate": 2.53013986013986e-06, - "loss": 0.4758, - "step": 21530 - }, - { - "epoch": 18.67, - "learning_rate": 2.5294405594405593e-06, - "loss": 0.4253, - "step": 21540 - }, - { - "epoch": 18.67, - "learning_rate": 2.528741258741259e-06, - "loss": 0.3751, - "step": 21550 - }, - { - "epoch": 18.68, - "learning_rate": 2.528041958041958e-06, - "loss": 0.3658, - "step": 21560 - }, - { - "epoch": 18.69, - "learning_rate": 2.527342657342657e-06, - "loss": 0.4032, - "step": 21570 - }, - { - "epoch": 18.7, - "learning_rate": 2.5266433566433565e-06, - "loss": 0.3402, - "step": 21580 - }, - { - "epoch": 18.71, - "learning_rate": 2.525944055944056e-06, - "loss": 0.364, - "step": 21590 - }, - { - "epoch": 18.72, - "learning_rate": 2.5252447552447555e-06, - "loss": 0.3297, - "step": 21600 - }, - { - "epoch": 18.73, - "learning_rate": 2.524545454545454e-06, - "loss": 0.456, - "step": 21610 - }, - { - "epoch": 18.73, - "learning_rate": 2.5238461538461536e-06, - "loss": 0.4218, - "step": 21620 - }, - { - "epoch": 18.74, - "learning_rate": 2.523146853146853e-06, - "loss": 0.3752, - "step": 21630 - }, - { - "epoch": 18.75, - "learning_rate": 2.522447552447552e-06, - "loss": 0.3573, - "step": 21640 - }, - { - "epoch": 18.76, - "learning_rate": 2.5217482517482517e-06, - "loss": 0.3968, - "step": 21650 - }, - { - "epoch": 18.77, - "learning_rate": 2.521048951048951e-06, - "loss": 0.3725, - "step": 21660 - }, - { - "epoch": 18.78, - "learning_rate": 2.5203496503496503e-06, - "loss": 0.3844, - "step": 21670 - }, - { - "epoch": 18.79, - "learning_rate": 2.5196503496503493e-06, - "loss": 0.4076, - "step": 21680 - }, - { - "epoch": 18.8, - "learning_rate": 2.518951048951049e-06, - "loss": 0.4098, - "step": 21690 - }, - { - "epoch": 18.8, - "learning_rate": 2.5182517482517483e-06, - "loss": 0.3585, - "step": 21700 - }, - { - "epoch": 18.81, - "learning_rate": 2.5175524475524474e-06, - "loss": 0.4506, - "step": 21710 - }, - { - "epoch": 18.82, - "learning_rate": 2.5168531468531465e-06, - "loss": 0.4148, - "step": 21720 - }, - { - "epoch": 18.83, - "learning_rate": 2.516153846153846e-06, - "loss": 0.3211, - "step": 21730 - }, - { - "epoch": 18.84, - "learning_rate": 2.5154545454545455e-06, - "loss": 0.3571, - "step": 21740 - }, - { - "epoch": 18.85, - "learning_rate": 2.5147552447552445e-06, - "loss": 0.378, - "step": 21750 - }, - { - "epoch": 18.86, - "learning_rate": 2.514055944055944e-06, - "loss": 0.4275, - "step": 21760 - }, - { - "epoch": 18.86, - "learning_rate": 2.513356643356643e-06, - "loss": 0.4126, - "step": 21770 - }, - { - "epoch": 18.87, - "learning_rate": 2.5126573426573426e-06, - "loss": 0.4135, - "step": 21780 - }, - { - "epoch": 18.88, - "learning_rate": 2.5119580419580417e-06, - "loss": 0.3731, - "step": 21790 - }, - { - "epoch": 18.89, - "learning_rate": 2.511258741258741e-06, - "loss": 0.3684, - "step": 21800 - }, - { - "epoch": 18.9, - "learning_rate": 2.5105594405594407e-06, - "loss": 0.346, - "step": 21810 - }, - { - "epoch": 18.91, - "learning_rate": 2.5098601398601398e-06, - "loss": 0.3587, - "step": 21820 - }, - { - "epoch": 18.92, - "learning_rate": 2.509160839160839e-06, - "loss": 0.4568, - "step": 21830 - }, - { - "epoch": 18.93, - "learning_rate": 2.5084615384615383e-06, - "loss": 0.4482, - "step": 21840 - }, - { - "epoch": 18.93, - "learning_rate": 2.507762237762238e-06, - "loss": 0.3697, - "step": 21850 - }, - { - "epoch": 18.94, - "learning_rate": 2.507062937062937e-06, - "loss": 0.3989, - "step": 21860 - }, - { - "epoch": 18.95, - "learning_rate": 2.5063636363636364e-06, - "loss": 0.4218, - "step": 21870 - }, - { - "epoch": 18.96, - "learning_rate": 2.5056643356643355e-06, - "loss": 0.3684, - "step": 21880 - }, - { - "epoch": 18.97, - "learning_rate": 2.5049650349650345e-06, - "loss": 0.4327, - "step": 21890 - }, - { - "epoch": 18.98, - "learning_rate": 2.504265734265734e-06, - "loss": 0.4212, - "step": 21900 - }, - { - "epoch": 18.99, - "learning_rate": 2.5035664335664335e-06, - "loss": 0.3928, - "step": 21910 - }, - { - "epoch": 18.99, - "learning_rate": 2.502867132867133e-06, - "loss": 0.4316, - "step": 21920 - }, - { - "epoch": 19.0, - "eval_loss": 0.5407825112342834, - "eval_runtime": 135.3965, - "eval_samples_per_second": 3.929, - "eval_steps_per_second": 1.965, - "eval_wer": 0.2506910072636112, - "step": 21926 - }, - { - "epoch": 19.0, - "learning_rate": 2.502167832167832e-06, - "loss": 0.389, - "step": 21930 - }, - { - "epoch": 19.01, - "learning_rate": 2.501468531468531e-06, - "loss": 0.3784, - "step": 21940 - }, - { - "epoch": 19.02, - "learning_rate": 2.5007692307692307e-06, - "loss": 0.3543, - "step": 21950 - }, - { - "epoch": 19.03, - "learning_rate": 2.50006993006993e-06, - "loss": 0.4176, - "step": 21960 - }, - { - "epoch": 19.04, - "learning_rate": 2.4993706293706292e-06, - "loss": 0.4456, - "step": 21970 - }, - { - "epoch": 19.05, - "learning_rate": 2.4986713286713287e-06, - "loss": 0.432, - "step": 21980 - }, - { - "epoch": 19.06, - "learning_rate": 2.497972027972028e-06, - "loss": 0.4524, - "step": 21990 - }, - { - "epoch": 19.06, - "learning_rate": 2.497272727272727e-06, - "loss": 0.3371, - "step": 22000 - }, - { - "epoch": 19.07, - "learning_rate": 2.4965734265734264e-06, - "loss": 0.3873, - "step": 22010 - }, - { - "epoch": 19.08, - "learning_rate": 2.495874125874126e-06, - "loss": 0.3631, - "step": 22020 - }, - { - "epoch": 19.09, - "learning_rate": 2.4951748251748254e-06, - "loss": 0.3886, - "step": 22030 - }, - { - "epoch": 19.1, - "learning_rate": 2.494475524475524e-06, - "loss": 0.3754, - "step": 22040 - }, - { - "epoch": 19.11, - "learning_rate": 2.4937762237762235e-06, - "loss": 0.425, - "step": 22050 - }, - { - "epoch": 19.12, - "learning_rate": 2.493076923076923e-06, - "loss": 0.3737, - "step": 22060 - }, - { - "epoch": 19.12, - "learning_rate": 2.492377622377622e-06, - "loss": 0.4261, - "step": 22070 - }, - { - "epoch": 19.13, - "learning_rate": 2.4916783216783216e-06, - "loss": 0.3958, - "step": 22080 - }, - { - "epoch": 19.14, - "learning_rate": 2.490979020979021e-06, - "loss": 0.3736, - "step": 22090 - }, - { - "epoch": 19.15, - "learning_rate": 2.49027972027972e-06, - "loss": 0.3276, - "step": 22100 - }, - { - "epoch": 19.16, - "learning_rate": 2.4895804195804192e-06, - "loss": 0.3589, - "step": 22110 - }, - { - "epoch": 19.17, - "learning_rate": 2.4888811188811187e-06, - "loss": 0.4129, - "step": 22120 - }, - { - "epoch": 19.18, - "learning_rate": 2.4881818181818182e-06, - "loss": 0.3523, - "step": 22130 - }, - { - "epoch": 19.19, - "learning_rate": 2.4874825174825177e-06, - "loss": 0.4183, - "step": 22140 - }, - { - "epoch": 19.19, - "learning_rate": 2.4867832167832164e-06, - "loss": 0.3582, - "step": 22150 - }, - { - "epoch": 19.2, - "learning_rate": 2.486083916083916e-06, - "loss": 0.387, - "step": 22160 - }, - { - "epoch": 19.21, - "learning_rate": 2.4853846153846154e-06, - "loss": 0.412, - "step": 22170 - }, - { - "epoch": 19.22, - "learning_rate": 2.4846853146853144e-06, - "loss": 0.3966, - "step": 22180 - }, - { - "epoch": 19.23, - "learning_rate": 2.483986013986014e-06, - "loss": 0.4483, - "step": 22190 - }, - { - "epoch": 19.24, - "learning_rate": 2.4832867132867134e-06, - "loss": 0.3605, - "step": 22200 - }, - { - "epoch": 19.25, - "learning_rate": 2.4825874125874125e-06, - "loss": 0.4112, - "step": 22210 - }, - { - "epoch": 19.25, - "learning_rate": 2.4818881118881116e-06, - "loss": 0.3792, - "step": 22220 - }, - { - "epoch": 19.26, - "learning_rate": 2.481188811188811e-06, - "loss": 0.3607, - "step": 22230 - }, - { - "epoch": 19.27, - "learning_rate": 2.4804895104895106e-06, - "loss": 0.4215, - "step": 22240 - }, - { - "epoch": 19.28, - "learning_rate": 2.4797902097902097e-06, - "loss": 0.4503, - "step": 22250 - }, - { - "epoch": 19.29, - "learning_rate": 2.4790909090909087e-06, - "loss": 0.4321, - "step": 22260 - }, - { - "epoch": 19.3, - "learning_rate": 2.4783916083916082e-06, - "loss": 0.367, - "step": 22270 - }, - { - "epoch": 19.31, - "learning_rate": 2.4776923076923077e-06, - "loss": 0.3698, - "step": 22280 - }, - { - "epoch": 19.32, - "learning_rate": 2.476993006993007e-06, - "loss": 0.3944, - "step": 22290 - }, - { - "epoch": 19.32, - "learning_rate": 2.4762937062937063e-06, - "loss": 0.3623, - "step": 22300 - }, - { - "epoch": 19.33, - "learning_rate": 2.4755944055944058e-06, - "loss": 0.408, - "step": 22310 - }, - { - "epoch": 19.34, - "learning_rate": 2.474895104895105e-06, - "loss": 0.4196, - "step": 22320 - }, - { - "epoch": 19.35, - "learning_rate": 2.474195804195804e-06, - "loss": 0.367, - "step": 22330 - }, - { - "epoch": 19.36, - "learning_rate": 2.4734965034965034e-06, - "loss": 0.3914, - "step": 22340 - }, - { - "epoch": 19.37, - "learning_rate": 2.472797202797203e-06, - "loss": 0.4052, - "step": 22350 - }, - { - "epoch": 19.38, - "learning_rate": 2.472097902097902e-06, - "loss": 0.3447, - "step": 22360 - }, - { - "epoch": 19.38, - "learning_rate": 2.471398601398601e-06, - "loss": 0.4061, - "step": 22370 - }, - { - "epoch": 19.39, - "learning_rate": 2.4706993006993006e-06, - "loss": 0.4787, - "step": 22380 - }, - { - "epoch": 19.4, - "learning_rate": 2.47e-06, - "loss": 0.4053, - "step": 22390 - }, - { - "epoch": 19.41, - "learning_rate": 2.469300699300699e-06, - "loss": 0.3524, - "step": 22400 - }, - { - "epoch": 19.42, - "learning_rate": 2.4686013986013986e-06, - "loss": 0.4586, - "step": 22410 - }, - { - "epoch": 19.43, - "learning_rate": 2.4679020979020977e-06, - "loss": 0.3858, - "step": 22420 - }, - { - "epoch": 19.44, - "learning_rate": 2.4672027972027968e-06, - "loss": 0.3866, - "step": 22430 - }, - { - "epoch": 19.45, - "learning_rate": 2.4665034965034963e-06, - "loss": 0.354, - "step": 22440 - }, - { - "epoch": 19.45, - "learning_rate": 2.4658041958041958e-06, - "loss": 0.3874, - "step": 22450 - }, - { - "epoch": 19.46, - "learning_rate": 2.4651048951048953e-06, - "loss": 0.4058, - "step": 22460 - }, - { - "epoch": 19.47, - "learning_rate": 2.4644055944055943e-06, - "loss": 0.4326, - "step": 22470 - }, - { - "epoch": 19.48, - "learning_rate": 2.4637062937062934e-06, - "loss": 0.3791, - "step": 22480 - }, - { - "epoch": 19.49, - "learning_rate": 2.463006993006993e-06, - "loss": 0.4037, - "step": 22490 - }, - { - "epoch": 19.5, - "learning_rate": 2.462307692307692e-06, - "loss": 0.391, - "step": 22500 - }, - { - "epoch": 19.51, - "learning_rate": 2.4616083916083915e-06, - "loss": 0.403, - "step": 22510 - }, - { - "epoch": 19.51, - "learning_rate": 2.460909090909091e-06, - "loss": 0.3796, - "step": 22520 - }, - { - "epoch": 19.52, - "learning_rate": 2.46020979020979e-06, - "loss": 0.4075, - "step": 22530 - }, - { - "epoch": 19.53, - "learning_rate": 2.459510489510489e-06, - "loss": 0.442, - "step": 22540 - }, - { - "epoch": 19.54, - "learning_rate": 2.4588111888111886e-06, - "loss": 0.3926, - "step": 22550 - }, - { - "epoch": 19.55, - "learning_rate": 2.458111888111888e-06, - "loss": 0.3807, - "step": 22560 - }, - { - "epoch": 19.56, - "learning_rate": 2.4574125874125876e-06, - "loss": 0.4076, - "step": 22570 - }, - { - "epoch": 19.57, - "learning_rate": 2.4567132867132863e-06, - "loss": 0.4484, - "step": 22580 - }, - { - "epoch": 19.58, - "learning_rate": 2.4560139860139858e-06, - "loss": 0.3222, - "step": 22590 - }, - { - "epoch": 19.58, - "learning_rate": 2.4553146853146853e-06, - "loss": 0.4182, - "step": 22600 - }, - { - "epoch": 19.59, - "learning_rate": 2.4546153846153843e-06, - "loss": 0.3973, - "step": 22610 - }, - { - "epoch": 19.6, - "learning_rate": 2.453916083916084e-06, - "loss": 0.4256, - "step": 22620 - }, - { - "epoch": 19.61, - "learning_rate": 2.4532167832167833e-06, - "loss": 0.4119, - "step": 22630 - }, - { - "epoch": 19.62, - "learning_rate": 2.4525174825174824e-06, - "loss": 0.3956, - "step": 22640 - }, - { - "epoch": 19.63, - "learning_rate": 2.4518181818181815e-06, - "loss": 0.3509, - "step": 22650 - }, - { - "epoch": 19.64, - "learning_rate": 2.451118881118881e-06, - "loss": 0.3464, - "step": 22660 - }, - { - "epoch": 19.64, - "learning_rate": 2.4504195804195805e-06, - "loss": 0.4038, - "step": 22670 - }, - { - "epoch": 19.65, - "learning_rate": 2.4497202797202796e-06, - "loss": 0.3272, - "step": 22680 - }, - { - "epoch": 19.66, - "learning_rate": 2.4490209790209786e-06, - "loss": 0.3358, - "step": 22690 - }, - { - "epoch": 19.67, - "learning_rate": 2.448321678321678e-06, - "loss": 0.4066, - "step": 22700 - }, - { - "epoch": 19.68, - "learning_rate": 2.4476223776223776e-06, - "loss": 0.3879, - "step": 22710 - }, - { - "epoch": 19.69, - "learning_rate": 2.4469230769230767e-06, - "loss": 0.3762, - "step": 22720 - }, - { - "epoch": 19.7, - "learning_rate": 2.446223776223776e-06, - "loss": 0.4083, - "step": 22730 - }, - { - "epoch": 19.71, - "learning_rate": 2.4455244755244757e-06, - "loss": 0.4895, - "step": 22740 - }, - { - "epoch": 19.71, - "learning_rate": 2.4448251748251748e-06, - "loss": 0.3472, - "step": 22750 - }, - { - "epoch": 19.72, - "learning_rate": 2.444125874125874e-06, - "loss": 0.3847, - "step": 22760 - }, - { - "epoch": 19.73, - "learning_rate": 2.4434265734265733e-06, - "loss": 0.4201, - "step": 22770 - }, - { - "epoch": 19.74, - "learning_rate": 2.442727272727273e-06, - "loss": 0.3952, - "step": 22780 - }, - { - "epoch": 19.75, - "learning_rate": 2.442027972027972e-06, - "loss": 0.3627, - "step": 22790 - }, - { - "epoch": 19.76, - "learning_rate": 2.441328671328671e-06, - "loss": 0.3866, - "step": 22800 - }, - { - "epoch": 19.77, - "learning_rate": 2.4406293706293705e-06, - "loss": 0.4224, - "step": 22810 - }, - { - "epoch": 19.77, - "learning_rate": 2.43993006993007e-06, - "loss": 0.4178, - "step": 22820 - }, - { - "epoch": 19.78, - "learning_rate": 2.439230769230769e-06, - "loss": 0.4198, - "step": 22830 - }, - { - "epoch": 19.79, - "learning_rate": 2.4385314685314685e-06, - "loss": 0.3951, - "step": 22840 - }, - { - "epoch": 19.8, - "learning_rate": 2.437832167832168e-06, - "loss": 0.3302, - "step": 22850 - }, - { - "epoch": 19.81, - "learning_rate": 2.437202797202797e-06, - "loss": 0.3735, - "step": 22860 - }, - { - "epoch": 19.82, - "learning_rate": 2.4365034965034966e-06, - "loss": 0.4324, - "step": 22870 - }, - { - "epoch": 19.83, - "learning_rate": 2.4358041958041956e-06, - "loss": 0.3774, - "step": 22880 - }, - { - "epoch": 19.83, - "learning_rate": 2.4351048951048947e-06, - "loss": 0.3634, - "step": 22890 - }, - { - "epoch": 19.84, - "learning_rate": 2.4344055944055942e-06, - "loss": 0.3314, - "step": 22900 - }, - { - "epoch": 19.85, - "learning_rate": 2.4337062937062937e-06, - "loss": 0.412, - "step": 22910 - }, - { - "epoch": 19.86, - "learning_rate": 2.4330069930069928e-06, - "loss": 0.4328, - "step": 22920 - }, - { - "epoch": 19.87, - "learning_rate": 2.4323076923076923e-06, - "loss": 0.4351, - "step": 22930 - }, - { - "epoch": 19.88, - "learning_rate": 2.4316083916083918e-06, - "loss": 0.3949, - "step": 22940 - }, - { - "epoch": 19.89, - "learning_rate": 2.430909090909091e-06, - "loss": 0.3694, - "step": 22950 - }, - { - "epoch": 19.9, - "learning_rate": 2.43020979020979e-06, - "loss": 0.4665, - "step": 22960 - }, - { - "epoch": 19.9, - "learning_rate": 2.4295104895104894e-06, - "loss": 0.3563, - "step": 22970 - }, - { - "epoch": 19.91, - "learning_rate": 2.428811188811189e-06, - "loss": 0.3771, - "step": 22980 - }, - { - "epoch": 19.92, - "learning_rate": 2.428111888111888e-06, - "loss": 0.3597, - "step": 22990 - }, - { - "epoch": 19.93, - "learning_rate": 2.427412587412587e-06, - "loss": 0.4063, - "step": 23000 - }, - { - "epoch": 19.94, - "learning_rate": 2.4267132867132866e-06, - "loss": 0.3725, - "step": 23010 - }, - { - "epoch": 19.95, - "learning_rate": 2.426013986013986e-06, - "loss": 0.4306, - "step": 23020 - }, - { - "epoch": 19.96, - "learning_rate": 2.425314685314685e-06, - "loss": 0.3789, - "step": 23030 - }, - { - "epoch": 19.96, - "learning_rate": 2.4246153846153846e-06, - "loss": 0.4015, - "step": 23040 - }, - { - "epoch": 19.97, - "learning_rate": 2.423916083916084e-06, - "loss": 0.4076, - "step": 23050 - }, - { - "epoch": 19.98, - "learning_rate": 2.4232167832167828e-06, - "loss": 0.3486, - "step": 23060 - }, - { - "epoch": 19.99, - "learning_rate": 2.4225174825174823e-06, - "loss": 0.3632, - "step": 23070 - }, - { - "epoch": 20.0, - "learning_rate": 2.4218181818181818e-06, - "loss": 0.3136, - "step": 23080 - }, - { - "epoch": 20.0, - "eval_loss": 0.5591942071914673, - "eval_runtime": 134.7021, - "eval_samples_per_second": 3.949, - "eval_steps_per_second": 1.975, - "eval_wer": 0.25249084013627304, - "step": 23080 - }, - { - "epoch": 20.01, - "learning_rate": 2.4211188811188813e-06, - "loss": 0.3984, - "step": 23090 - }, - { - "epoch": 20.02, - "learning_rate": 2.4204195804195803e-06, - "loss": 0.4126, - "step": 23100 - }, - { - "epoch": 20.03, - "learning_rate": 2.4197202797202794e-06, - "loss": 0.4086, - "step": 23110 - }, - { - "epoch": 20.03, - "learning_rate": 2.419020979020979e-06, - "loss": 0.374, - "step": 23120 - }, - { - "epoch": 20.04, - "learning_rate": 2.418321678321678e-06, - "loss": 0.367, - "step": 23130 - }, - { - "epoch": 20.05, - "learning_rate": 2.4176223776223775e-06, - "loss": 0.3317, - "step": 23140 - }, - { - "epoch": 20.06, - "learning_rate": 2.416923076923077e-06, - "loss": 0.3914, - "step": 23150 - }, - { - "epoch": 20.07, - "learning_rate": 2.4162237762237765e-06, - "loss": 0.384, - "step": 23160 - }, - { - "epoch": 20.08, - "learning_rate": 2.415524475524475e-06, - "loss": 0.3982, - "step": 23170 - }, - { - "epoch": 20.09, - "learning_rate": 2.4148251748251746e-06, - "loss": 0.385, - "step": 23180 - }, - { - "epoch": 20.1, - "learning_rate": 2.414125874125874e-06, - "loss": 0.4257, - "step": 23190 - }, - { - "epoch": 20.1, - "learning_rate": 2.4134265734265736e-06, - "loss": 0.3899, - "step": 23200 - }, - { - "epoch": 20.11, - "learning_rate": 2.4127272727272727e-06, - "loss": 0.3788, - "step": 23210 - }, - { - "epoch": 20.12, - "learning_rate": 2.4120279720279718e-06, - "loss": 0.3876, - "step": 23220 - }, - { - "epoch": 20.13, - "learning_rate": 2.4113286713286713e-06, - "loss": 0.3267, - "step": 23230 - }, - { - "epoch": 20.14, - "learning_rate": 2.4106293706293703e-06, - "loss": 0.4032, - "step": 23240 - }, - { - "epoch": 20.15, - "learning_rate": 2.40993006993007e-06, - "loss": 0.3677, - "step": 23250 - }, - { - "epoch": 20.16, - "learning_rate": 2.4092307692307693e-06, - "loss": 0.3476, - "step": 23260 - }, - { - "epoch": 20.16, - "learning_rate": 2.4085314685314684e-06, - "loss": 0.3811, - "step": 23270 - }, - { - "epoch": 20.17, - "learning_rate": 2.4078321678321675e-06, - "loss": 0.4277, - "step": 23280 - }, - { - "epoch": 20.18, - "learning_rate": 2.407132867132867e-06, - "loss": 0.4007, - "step": 23290 - }, - { - "epoch": 20.19, - "learning_rate": 2.4064335664335665e-06, - "loss": 0.3914, - "step": 23300 - }, - { - "epoch": 20.2, - "learning_rate": 2.4057342657342655e-06, - "loss": 0.3485, - "step": 23310 - }, - { - "epoch": 20.21, - "learning_rate": 2.405034965034965e-06, - "loss": 0.3969, - "step": 23320 - }, - { - "epoch": 20.22, - "learning_rate": 2.404335664335664e-06, - "loss": 0.4566, - "step": 23330 - }, - { - "epoch": 20.23, - "learning_rate": 2.4036363636363636e-06, - "loss": 0.3597, - "step": 23340 - }, - { - "epoch": 20.23, - "learning_rate": 2.4029370629370627e-06, - "loss": 0.3356, - "step": 23350 - }, - { - "epoch": 20.24, - "learning_rate": 2.402237762237762e-06, - "loss": 0.3972, - "step": 23360 - }, - { - "epoch": 20.25, - "learning_rate": 2.4015384615384617e-06, - "loss": 0.3903, - "step": 23370 - }, - { - "epoch": 20.26, - "learning_rate": 2.4008391608391607e-06, - "loss": 0.3691, - "step": 23380 - }, - { - "epoch": 20.27, - "learning_rate": 2.40013986013986e-06, - "loss": 0.3839, - "step": 23390 - }, - { - "epoch": 20.28, - "learning_rate": 2.3994405594405593e-06, - "loss": 0.3857, - "step": 23400 - }, - { - "epoch": 20.29, - "learning_rate": 2.398741258741259e-06, - "loss": 0.4017, - "step": 23410 - }, - { - "epoch": 20.29, - "learning_rate": 2.398041958041958e-06, - "loss": 0.4107, - "step": 23420 - }, - { - "epoch": 20.3, - "learning_rate": 2.397342657342657e-06, - "loss": 0.3938, - "step": 23430 - }, - { - "epoch": 20.31, - "learning_rate": 2.3966433566433565e-06, - "loss": 0.3747, - "step": 23440 - }, - { - "epoch": 20.32, - "learning_rate": 2.395944055944056e-06, - "loss": 0.338, - "step": 23450 - }, - { - "epoch": 20.33, - "learning_rate": 2.395244755244755e-06, - "loss": 0.4039, - "step": 23460 - }, - { - "epoch": 20.34, - "learning_rate": 2.3945454545454545e-06, - "loss": 0.3897, - "step": 23470 - }, - { - "epoch": 20.35, - "learning_rate": 2.393846153846154e-06, - "loss": 0.3777, - "step": 23480 - }, - { - "epoch": 20.36, - "learning_rate": 2.3931468531468527e-06, - "loss": 0.3809, - "step": 23490 - }, - { - "epoch": 20.36, - "learning_rate": 2.392447552447552e-06, - "loss": 0.4123, - "step": 23500 - }, - { - "epoch": 20.37, - "learning_rate": 2.3917482517482517e-06, - "loss": 0.3184, - "step": 23510 - }, - { - "epoch": 20.38, - "learning_rate": 2.391048951048951e-06, - "loss": 0.4499, - "step": 23520 - }, - { - "epoch": 20.39, - "learning_rate": 2.3903496503496502e-06, - "loss": 0.3823, - "step": 23530 - }, - { - "epoch": 20.4, - "learning_rate": 2.3896503496503493e-06, - "loss": 0.3515, - "step": 23540 - }, - { - "epoch": 20.41, - "learning_rate": 2.388951048951049e-06, - "loss": 0.3879, - "step": 23550 - }, - { - "epoch": 20.42, - "learning_rate": 2.3882517482517483e-06, - "loss": 0.3481, - "step": 23560 - }, - { - "epoch": 20.42, - "learning_rate": 2.3875524475524474e-06, - "loss": 0.4421, - "step": 23570 - }, - { - "epoch": 20.43, - "learning_rate": 2.386853146853147e-06, - "loss": 0.4234, - "step": 23580 - }, - { - "epoch": 20.44, - "learning_rate": 2.3861538461538464e-06, - "loss": 0.3732, - "step": 23590 - }, - { - "epoch": 20.45, - "learning_rate": 2.385454545454545e-06, - "loss": 0.3774, - "step": 23600 - }, - { - "epoch": 20.46, - "learning_rate": 2.3847552447552445e-06, - "loss": 0.3846, - "step": 23610 - }, - { - "epoch": 20.47, - "learning_rate": 2.384055944055944e-06, - "loss": 0.4003, - "step": 23620 - }, - { - "epoch": 20.48, - "learning_rate": 2.3833566433566435e-06, - "loss": 0.4432, - "step": 23630 - }, - { - "epoch": 20.49, - "learning_rate": 2.3826573426573426e-06, - "loss": 0.4091, - "step": 23640 - }, - { - "epoch": 20.49, - "learning_rate": 2.3819580419580417e-06, - "loss": 0.4014, - "step": 23650 - }, - { - "epoch": 20.5, - "learning_rate": 2.381258741258741e-06, - "loss": 0.3904, - "step": 23660 - }, - { - "epoch": 20.51, - "learning_rate": 2.3805594405594402e-06, - "loss": 0.3942, - "step": 23670 - }, - { - "epoch": 20.52, - "learning_rate": 2.3798601398601397e-06, - "loss": 0.4678, - "step": 23680 - }, - { - "epoch": 20.53, - "learning_rate": 2.3791608391608392e-06, - "loss": 0.3161, - "step": 23690 - }, - { - "epoch": 20.54, - "learning_rate": 2.3784615384615387e-06, - "loss": 0.3986, - "step": 23700 - }, - { - "epoch": 20.55, - "learning_rate": 2.3777622377622374e-06, - "loss": 0.3756, - "step": 23710 - }, - { - "epoch": 20.55, - "learning_rate": 2.377062937062937e-06, - "loss": 0.4178, - "step": 23720 - }, - { - "epoch": 20.56, - "learning_rate": 2.3763636363636364e-06, - "loss": 0.3168, - "step": 23730 - }, - { - "epoch": 20.57, - "learning_rate": 2.375664335664336e-06, - "loss": 0.3617, - "step": 23740 - }, - { - "epoch": 20.58, - "learning_rate": 2.374965034965035e-06, - "loss": 0.4241, - "step": 23750 - }, - { - "epoch": 20.59, - "learning_rate": 2.374265734265734e-06, - "loss": 0.4324, - "step": 23760 - }, - { - "epoch": 20.6, - "learning_rate": 2.3735664335664335e-06, - "loss": 0.3782, - "step": 23770 - }, - { - "epoch": 20.61, - "learning_rate": 2.3728671328671326e-06, - "loss": 0.4475, - "step": 23780 - }, - { - "epoch": 20.61, - "learning_rate": 2.372167832167832e-06, - "loss": 0.3713, - "step": 23790 - }, - { - "epoch": 20.62, - "learning_rate": 2.3714685314685316e-06, - "loss": 0.3692, - "step": 23800 - }, - { - "epoch": 20.63, - "learning_rate": 2.3707692307692306e-06, - "loss": 0.364, - "step": 23810 - }, - { - "epoch": 20.64, - "learning_rate": 2.3700699300699297e-06, - "loss": 0.3905, - "step": 23820 - }, - { - "epoch": 20.65, - "learning_rate": 2.3693706293706292e-06, - "loss": 0.362, - "step": 23830 - }, - { - "epoch": 20.66, - "learning_rate": 2.3686713286713287e-06, - "loss": 0.4497, - "step": 23840 - }, - { - "epoch": 20.67, - "learning_rate": 2.3679720279720278e-06, - "loss": 0.3851, - "step": 23850 - }, - { - "epoch": 20.68, - "learning_rate": 2.3672727272727273e-06, - "loss": 0.3468, - "step": 23860 - }, - { - "epoch": 20.68, - "learning_rate": 2.3665734265734264e-06, - "loss": 0.3688, - "step": 23870 - }, - { - "epoch": 20.69, - "learning_rate": 2.365874125874126e-06, - "loss": 0.4112, - "step": 23880 - }, - { - "epoch": 20.7, - "learning_rate": 2.365174825174825e-06, - "loss": 0.3871, - "step": 23890 - }, - { - "epoch": 20.71, - "learning_rate": 2.3644755244755244e-06, - "loss": 0.4059, - "step": 23900 - }, - { - "epoch": 20.72, - "learning_rate": 2.363776223776224e-06, - "loss": 0.3437, - "step": 23910 - }, - { - "epoch": 20.73, - "learning_rate": 2.363076923076923e-06, - "loss": 0.387, - "step": 23920 - }, - { - "epoch": 20.74, - "learning_rate": 2.362377622377622e-06, - "loss": 0.4489, - "step": 23930 - }, - { - "epoch": 20.74, - "learning_rate": 2.3616783216783216e-06, - "loss": 0.4385, - "step": 23940 - }, - { - "epoch": 20.75, - "learning_rate": 2.360979020979021e-06, - "loss": 0.352, - "step": 23950 - }, - { - "epoch": 20.76, - "learning_rate": 2.36027972027972e-06, - "loss": 0.3235, - "step": 23960 - }, - { - "epoch": 20.77, - "learning_rate": 2.3595804195804196e-06, - "loss": 0.3833, - "step": 23970 - }, - { - "epoch": 20.78, - "learning_rate": 2.3588811188811187e-06, - "loss": 0.4387, - "step": 23980 - }, - { - "epoch": 20.79, - "learning_rate": 2.358181818181818e-06, - "loss": 0.3896, - "step": 23990 - }, - { - "epoch": 20.8, - "learning_rate": 2.3574825174825173e-06, - "loss": 0.4094, - "step": 24000 - }, - { - "epoch": 20.81, - "learning_rate": 2.3567832167832168e-06, - "loss": 0.4098, - "step": 24010 - }, - { - "epoch": 20.81, - "learning_rate": 2.3560839160839163e-06, - "loss": 0.4306, - "step": 24020 - }, - { - "epoch": 20.82, - "learning_rate": 2.355384615384615e-06, - "loss": 0.4632, - "step": 24030 - }, - { - "epoch": 20.83, - "learning_rate": 2.3546853146853144e-06, - "loss": 0.3862, - "step": 24040 - }, - { - "epoch": 20.84, - "learning_rate": 2.353986013986014e-06, - "loss": 0.3786, - "step": 24050 - }, - { - "epoch": 20.85, - "learning_rate": 2.3532867132867134e-06, - "loss": 0.3917, - "step": 24060 - }, - { - "epoch": 20.86, - "learning_rate": 2.3525874125874125e-06, - "loss": 0.409, - "step": 24070 - }, - { - "epoch": 20.87, - "learning_rate": 2.3518881118881116e-06, - "loss": 0.4337, - "step": 24080 - }, - { - "epoch": 20.87, - "learning_rate": 2.351188811188811e-06, - "loss": 0.3868, - "step": 24090 - }, - { - "epoch": 20.88, - "learning_rate": 2.35048951048951e-06, - "loss": 0.344, - "step": 24100 - }, - { - "epoch": 20.89, - "learning_rate": 2.3497902097902096e-06, - "loss": 0.3437, - "step": 24110 - }, - { - "epoch": 20.9, - "learning_rate": 2.349090909090909e-06, - "loss": 0.3807, - "step": 24120 - }, - { - "epoch": 20.91, - "learning_rate": 2.3483916083916086e-06, - "loss": 0.4006, - "step": 24130 - }, - { - "epoch": 20.92, - "learning_rate": 2.3476923076923073e-06, - "loss": 0.388, - "step": 24140 - }, - { - "epoch": 20.93, - "learning_rate": 2.3469930069930068e-06, - "loss": 0.3547, - "step": 24150 - }, - { - "epoch": 20.94, - "learning_rate": 2.3462937062937063e-06, - "loss": 0.3793, - "step": 24160 - }, - { - "epoch": 20.94, - "learning_rate": 2.3455944055944058e-06, - "loss": 0.3923, - "step": 24170 - }, - { - "epoch": 20.95, - "learning_rate": 2.344895104895105e-06, - "loss": 0.3735, - "step": 24180 - }, - { - "epoch": 20.96, - "learning_rate": 2.344195804195804e-06, - "loss": 0.3574, - "step": 24190 - }, - { - "epoch": 20.97, - "learning_rate": 2.3434965034965034e-06, - "loss": 0.3754, - "step": 24200 - }, - { - "epoch": 20.98, - "learning_rate": 2.3427972027972025e-06, - "loss": 0.3825, - "step": 24210 - }, - { - "epoch": 20.99, - "learning_rate": 2.342097902097902e-06, - "loss": 0.3868, - "step": 24220 - }, - { - "epoch": 21.0, - "learning_rate": 2.3413986013986015e-06, - "loss": 0.4249, - "step": 24230 - }, - { - "epoch": 21.0, - "eval_loss": 0.5684043169021606, - "eval_runtime": 135.7482, - "eval_samples_per_second": 3.919, - "eval_steps_per_second": 1.96, - "eval_wer": 0.2560262261361445, - "step": 24234 - }, - { - "epoch": 21.01, - "learning_rate": 2.340699300699301e-06, - "loss": 0.4147, - "step": 24240 - }, - { - "epoch": 21.01, - "learning_rate": 2.3399999999999996e-06, - "loss": 0.3816, - "step": 24250 - }, - { - "epoch": 21.02, - "learning_rate": 2.339300699300699e-06, - "loss": 0.3229, - "step": 24260 - }, - { - "epoch": 21.03, - "learning_rate": 2.3386013986013986e-06, - "loss": 0.4494, - "step": 24270 - }, - { - "epoch": 21.04, - "learning_rate": 2.3379020979020977e-06, - "loss": 0.3372, - "step": 24280 - }, - { - "epoch": 21.05, - "learning_rate": 2.337202797202797e-06, - "loss": 0.4027, - "step": 24290 - }, - { - "epoch": 21.06, - "learning_rate": 2.3365034965034963e-06, - "loss": 0.378, - "step": 24300 - }, - { - "epoch": 21.07, - "learning_rate": 2.3358041958041958e-06, - "loss": 0.3572, - "step": 24310 - }, - { - "epoch": 21.07, - "learning_rate": 2.335104895104895e-06, - "loss": 0.4459, - "step": 24320 - }, - { - "epoch": 21.08, - "learning_rate": 2.3344055944055943e-06, - "loss": 0.415, - "step": 24330 - }, - { - "epoch": 21.09, - "learning_rate": 2.333706293706294e-06, - "loss": 0.3677, - "step": 24340 - }, - { - "epoch": 21.1, - "learning_rate": 2.3330069930069933e-06, - "loss": 0.3709, - "step": 24350 - }, - { - "epoch": 21.11, - "learning_rate": 2.332307692307692e-06, - "loss": 0.3639, - "step": 24360 - }, - { - "epoch": 21.12, - "learning_rate": 2.3316083916083915e-06, - "loss": 0.3739, - "step": 24370 - }, - { - "epoch": 21.13, - "learning_rate": 2.330909090909091e-06, - "loss": 0.4741, - "step": 24380 - }, - { - "epoch": 21.14, - "learning_rate": 2.33020979020979e-06, - "loss": 0.3959, - "step": 24390 - }, - { - "epoch": 21.14, - "learning_rate": 2.3295104895104895e-06, - "loss": 0.4105, - "step": 24400 - }, - { - "epoch": 21.15, - "learning_rate": 2.3288111888111886e-06, - "loss": 0.3114, - "step": 24410 - }, - { - "epoch": 21.16, - "learning_rate": 2.328111888111888e-06, - "loss": 0.3996, - "step": 24420 - }, - { - "epoch": 21.17, - "learning_rate": 2.327412587412587e-06, - "loss": 0.3822, - "step": 24430 - }, - { - "epoch": 21.18, - "learning_rate": 2.3267132867132867e-06, - "loss": 0.3457, - "step": 24440 - }, - { - "epoch": 21.19, - "learning_rate": 2.326013986013986e-06, - "loss": 0.3282, - "step": 24450 - }, - { - "epoch": 21.2, - "learning_rate": 2.325314685314685e-06, - "loss": 0.3591, - "step": 24460 - }, - { - "epoch": 21.2, - "learning_rate": 2.3246153846153843e-06, - "loss": 0.3947, - "step": 24470 - }, - { - "epoch": 21.21, - "learning_rate": 2.323916083916084e-06, - "loss": 0.3338, - "step": 24480 - }, - { - "epoch": 21.22, - "learning_rate": 2.3232167832167833e-06, - "loss": 0.3912, - "step": 24490 - }, - { - "epoch": 21.23, - "learning_rate": 2.3225174825174824e-06, - "loss": 0.3995, - "step": 24500 - }, - { - "epoch": 21.24, - "learning_rate": 2.321818181818182e-06, - "loss": 0.3751, - "step": 24510 - }, - { - "epoch": 21.25, - "learning_rate": 2.321118881118881e-06, - "loss": 0.3852, - "step": 24520 - }, - { - "epoch": 21.26, - "learning_rate": 2.3204195804195805e-06, - "loss": 0.4216, - "step": 24530 - }, - { - "epoch": 21.27, - "learning_rate": 2.3197202797202795e-06, - "loss": 0.3995, - "step": 24540 - }, - { - "epoch": 21.27, - "learning_rate": 2.319020979020979e-06, - "loss": 0.3965, - "step": 24550 - }, - { - "epoch": 21.28, - "learning_rate": 2.3183216783216785e-06, - "loss": 0.3995, - "step": 24560 - }, - { - "epoch": 21.29, - "learning_rate": 2.317622377622377e-06, - "loss": 0.3852, - "step": 24570 - }, - { - "epoch": 21.3, - "learning_rate": 2.3169230769230767e-06, - "loss": 0.3916, - "step": 24580 - }, - { - "epoch": 21.31, - "learning_rate": 2.316223776223776e-06, - "loss": 0.4175, - "step": 24590 - }, - { - "epoch": 21.32, - "learning_rate": 2.3155244755244757e-06, - "loss": 0.3673, - "step": 24600 - }, - { - "epoch": 21.33, - "learning_rate": 2.3148251748251747e-06, - "loss": 0.4021, - "step": 24610 - }, - { - "epoch": 21.33, - "learning_rate": 2.314125874125874e-06, - "loss": 0.3781, - "step": 24620 - }, - { - "epoch": 21.34, - "learning_rate": 2.3134265734265733e-06, - "loss": 0.3848, - "step": 24630 - }, - { - "epoch": 21.35, - "learning_rate": 2.3127272727272724e-06, - "loss": 0.3694, - "step": 24640 - }, - { - "epoch": 21.36, - "learning_rate": 2.312027972027972e-06, - "loss": 0.396, - "step": 24650 - }, - { - "epoch": 21.37, - "learning_rate": 2.3113286713286714e-06, - "loss": 0.3893, - "step": 24660 - }, - { - "epoch": 21.38, - "learning_rate": 2.310629370629371e-06, - "loss": 0.4334, - "step": 24670 - }, - { - "epoch": 21.39, - "learning_rate": 2.3099300699300695e-06, - "loss": 0.385, - "step": 24680 - }, - { - "epoch": 21.39, - "learning_rate": 2.309230769230769e-06, - "loss": 0.4337, - "step": 24690 - }, - { - "epoch": 21.4, - "learning_rate": 2.3085314685314685e-06, - "loss": 0.3979, - "step": 24700 - }, - { - "epoch": 21.41, - "learning_rate": 2.307832167832168e-06, - "loss": 0.4227, - "step": 24710 - }, - { - "epoch": 21.42, - "learning_rate": 2.307132867132867e-06, - "loss": 0.3878, - "step": 24720 - }, - { - "epoch": 21.43, - "learning_rate": 2.306433566433566e-06, - "loss": 0.4102, - "step": 24730 - }, - { - "epoch": 21.44, - "learning_rate": 2.3057342657342657e-06, - "loss": 0.3923, - "step": 24740 - }, - { - "epoch": 21.45, - "learning_rate": 2.3050349650349647e-06, - "loss": 0.3457, - "step": 24750 - }, - { - "epoch": 21.46, - "learning_rate": 2.3043356643356642e-06, - "loss": 0.4122, - "step": 24760 - }, - { - "epoch": 21.46, - "learning_rate": 2.3036363636363637e-06, - "loss": 0.3605, - "step": 24770 - }, - { - "epoch": 21.47, - "learning_rate": 2.3029370629370632e-06, - "loss": 0.3637, - "step": 24780 - }, - { - "epoch": 21.48, - "learning_rate": 2.302237762237762e-06, - "loss": 0.4152, - "step": 24790 - }, - { - "epoch": 21.49, - "learning_rate": 2.3015384615384614e-06, - "loss": 0.3703, - "step": 24800 - }, - { - "epoch": 21.5, - "learning_rate": 2.300839160839161e-06, - "loss": 0.3721, - "step": 24810 - }, - { - "epoch": 21.51, - "learning_rate": 2.30013986013986e-06, - "loss": 0.3466, - "step": 24820 - }, - { - "epoch": 21.52, - "learning_rate": 2.2994405594405594e-06, - "loss": 0.3717, - "step": 24830 - }, - { - "epoch": 21.52, - "learning_rate": 2.2987412587412585e-06, - "loss": 0.3719, - "step": 24840 - }, - { - "epoch": 21.53, - "learning_rate": 2.298041958041958e-06, - "loss": 0.3881, - "step": 24850 - }, - { - "epoch": 21.54, - "learning_rate": 2.297342657342657e-06, - "loss": 0.347, - "step": 24860 - }, - { - "epoch": 21.55, - "learning_rate": 2.2966433566433566e-06, - "loss": 0.3567, - "step": 24870 - }, - { - "epoch": 21.56, - "learning_rate": 2.295944055944056e-06, - "loss": 0.4173, - "step": 24880 - }, - { - "epoch": 21.57, - "learning_rate": 2.2952447552447556e-06, - "loss": 0.3959, - "step": 24890 - }, - { - "epoch": 21.58, - "learning_rate": 2.2945454545454542e-06, - "loss": 0.3761, - "step": 24900 - }, - { - "epoch": 21.59, - "learning_rate": 2.2938461538461537e-06, - "loss": 0.3773, - "step": 24910 - }, - { - "epoch": 21.59, - "learning_rate": 2.293146853146853e-06, - "loss": 0.3891, - "step": 24920 - }, - { - "epoch": 21.6, - "learning_rate": 2.2924475524475523e-06, - "loss": 0.3779, - "step": 24930 - }, - { - "epoch": 21.61, - "learning_rate": 2.2917482517482518e-06, - "loss": 0.4076, - "step": 24940 - }, - { - "epoch": 21.62, - "learning_rate": 2.291048951048951e-06, - "loss": 0.4118, - "step": 24950 - }, - { - "epoch": 21.63, - "learning_rate": 2.2903496503496503e-06, - "loss": 0.3887, - "step": 24960 - }, - { - "epoch": 21.64, - "learning_rate": 2.2896503496503494e-06, - "loss": 0.3366, - "step": 24970 - }, - { - "epoch": 21.65, - "learning_rate": 2.288951048951049e-06, - "loss": 0.3912, - "step": 24980 - }, - { - "epoch": 21.65, - "learning_rate": 2.2882517482517484e-06, - "loss": 0.3827, - "step": 24990 - }, - { - "epoch": 21.66, - "learning_rate": 2.287552447552447e-06, - "loss": 0.3377, - "step": 25000 - }, - { - "epoch": 21.67, - "learning_rate": 2.2868531468531466e-06, - "loss": 0.3491, - "step": 25010 - }, - { - "epoch": 21.68, - "learning_rate": 2.286153846153846e-06, - "loss": 0.3245, - "step": 25020 - }, - { - "epoch": 21.69, - "learning_rate": 2.2854545454545456e-06, - "loss": 0.4169, - "step": 25030 - }, - { - "epoch": 21.7, - "learning_rate": 2.2847552447552446e-06, - "loss": 0.4224, - "step": 25040 - }, - { - "epoch": 21.71, - "learning_rate": 2.284055944055944e-06, - "loss": 0.3476, - "step": 25050 - }, - { - "epoch": 21.72, - "learning_rate": 2.283356643356643e-06, - "loss": 0.4036, - "step": 25060 - }, - { - "epoch": 21.72, - "learning_rate": 2.2826573426573423e-06, - "loss": 0.3634, - "step": 25070 - }, - { - "epoch": 21.73, - "learning_rate": 2.2819580419580418e-06, - "loss": 0.3939, - "step": 25080 - }, - { - "epoch": 21.74, - "learning_rate": 2.2812587412587413e-06, - "loss": 0.3464, - "step": 25090 - }, - { - "epoch": 21.75, - "learning_rate": 2.2805594405594408e-06, - "loss": 0.3893, - "step": 25100 - }, - { - "epoch": 21.76, - "learning_rate": 2.2798601398601394e-06, - "loss": 0.3855, - "step": 25110 - }, - { - "epoch": 21.77, - "learning_rate": 2.279160839160839e-06, - "loss": 0.4167, - "step": 25120 - }, - { - "epoch": 21.78, - "learning_rate": 2.2784615384615384e-06, - "loss": 0.3836, - "step": 25130 - }, - { - "epoch": 21.78, - "learning_rate": 2.277762237762238e-06, - "loss": 0.3105, - "step": 25140 - }, - { - "epoch": 21.79, - "learning_rate": 2.277062937062937e-06, - "loss": 0.3964, - "step": 25150 - }, - { - "epoch": 21.8, - "learning_rate": 2.276363636363636e-06, - "loss": 0.3568, - "step": 25160 - }, - { - "epoch": 21.81, - "learning_rate": 2.2756643356643355e-06, - "loss": 0.3838, - "step": 25170 - }, - { - "epoch": 21.82, - "learning_rate": 2.2749650349650346e-06, - "loss": 0.3986, - "step": 25180 - }, - { - "epoch": 21.83, - "learning_rate": 2.274265734265734e-06, - "loss": 0.382, - "step": 25190 - }, - { - "epoch": 21.84, - "learning_rate": 2.2735664335664336e-06, - "loss": 0.448, - "step": 25200 - }, - { - "epoch": 21.85, - "learning_rate": 2.272867132867133e-06, - "loss": 0.3933, - "step": 25210 - }, - { - "epoch": 21.85, - "learning_rate": 2.2721678321678318e-06, - "loss": 0.4001, - "step": 25220 - }, - { - "epoch": 21.86, - "learning_rate": 2.2714685314685313e-06, - "loss": 0.3441, - "step": 25230 - }, - { - "epoch": 21.87, - "learning_rate": 2.2707692307692308e-06, - "loss": 0.3799, - "step": 25240 - }, - { - "epoch": 21.88, - "learning_rate": 2.27006993006993e-06, - "loss": 0.3925, - "step": 25250 - }, - { - "epoch": 21.89, - "learning_rate": 2.2693706293706293e-06, - "loss": 0.3734, - "step": 25260 - }, - { - "epoch": 21.9, - "learning_rate": 2.2687412587412584e-06, - "loss": 0.4445, - "step": 25270 - }, - { - "epoch": 21.91, - "learning_rate": 2.268041958041958e-06, - "loss": 0.3718, - "step": 25280 - }, - { - "epoch": 21.91, - "learning_rate": 2.2673426573426574e-06, - "loss": 0.4257, - "step": 25290 - }, - { - "epoch": 21.92, - "learning_rate": 2.266643356643357e-06, - "loss": 0.3629, - "step": 25300 - }, - { - "epoch": 21.93, - "learning_rate": 2.2659440559440555e-06, - "loss": 0.345, - "step": 25310 - }, - { - "epoch": 21.94, - "learning_rate": 2.265244755244755e-06, - "loss": 0.424, - "step": 25320 - }, - { - "epoch": 21.95, - "learning_rate": 2.2645454545454545e-06, - "loss": 0.4096, - "step": 25330 - }, - { - "epoch": 21.96, - "learning_rate": 2.263846153846154e-06, - "loss": 0.3915, - "step": 25340 - }, - { - "epoch": 21.97, - "learning_rate": 2.263146853146853e-06, - "loss": 0.4156, - "step": 25350 - }, - { - "epoch": 21.98, - "learning_rate": 2.2624475524475526e-06, - "loss": 0.4044, - "step": 25360 - }, - { - "epoch": 21.98, - "learning_rate": 2.2617482517482516e-06, - "loss": 0.3756, - "step": 25370 - }, - { - "epoch": 21.99, - "learning_rate": 2.2610489510489507e-06, - "loss": 0.4993, - "step": 25380 - }, - { - "epoch": 22.0, - "eval_loss": 0.55206298828125, - "eval_runtime": 133.6827, - "eval_samples_per_second": 3.98, - "eval_steps_per_second": 1.99, - "eval_wer": 0.2529407983544385, - "step": 25388 - }, - { - "epoch": 22.0, - "learning_rate": 2.2603496503496502e-06, - "loss": 0.4081, - "step": 25390 - }, - { - "epoch": 22.01, - "learning_rate": 2.2596503496503497e-06, - "loss": 0.3995, - "step": 25400 - }, - { - "epoch": 22.02, - "learning_rate": 2.258951048951049e-06, - "loss": 0.3564, - "step": 25410 - }, - { - "epoch": 22.03, - "learning_rate": 2.258251748251748e-06, - "loss": 0.39, - "step": 25420 - }, - { - "epoch": 22.04, - "learning_rate": 2.2575524475524474e-06, - "loss": 0.3942, - "step": 25430 - }, - { - "epoch": 22.05, - "learning_rate": 2.256853146853147e-06, - "loss": 0.3723, - "step": 25440 - }, - { - "epoch": 22.05, - "learning_rate": 2.256153846153846e-06, - "loss": 0.4172, - "step": 25450 - }, - { - "epoch": 22.06, - "learning_rate": 2.2554545454545454e-06, - "loss": 0.4109, - "step": 25460 - }, - { - "epoch": 22.07, - "learning_rate": 2.2547552447552445e-06, - "loss": 0.3592, - "step": 25470 - }, - { - "epoch": 22.08, - "learning_rate": 2.254055944055944e-06, - "loss": 0.3938, - "step": 25480 - }, - { - "epoch": 22.09, - "learning_rate": 2.253356643356643e-06, - "loss": 0.4014, - "step": 25490 - }, - { - "epoch": 22.1, - "learning_rate": 2.2526573426573426e-06, - "loss": 0.358, - "step": 25500 - }, - { - "epoch": 22.11, - "learning_rate": 2.251958041958042e-06, - "loss": 0.3604, - "step": 25510 - }, - { - "epoch": 22.11, - "learning_rate": 2.2512587412587416e-06, - "loss": 0.3497, - "step": 25520 - }, - { - "epoch": 22.12, - "learning_rate": 2.25055944055944e-06, - "loss": 0.3939, - "step": 25530 - }, - { - "epoch": 22.13, - "learning_rate": 2.2499300699300697e-06, - "loss": 0.4107, - "step": 25540 - }, - { - "epoch": 22.14, - "learning_rate": 2.249230769230769e-06, - "loss": 0.3557, - "step": 25550 - }, - { - "epoch": 22.15, - "learning_rate": 2.2485314685314687e-06, - "loss": 0.3858, - "step": 25560 - }, - { - "epoch": 22.16, - "learning_rate": 2.2478321678321677e-06, - "loss": 0.3781, - "step": 25570 - }, - { - "epoch": 22.17, - "learning_rate": 2.247132867132867e-06, - "loss": 0.386, - "step": 25580 - }, - { - "epoch": 22.17, - "learning_rate": 2.2464335664335663e-06, - "loss": 0.3992, - "step": 25590 - }, - { - "epoch": 22.18, - "learning_rate": 2.245734265734266e-06, - "loss": 0.3983, - "step": 25600 - }, - { - "epoch": 22.19, - "learning_rate": 2.2450349650349653e-06, - "loss": 0.3997, - "step": 25610 - }, - { - "epoch": 22.2, - "learning_rate": 2.244335664335664e-06, - "loss": 0.4447, - "step": 25620 - }, - { - "epoch": 22.21, - "learning_rate": 2.2436363636363634e-06, - "loss": 0.3922, - "step": 25630 - }, - { - "epoch": 22.22, - "learning_rate": 2.242937062937063e-06, - "loss": 0.381, - "step": 25640 - }, - { - "epoch": 22.23, - "learning_rate": 2.242237762237762e-06, - "loss": 0.4374, - "step": 25650 - }, - { - "epoch": 22.24, - "learning_rate": 2.2415384615384615e-06, - "loss": 0.4023, - "step": 25660 - }, - { - "epoch": 22.24, - "learning_rate": 2.240839160839161e-06, - "loss": 0.3713, - "step": 25670 - }, - { - "epoch": 22.25, - "learning_rate": 2.24013986013986e-06, - "loss": 0.389, - "step": 25680 - }, - { - "epoch": 22.26, - "learning_rate": 2.239440559440559e-06, - "loss": 0.4042, - "step": 25690 - }, - { - "epoch": 22.27, - "learning_rate": 2.2387412587412587e-06, - "loss": 0.3508, - "step": 25700 - }, - { - "epoch": 22.28, - "learning_rate": 2.238041958041958e-06, - "loss": 0.4081, - "step": 25710 - }, - { - "epoch": 22.29, - "learning_rate": 2.2373426573426572e-06, - "loss": 0.3937, - "step": 25720 - }, - { - "epoch": 22.3, - "learning_rate": 2.2366433566433563e-06, - "loss": 0.4126, - "step": 25730 - }, - { - "epoch": 22.3, - "learning_rate": 2.235944055944056e-06, - "loss": 0.3849, - "step": 25740 - }, - { - "epoch": 22.31, - "learning_rate": 2.2352447552447553e-06, - "loss": 0.3666, - "step": 25750 - }, - { - "epoch": 22.32, - "learning_rate": 2.2345454545454544e-06, - "loss": 0.3968, - "step": 25760 - }, - { - "epoch": 22.33, - "learning_rate": 2.233846153846154e-06, - "loss": 0.3478, - "step": 25770 - }, - { - "epoch": 22.34, - "learning_rate": 2.233146853146853e-06, - "loss": 0.4305, - "step": 25780 - }, - { - "epoch": 22.35, - "learning_rate": 2.2324475524475524e-06, - "loss": 0.3786, - "step": 25790 - }, - { - "epoch": 22.36, - "learning_rate": 2.2317482517482515e-06, - "loss": 0.3271, - "step": 25800 - }, - { - "epoch": 22.37, - "learning_rate": 2.231048951048951e-06, - "loss": 0.3788, - "step": 25810 - }, - { - "epoch": 22.37, - "learning_rate": 2.2303496503496505e-06, - "loss": 0.3743, - "step": 25820 - }, - { - "epoch": 22.38, - "learning_rate": 2.2296503496503496e-06, - "loss": 0.4284, - "step": 25830 - }, - { - "epoch": 22.39, - "learning_rate": 2.2289510489510486e-06, - "loss": 0.4357, - "step": 25840 - }, - { - "epoch": 22.4, - "learning_rate": 2.228251748251748e-06, - "loss": 0.3475, - "step": 25850 - }, - { - "epoch": 22.41, - "learning_rate": 2.2275524475524476e-06, - "loss": 0.2906, - "step": 25860 - }, - { - "epoch": 22.42, - "learning_rate": 2.2268531468531467e-06, - "loss": 0.3724, - "step": 25870 - }, - { - "epoch": 22.43, - "learning_rate": 2.226153846153846e-06, - "loss": 0.3659, - "step": 25880 - }, - { - "epoch": 22.43, - "learning_rate": 2.2254545454545453e-06, - "loss": 0.374, - "step": 25890 - }, - { - "epoch": 22.44, - "learning_rate": 2.2247552447552444e-06, - "loss": 0.3879, - "step": 25900 - }, - { - "epoch": 22.45, - "learning_rate": 2.224055944055944e-06, - "loss": 0.3066, - "step": 25910 - }, - { - "epoch": 22.46, - "learning_rate": 2.2233566433566434e-06, - "loss": 0.3119, - "step": 25920 - }, - { - "epoch": 22.47, - "learning_rate": 2.222657342657343e-06, - "loss": 0.4196, - "step": 25930 - }, - { - "epoch": 22.48, - "learning_rate": 2.2219580419580415e-06, - "loss": 0.3935, - "step": 25940 - }, - { - "epoch": 22.49, - "learning_rate": 2.221258741258741e-06, - "loss": 0.363, - "step": 25950 - }, - { - "epoch": 22.5, - "learning_rate": 2.2205594405594405e-06, - "loss": 0.4021, - "step": 25960 - }, - { - "epoch": 22.5, - "learning_rate": 2.21986013986014e-06, - "loss": 0.3808, - "step": 25970 - }, - { - "epoch": 22.51, - "learning_rate": 2.219160839160839e-06, - "loss": 0.4058, - "step": 25980 - }, - { - "epoch": 22.52, - "learning_rate": 2.2184615384615386e-06, - "loss": 0.3699, - "step": 25990 - }, - { - "epoch": 22.53, - "learning_rate": 2.2177622377622376e-06, - "loss": 0.3609, - "step": 26000 - }, - { - "epoch": 22.54, - "learning_rate": 2.2170629370629367e-06, - "loss": 0.3769, - "step": 26010 - }, - { - "epoch": 22.55, - "learning_rate": 2.216363636363636e-06, - "loss": 0.3697, - "step": 26020 - }, - { - "epoch": 22.56, - "learning_rate": 2.2156643356643357e-06, - "loss": 0.4068, - "step": 26030 - }, - { - "epoch": 22.56, - "learning_rate": 2.214965034965035e-06, - "loss": 0.4025, - "step": 26040 - }, - { - "epoch": 22.57, - "learning_rate": 2.214265734265734e-06, - "loss": 0.4122, - "step": 26050 - }, - { - "epoch": 22.58, - "learning_rate": 2.2135664335664333e-06, - "loss": 0.3301, - "step": 26060 - }, - { - "epoch": 22.59, - "learning_rate": 2.212867132867133e-06, - "loss": 0.3911, - "step": 26070 - }, - { - "epoch": 22.6, - "learning_rate": 2.212167832167832e-06, - "loss": 0.3702, - "step": 26080 - }, - { - "epoch": 22.61, - "learning_rate": 2.2114685314685314e-06, - "loss": 0.4195, - "step": 26090 - }, - { - "epoch": 22.62, - "learning_rate": 2.210769230769231e-06, - "loss": 0.418, - "step": 26100 - }, - { - "epoch": 22.63, - "learning_rate": 2.21006993006993e-06, - "loss": 0.3531, - "step": 26110 - }, - { - "epoch": 22.63, - "learning_rate": 2.209370629370629e-06, - "loss": 0.4043, - "step": 26120 - }, - { - "epoch": 22.64, - "learning_rate": 2.2086713286713286e-06, - "loss": 0.3328, - "step": 26130 - }, - { - "epoch": 22.65, - "learning_rate": 2.207972027972028e-06, - "loss": 0.328, - "step": 26140 - }, - { - "epoch": 22.66, - "learning_rate": 2.207272727272727e-06, - "loss": 0.4128, - "step": 26150 - }, - { - "epoch": 22.67, - "learning_rate": 2.206573426573426e-06, - "loss": 0.3926, - "step": 26160 - }, - { - "epoch": 22.68, - "learning_rate": 2.2058741258741257e-06, - "loss": 0.3639, - "step": 26170 - }, - { - "epoch": 22.69, - "learning_rate": 2.205174825174825e-06, - "loss": 0.3715, - "step": 26180 - }, - { - "epoch": 22.69, - "learning_rate": 2.2044755244755243e-06, - "loss": 0.3521, - "step": 26190 - }, - { - "epoch": 22.7, - "learning_rate": 2.2037762237762238e-06, - "loss": 0.3788, - "step": 26200 - }, - { - "epoch": 22.71, - "learning_rate": 2.2030769230769233e-06, - "loss": 0.3915, - "step": 26210 - }, - { - "epoch": 22.72, - "learning_rate": 2.2023776223776223e-06, - "loss": 0.3423, - "step": 26220 - }, - { - "epoch": 22.73, - "learning_rate": 2.2016783216783214e-06, - "loss": 0.373, - "step": 26230 - }, - { - "epoch": 22.74, - "learning_rate": 2.200979020979021e-06, - "loss": 0.3901, - "step": 26240 - }, - { - "epoch": 22.75, - "learning_rate": 2.2002797202797204e-06, - "loss": 0.4118, - "step": 26250 - }, - { - "epoch": 22.76, - "learning_rate": 2.1995804195804195e-06, - "loss": 0.3516, - "step": 26260 - }, - { - "epoch": 22.76, - "learning_rate": 2.1988811188811185e-06, - "loss": 0.3985, - "step": 26270 - }, - { - "epoch": 22.77, - "learning_rate": 2.198181818181818e-06, - "loss": 0.3818, - "step": 26280 - }, - { - "epoch": 22.78, - "learning_rate": 2.1974825174825175e-06, - "loss": 0.4288, - "step": 26290 - }, - { - "epoch": 22.79, - "learning_rate": 2.1967832167832166e-06, - "loss": 0.3869, - "step": 26300 - }, - { - "epoch": 22.8, - "learning_rate": 2.196083916083916e-06, - "loss": 0.363, - "step": 26310 - }, - { - "epoch": 22.81, - "learning_rate": 2.195384615384615e-06, - "loss": 0.383, - "step": 26320 - }, - { - "epoch": 22.82, - "learning_rate": 2.1946853146853143e-06, - "loss": 0.3899, - "step": 26330 - }, - { - "epoch": 22.82, - "learning_rate": 2.1939860139860138e-06, - "loss": 0.3354, - "step": 26340 - }, - { - "epoch": 22.83, - "learning_rate": 2.1932867132867132e-06, - "loss": 0.3557, - "step": 26350 - }, - { - "epoch": 22.84, - "learning_rate": 2.1925874125874127e-06, - "loss": 0.4285, - "step": 26360 - }, - { - "epoch": 22.85, - "learning_rate": 2.191888111888112e-06, - "loss": 0.373, - "step": 26370 - }, - { - "epoch": 22.86, - "learning_rate": 2.191188811188811e-06, - "loss": 0.3531, - "step": 26380 - }, - { - "epoch": 22.87, - "learning_rate": 2.1904895104895104e-06, - "loss": 0.3789, - "step": 26390 - }, - { - "epoch": 22.88, - "learning_rate": 2.18979020979021e-06, - "loss": 0.3444, - "step": 26400 - }, - { - "epoch": 22.89, - "learning_rate": 2.189090909090909e-06, - "loss": 0.3703, - "step": 26410 - }, - { - "epoch": 22.89, - "learning_rate": 2.1883916083916085e-06, - "loss": 0.3799, - "step": 26420 - }, - { - "epoch": 22.9, - "learning_rate": 2.1876923076923075e-06, - "loss": 0.3731, - "step": 26430 - }, - { - "epoch": 22.91, - "learning_rate": 2.1869930069930066e-06, - "loss": 0.428, - "step": 26440 - }, - { - "epoch": 22.92, - "learning_rate": 2.186293706293706e-06, - "loss": 0.3845, - "step": 26450 - }, - { - "epoch": 22.93, - "learning_rate": 2.1855944055944056e-06, - "loss": 0.3844, - "step": 26460 - }, - { - "epoch": 22.94, - "learning_rate": 2.184895104895105e-06, - "loss": 0.3658, - "step": 26470 - }, - { - "epoch": 22.95, - "learning_rate": 2.184195804195804e-06, - "loss": 0.3885, - "step": 26480 - }, - { - "epoch": 22.95, - "learning_rate": 2.1834965034965032e-06, - "loss": 0.3828, - "step": 26490 - }, - { - "epoch": 22.96, - "learning_rate": 2.1827972027972027e-06, - "loss": 0.4448, - "step": 26500 - }, - { - "epoch": 22.97, - "learning_rate": 2.182097902097902e-06, - "loss": 0.351, - "step": 26510 - }, - { - "epoch": 22.98, - "learning_rate": 2.1813986013986013e-06, - "loss": 0.3683, - "step": 26520 - }, - { - "epoch": 22.99, - "learning_rate": 2.180699300699301e-06, - "loss": 0.3684, - "step": 26530 - }, - { - "epoch": 23.0, - "learning_rate": 2.18e-06, - "loss": 0.4006, - "step": 26540 - }, - { - "epoch": 23.0, - "eval_loss": 0.5390881299972534, - "eval_runtime": 135.1116, - "eval_samples_per_second": 3.937, - "eval_steps_per_second": 1.969, - "eval_wer": 0.2539692742816738, - "step": 26542 - }, - { - "epoch": 23.01, - "learning_rate": 2.179300699300699e-06, - "loss": 0.4004, - "step": 26550 - }, - { - "epoch": 23.02, - "learning_rate": 2.1786013986013985e-06, - "loss": 0.3702, - "step": 26560 - }, - { - "epoch": 23.02, - "learning_rate": 2.177902097902098e-06, - "loss": 0.3652, - "step": 26570 - }, - { - "epoch": 23.03, - "learning_rate": 2.1772027972027974e-06, - "loss": 0.3967, - "step": 26580 - }, - { - "epoch": 23.04, - "learning_rate": 2.176503496503496e-06, - "loss": 0.4196, - "step": 26590 - }, - { - "epoch": 23.05, - "learning_rate": 2.1758041958041956e-06, - "loss": 0.3222, - "step": 26600 - }, - { - "epoch": 23.06, - "learning_rate": 2.175104895104895e-06, - "loss": 0.4268, - "step": 26610 - }, - { - "epoch": 23.07, - "learning_rate": 2.174405594405594e-06, - "loss": 0.3838, - "step": 26620 - }, - { - "epoch": 23.08, - "learning_rate": 2.1737062937062937e-06, - "loss": 0.3729, - "step": 26630 - }, - { - "epoch": 23.08, - "learning_rate": 2.173006993006993e-06, - "loss": 0.3547, - "step": 26640 - }, - { - "epoch": 23.09, - "learning_rate": 2.1723076923076922e-06, - "loss": 0.3471, - "step": 26650 - }, - { - "epoch": 23.1, - "learning_rate": 2.1716083916083913e-06, - "loss": 0.3904, - "step": 26660 - }, - { - "epoch": 23.11, - "learning_rate": 2.170909090909091e-06, - "loss": 0.3874, - "step": 26670 - }, - { - "epoch": 23.12, - "learning_rate": 2.1702097902097903e-06, - "loss": 0.4084, - "step": 26680 - }, - { - "epoch": 23.13, - "learning_rate": 2.1695104895104894e-06, - "loss": 0.4002, - "step": 26690 - }, - { - "epoch": 23.14, - "learning_rate": 2.1688111888111884e-06, - "loss": 0.376, - "step": 26700 - }, - { - "epoch": 23.15, - "learning_rate": 2.168111888111888e-06, - "loss": 0.3864, - "step": 26710 - }, - { - "epoch": 23.15, - "learning_rate": 2.1674125874125874e-06, - "loss": 0.319, - "step": 26720 - }, - { - "epoch": 23.16, - "learning_rate": 2.1667132867132865e-06, - "loss": 0.4121, - "step": 26730 - }, - { - "epoch": 23.17, - "learning_rate": 2.166013986013986e-06, - "loss": 0.4444, - "step": 26740 - }, - { - "epoch": 23.18, - "learning_rate": 2.1653146853146855e-06, - "loss": 0.3773, - "step": 26750 - }, - { - "epoch": 23.19, - "learning_rate": 2.1646153846153846e-06, - "loss": 0.392, - "step": 26760 - }, - { - "epoch": 23.2, - "learning_rate": 2.1639160839160837e-06, - "loss": 0.4112, - "step": 26770 - }, - { - "epoch": 23.21, - "learning_rate": 2.163216783216783e-06, - "loss": 0.355, - "step": 26780 - }, - { - "epoch": 23.21, - "learning_rate": 2.1625174825174826e-06, - "loss": 0.4104, - "step": 26790 - }, - { - "epoch": 23.22, - "learning_rate": 2.1618181818181817e-06, - "loss": 0.387, - "step": 26800 - }, - { - "epoch": 23.23, - "learning_rate": 2.161118881118881e-06, - "loss": 0.3586, - "step": 26810 - }, - { - "epoch": 23.24, - "learning_rate": 2.1604195804195803e-06, - "loss": 0.3314, - "step": 26820 - }, - { - "epoch": 23.25, - "learning_rate": 2.1597202797202798e-06, - "loss": 0.3541, - "step": 26830 - }, - { - "epoch": 23.26, - "learning_rate": 2.159020979020979e-06, - "loss": 0.3251, - "step": 26840 - }, - { - "epoch": 23.27, - "learning_rate": 2.1583216783216784e-06, - "loss": 0.3827, - "step": 26850 - }, - { - "epoch": 23.28, - "learning_rate": 2.157622377622378e-06, - "loss": 0.3847, - "step": 26860 - }, - { - "epoch": 23.28, - "learning_rate": 2.1569230769230765e-06, - "loss": 0.3511, - "step": 26870 - }, - { - "epoch": 23.29, - "learning_rate": 2.156223776223776e-06, - "loss": 0.3836, - "step": 26880 - }, - { - "epoch": 23.3, - "learning_rate": 2.1555244755244755e-06, - "loss": 0.4105, - "step": 26890 - }, - { - "epoch": 23.31, - "learning_rate": 2.154825174825175e-06, - "loss": 0.389, - "step": 26900 - }, - { - "epoch": 23.32, - "learning_rate": 2.154125874125874e-06, - "loss": 0.4224, - "step": 26910 - }, - { - "epoch": 23.33, - "learning_rate": 2.153426573426573e-06, - "loss": 0.3815, - "step": 26920 - }, - { - "epoch": 23.34, - "learning_rate": 2.1527272727272726e-06, - "loss": 0.4167, - "step": 26930 - }, - { - "epoch": 23.34, - "learning_rate": 2.152027972027972e-06, - "loss": 0.3705, - "step": 26940 - }, - { - "epoch": 23.35, - "learning_rate": 2.151328671328671e-06, - "loss": 0.3442, - "step": 26950 - }, - { - "epoch": 23.36, - "learning_rate": 2.1506293706293707e-06, - "loss": 0.3981, - "step": 26960 - }, - { - "epoch": 23.37, - "learning_rate": 2.1499300699300698e-06, - "loss": 0.3808, - "step": 26970 - }, - { - "epoch": 23.38, - "learning_rate": 2.149230769230769e-06, - "loss": 0.3783, - "step": 26980 - }, - { - "epoch": 23.39, - "learning_rate": 2.1485314685314683e-06, - "loss": 0.4623, - "step": 26990 - }, - { - "epoch": 23.4, - "learning_rate": 2.147832167832168e-06, - "loss": 0.4182, - "step": 27000 - }, - { - "epoch": 23.41, - "learning_rate": 2.1471328671328673e-06, - "loss": 0.3527, - "step": 27010 - }, - { - "epoch": 23.41, - "learning_rate": 2.1464335664335664e-06, - "loss": 0.439, - "step": 27020 - }, - { - "epoch": 23.42, - "learning_rate": 2.1457342657342655e-06, - "loss": 0.3807, - "step": 27030 - }, - { - "epoch": 23.43, - "learning_rate": 2.145034965034965e-06, - "loss": 0.4682, - "step": 27040 - }, - { - "epoch": 23.44, - "learning_rate": 2.144335664335664e-06, - "loss": 0.3696, - "step": 27050 - }, - { - "epoch": 23.45, - "learning_rate": 2.1436363636363636e-06, - "loss": 0.4157, - "step": 27060 - }, - { - "epoch": 23.46, - "learning_rate": 2.142937062937063e-06, - "loss": 0.36, - "step": 27070 - }, - { - "epoch": 23.47, - "learning_rate": 2.142237762237762e-06, - "loss": 0.4192, - "step": 27080 - }, - { - "epoch": 23.47, - "learning_rate": 2.141538461538461e-06, - "loss": 0.3983, - "step": 27090 - }, - { - "epoch": 23.48, - "learning_rate": 2.1408391608391607e-06, - "loss": 0.376, - "step": 27100 - }, - { - "epoch": 23.49, - "learning_rate": 2.14013986013986e-06, - "loss": 0.3796, - "step": 27110 - }, - { - "epoch": 23.5, - "learning_rate": 2.1394405594405593e-06, - "loss": 0.3944, - "step": 27120 - }, - { - "epoch": 23.51, - "learning_rate": 2.1387412587412583e-06, - "loss": 0.3578, - "step": 27130 - }, - { - "epoch": 23.52, - "learning_rate": 2.138041958041958e-06, - "loss": 0.4543, - "step": 27140 - }, - { - "epoch": 23.53, - "learning_rate": 2.1373426573426573e-06, - "loss": 0.3819, - "step": 27150 - }, - { - "epoch": 23.54, - "learning_rate": 2.1366433566433564e-06, - "loss": 0.4166, - "step": 27160 - }, - { - "epoch": 23.54, - "learning_rate": 2.135944055944056e-06, - "loss": 0.3704, - "step": 27170 - }, - { - "epoch": 23.55, - "learning_rate": 2.1352447552447554e-06, - "loss": 0.4091, - "step": 27180 - }, - { - "epoch": 23.56, - "learning_rate": 2.1345454545454545e-06, - "loss": 0.4358, - "step": 27190 - }, - { - "epoch": 23.57, - "learning_rate": 2.1338461538461535e-06, - "loss": 0.376, - "step": 27200 - }, - { - "epoch": 23.58, - "learning_rate": 2.133146853146853e-06, - "loss": 0.3762, - "step": 27210 - }, - { - "epoch": 23.59, - "learning_rate": 2.1324475524475525e-06, - "loss": 0.3738, - "step": 27220 - }, - { - "epoch": 23.6, - "learning_rate": 2.1317482517482516e-06, - "loss": 0.4496, - "step": 27230 - }, - { - "epoch": 23.6, - "learning_rate": 2.1310489510489507e-06, - "loss": 0.3792, - "step": 27240 - }, - { - "epoch": 23.61, - "learning_rate": 2.13034965034965e-06, - "loss": 0.3751, - "step": 27250 - }, - { - "epoch": 23.62, - "learning_rate": 2.1296503496503497e-06, - "loss": 0.3919, - "step": 27260 - }, - { - "epoch": 23.63, - "learning_rate": 2.1289510489510488e-06, - "loss": 0.3704, - "step": 27270 - }, - { - "epoch": 23.64, - "learning_rate": 2.1282517482517483e-06, - "loss": 0.4081, - "step": 27280 - }, - { - "epoch": 23.65, - "learning_rate": 2.1275524475524478e-06, - "loss": 0.4452, - "step": 27290 - }, - { - "epoch": 23.66, - "learning_rate": 2.1268531468531464e-06, - "loss": 0.431, - "step": 27300 - }, - { - "epoch": 23.67, - "learning_rate": 2.126153846153846e-06, - "loss": 0.3536, - "step": 27310 - }, - { - "epoch": 23.67, - "learning_rate": 2.1254545454545454e-06, - "loss": 0.4114, - "step": 27320 - }, - { - "epoch": 23.68, - "learning_rate": 2.124755244755245e-06, - "loss": 0.3842, - "step": 27330 - }, - { - "epoch": 23.69, - "learning_rate": 2.124055944055944e-06, - "loss": 0.353, - "step": 27340 - }, - { - "epoch": 23.7, - "learning_rate": 2.123356643356643e-06, - "loss": 0.4224, - "step": 27350 - }, - { - "epoch": 23.71, - "learning_rate": 2.1226573426573425e-06, - "loss": 0.3435, - "step": 27360 - }, - { - "epoch": 23.72, - "learning_rate": 2.121958041958042e-06, - "loss": 0.3487, - "step": 27370 - }, - { - "epoch": 23.73, - "learning_rate": 2.121258741258741e-06, - "loss": 0.3942, - "step": 27380 - }, - { - "epoch": 23.73, - "learning_rate": 2.1205594405594406e-06, - "loss": 0.3632, - "step": 27390 - }, - { - "epoch": 23.74, - "learning_rate": 2.11986013986014e-06, - "loss": 0.382, - "step": 27400 - }, - { - "epoch": 23.75, - "learning_rate": 2.1191608391608387e-06, - "loss": 0.3673, - "step": 27410 - }, - { - "epoch": 23.76, - "learning_rate": 2.1184615384615382e-06, - "loss": 0.3575, - "step": 27420 - }, - { - "epoch": 23.77, - "learning_rate": 2.1177622377622377e-06, - "loss": 0.419, - "step": 27430 - }, - { - "epoch": 23.78, - "learning_rate": 2.1170629370629372e-06, - "loss": 0.3871, - "step": 27440 - }, - { - "epoch": 23.79, - "learning_rate": 2.1163636363636363e-06, - "loss": 0.3454, - "step": 27450 - }, - { - "epoch": 23.8, - "learning_rate": 2.1156643356643354e-06, - "loss": 0.334, - "step": 27460 - }, - { - "epoch": 23.8, - "learning_rate": 2.114965034965035e-06, - "loss": 0.3547, - "step": 27470 - }, - { - "epoch": 23.81, - "learning_rate": 2.114265734265734e-06, - "loss": 0.3734, - "step": 27480 - }, - { - "epoch": 23.82, - "learning_rate": 2.1135664335664335e-06, - "loss": 0.4145, - "step": 27490 - }, - { - "epoch": 23.83, - "learning_rate": 2.112867132867133e-06, - "loss": 0.4302, - "step": 27500 - }, - { - "epoch": 23.84, - "learning_rate": 2.112167832167832e-06, - "loss": 0.3534, - "step": 27510 - }, - { - "epoch": 23.85, - "learning_rate": 2.111468531468531e-06, - "loss": 0.3707, - "step": 27520 - }, - { - "epoch": 23.86, - "learning_rate": 2.1107692307692306e-06, - "loss": 0.4046, - "step": 27530 - }, - { - "epoch": 23.86, - "learning_rate": 2.11006993006993e-06, - "loss": 0.3533, - "step": 27540 - }, - { - "epoch": 23.87, - "learning_rate": 2.1093706293706296e-06, - "loss": 0.3866, - "step": 27550 - }, - { - "epoch": 23.88, - "learning_rate": 2.1086713286713287e-06, - "loss": 0.3552, - "step": 27560 - }, - { - "epoch": 23.89, - "learning_rate": 2.1079720279720277e-06, - "loss": 0.3502, - "step": 27570 - }, - { - "epoch": 23.9, - "learning_rate": 2.1072727272727272e-06, - "loss": 0.3573, - "step": 27580 - }, - { - "epoch": 23.91, - "learning_rate": 2.1065734265734263e-06, - "loss": 0.3815, - "step": 27590 - }, - { - "epoch": 23.92, - "learning_rate": 2.105874125874126e-06, - "loss": 0.3983, - "step": 27600 - }, - { - "epoch": 23.93, - "learning_rate": 2.1051748251748253e-06, - "loss": 0.3672, - "step": 27610 - }, - { - "epoch": 23.93, - "learning_rate": 2.1044755244755244e-06, - "loss": 0.3297, - "step": 27620 - }, - { - "epoch": 23.94, - "learning_rate": 2.1037762237762234e-06, - "loss": 0.4176, - "step": 27630 - }, - { - "epoch": 23.95, - "learning_rate": 2.103076923076923e-06, - "loss": 0.4519, - "step": 27640 - }, - { - "epoch": 23.96, - "learning_rate": 2.1023776223776224e-06, - "loss": 0.3794, - "step": 27650 - }, - { - "epoch": 23.97, - "learning_rate": 2.1016783216783215e-06, - "loss": 0.3804, - "step": 27660 - }, - { - "epoch": 23.98, - "learning_rate": 2.1009790209790206e-06, - "loss": 0.3239, - "step": 27670 - }, - { - "epoch": 23.99, - "learning_rate": 2.10027972027972e-06, - "loss": 0.3851, - "step": 27680 - }, - { - "epoch": 23.99, - "learning_rate": 2.0995804195804196e-06, - "loss": 0.3415, - "step": 27690 - }, - { - "epoch": 24.0, - "eval_loss": 0.5621957182884216, - "eval_runtime": 135.5763, - "eval_samples_per_second": 3.924, - "eval_steps_per_second": 1.962, - "eval_wer": 0.250305328790898, - "step": 27696 - }, - { - "epoch": 24.0, - "learning_rate": 2.0988811188811187e-06, - "loss": 0.3816, - "step": 27700 - }, - { - "epoch": 24.01, - "learning_rate": 2.098181818181818e-06, - "loss": 0.4067, - "step": 27710 - }, - { - "epoch": 24.02, - "learning_rate": 2.0974825174825176e-06, - "loss": 0.3512, - "step": 27720 - }, - { - "epoch": 24.03, - "learning_rate": 2.0967832167832167e-06, - "loss": 0.368, - "step": 27730 - }, - { - "epoch": 24.04, - "learning_rate": 2.096083916083916e-06, - "loss": 0.4063, - "step": 27740 - }, - { - "epoch": 24.05, - "learning_rate": 2.0953846153846153e-06, - "loss": 0.3105, - "step": 27750 - }, - { - "epoch": 24.06, - "learning_rate": 2.0947552447552448e-06, - "loss": 0.3747, - "step": 27760 - }, - { - "epoch": 24.06, - "learning_rate": 2.094055944055944e-06, - "loss": 0.3939, - "step": 27770 - }, - { - "epoch": 24.07, - "learning_rate": 2.0933566433566433e-06, - "loss": 0.3713, - "step": 27780 - }, - { - "epoch": 24.08, - "learning_rate": 2.0926573426573424e-06, - "loss": 0.3839, - "step": 27790 - }, - { - "epoch": 24.09, - "learning_rate": 2.091958041958042e-06, - "loss": 0.3202, - "step": 27800 - }, - { - "epoch": 24.1, - "learning_rate": 2.0912587412587414e-06, - "loss": 0.3735, - "step": 27810 - }, - { - "epoch": 24.11, - "learning_rate": 2.0905594405594405e-06, - "loss": 0.3817, - "step": 27820 - }, - { - "epoch": 24.12, - "learning_rate": 2.0898601398601395e-06, - "loss": 0.388, - "step": 27830 - }, - { - "epoch": 24.12, - "learning_rate": 2.089160839160839e-06, - "loss": 0.3489, - "step": 27840 - }, - { - "epoch": 24.13, - "learning_rate": 2.0884615384615385e-06, - "loss": 0.3306, - "step": 27850 - }, - { - "epoch": 24.14, - "learning_rate": 2.0877622377622376e-06, - "loss": 0.358, - "step": 27860 - }, - { - "epoch": 24.15, - "learning_rate": 2.087062937062937e-06, - "loss": 0.395, - "step": 27870 - }, - { - "epoch": 24.16, - "learning_rate": 2.086363636363636e-06, - "loss": 0.419, - "step": 27880 - }, - { - "epoch": 24.17, - "learning_rate": 2.0856643356643357e-06, - "loss": 0.3394, - "step": 27890 - }, - { - "epoch": 24.18, - "learning_rate": 2.0849650349650347e-06, - "loss": 0.3663, - "step": 27900 - }, - { - "epoch": 24.19, - "learning_rate": 2.0842657342657342e-06, - "loss": 0.3996, - "step": 27910 - }, - { - "epoch": 24.19, - "learning_rate": 2.0835664335664337e-06, - "loss": 0.359, - "step": 27920 - }, - { - "epoch": 24.2, - "learning_rate": 2.0828671328671324e-06, - "loss": 0.4252, - "step": 27930 - }, - { - "epoch": 24.21, - "learning_rate": 2.082167832167832e-06, - "loss": 0.3889, - "step": 27940 - }, - { - "epoch": 24.22, - "learning_rate": 2.0814685314685314e-06, - "loss": 0.3811, - "step": 27950 - }, - { - "epoch": 24.23, - "learning_rate": 2.080769230769231e-06, - "loss": 0.3844, - "step": 27960 - }, - { - "epoch": 24.24, - "learning_rate": 2.08006993006993e-06, - "loss": 0.3364, - "step": 27970 - }, - { - "epoch": 24.25, - "learning_rate": 2.079370629370629e-06, - "loss": 0.4162, - "step": 27980 - }, - { - "epoch": 24.25, - "learning_rate": 2.0786713286713285e-06, - "loss": 0.4423, - "step": 27990 - }, - { - "epoch": 24.26, - "learning_rate": 2.077972027972028e-06, - "loss": 0.3822, - "step": 28000 - }, - { - "epoch": 24.27, - "learning_rate": 2.077272727272727e-06, - "loss": 0.3784, - "step": 28010 - }, - { - "epoch": 24.28, - "learning_rate": 2.0765734265734266e-06, - "loss": 0.3552, - "step": 28020 - }, - { - "epoch": 24.29, - "learning_rate": 2.075874125874126e-06, - "loss": 0.3577, - "step": 28030 - }, - { - "epoch": 24.3, - "learning_rate": 2.0751748251748247e-06, - "loss": 0.3526, - "step": 28040 - }, - { - "epoch": 24.31, - "learning_rate": 2.0744755244755242e-06, - "loss": 0.4053, - "step": 28050 - }, - { - "epoch": 24.32, - "learning_rate": 2.0737762237762237e-06, - "loss": 0.3904, - "step": 28060 - }, - { - "epoch": 24.32, - "learning_rate": 2.0730769230769232e-06, - "loss": 0.4229, - "step": 28070 - }, - { - "epoch": 24.33, - "learning_rate": 2.0723776223776223e-06, - "loss": 0.3946, - "step": 28080 - }, - { - "epoch": 24.34, - "learning_rate": 2.0716783216783214e-06, - "loss": 0.4186, - "step": 28090 - }, - { - "epoch": 24.35, - "learning_rate": 2.070979020979021e-06, - "loss": 0.3745, - "step": 28100 - }, - { - "epoch": 24.36, - "learning_rate": 2.07027972027972e-06, - "loss": 0.3804, - "step": 28110 - }, - { - "epoch": 24.37, - "learning_rate": 2.0695804195804194e-06, - "loss": 0.3588, - "step": 28120 - }, - { - "epoch": 24.38, - "learning_rate": 2.068881118881119e-06, - "loss": 0.3584, - "step": 28130 - }, - { - "epoch": 24.38, - "learning_rate": 2.0681818181818184e-06, - "loss": 0.4453, - "step": 28140 - }, - { - "epoch": 24.39, - "learning_rate": 2.067482517482517e-06, - "loss": 0.3888, - "step": 28150 - }, - { - "epoch": 24.4, - "learning_rate": 2.0667832167832166e-06, - "loss": 0.4119, - "step": 28160 - }, - { - "epoch": 24.41, - "learning_rate": 2.066083916083916e-06, - "loss": 0.3672, - "step": 28170 - }, - { - "epoch": 24.42, - "learning_rate": 2.0653846153846156e-06, - "loss": 0.366, - "step": 28180 - }, - { - "epoch": 24.43, - "learning_rate": 2.0646853146853147e-06, - "loss": 0.4376, - "step": 28190 - }, - { - "epoch": 24.44, - "learning_rate": 2.0639860139860137e-06, - "loss": 0.3449, - "step": 28200 - }, - { - "epoch": 24.45, - "learning_rate": 2.0632867132867132e-06, - "loss": 0.3657, - "step": 28210 - }, - { - "epoch": 24.45, - "learning_rate": 2.0625874125874123e-06, - "loss": 0.369, - "step": 28220 - }, - { - "epoch": 24.46, - "learning_rate": 2.061888111888112e-06, - "loss": 0.3602, - "step": 28230 - }, - { - "epoch": 24.47, - "learning_rate": 2.0611888111888113e-06, - "loss": 0.4175, - "step": 28240 - }, - { - "epoch": 24.48, - "learning_rate": 2.060489510489511e-06, - "loss": 0.3883, - "step": 28250 - }, - { - "epoch": 24.49, - "learning_rate": 2.0597902097902094e-06, - "loss": 0.3688, - "step": 28260 - }, - { - "epoch": 24.5, - "learning_rate": 2.059090909090909e-06, - "loss": 0.4029, - "step": 28270 - }, - { - "epoch": 24.51, - "learning_rate": 2.0583916083916084e-06, - "loss": 0.3525, - "step": 28280 - }, - { - "epoch": 24.51, - "learning_rate": 2.0576923076923075e-06, - "loss": 0.3956, - "step": 28290 - }, - { - "epoch": 24.52, - "learning_rate": 2.056993006993007e-06, - "loss": 0.3645, - "step": 28300 - }, - { - "epoch": 24.53, - "learning_rate": 2.056293706293706e-06, - "loss": 0.3766, - "step": 28310 - }, - { - "epoch": 24.54, - "learning_rate": 2.0555944055944056e-06, - "loss": 0.3573, - "step": 28320 - }, - { - "epoch": 24.55, - "learning_rate": 2.0548951048951046e-06, - "loss": 0.4017, - "step": 28330 - }, - { - "epoch": 24.56, - "learning_rate": 2.054195804195804e-06, - "loss": 0.3781, - "step": 28340 - }, - { - "epoch": 24.57, - "learning_rate": 2.0534965034965036e-06, - "loss": 0.36, - "step": 28350 - }, - { - "epoch": 24.58, - "learning_rate": 2.0527972027972027e-06, - "loss": 0.3383, - "step": 28360 - }, - { - "epoch": 24.58, - "learning_rate": 2.0520979020979018e-06, - "loss": 0.4027, - "step": 28370 - }, - { - "epoch": 24.59, - "learning_rate": 2.0513986013986013e-06, - "loss": 0.3551, - "step": 28380 - }, - { - "epoch": 24.6, - "learning_rate": 2.0506993006993008e-06, - "loss": 0.3997, - "step": 28390 - }, - { - "epoch": 24.61, - "learning_rate": 2.05e-06, - "loss": 0.4885, - "step": 28400 - }, - { - "epoch": 24.62, - "learning_rate": 2.0493006993006994e-06, - "loss": 0.4051, - "step": 28410 - }, - { - "epoch": 24.63, - "learning_rate": 2.0486013986013984e-06, - "loss": 0.3174, - "step": 28420 - }, - { - "epoch": 24.64, - "learning_rate": 2.047902097902098e-06, - "loss": 0.3527, - "step": 28430 - }, - { - "epoch": 24.64, - "learning_rate": 2.047202797202797e-06, - "loss": 0.409, - "step": 28440 - }, - { - "epoch": 24.65, - "learning_rate": 2.0465034965034965e-06, - "loss": 0.3858, - "step": 28450 - }, - { - "epoch": 24.66, - "learning_rate": 2.045804195804196e-06, - "loss": 0.4063, - "step": 28460 - }, - { - "epoch": 24.67, - "learning_rate": 2.0451048951048946e-06, - "loss": 0.4017, - "step": 28470 - }, - { - "epoch": 24.68, - "learning_rate": 2.044405594405594e-06, - "loss": 0.3747, - "step": 28480 - }, - { - "epoch": 24.69, - "learning_rate": 2.0437062937062936e-06, - "loss": 0.3442, - "step": 28490 - }, - { - "epoch": 24.7, - "learning_rate": 2.043006993006993e-06, - "loss": 0.4353, - "step": 28500 - }, - { - "epoch": 24.71, - "learning_rate": 2.042307692307692e-06, - "loss": 0.3733, - "step": 28510 - }, - { - "epoch": 24.71, - "learning_rate": 2.0416083916083917e-06, - "loss": 0.3516, - "step": 28520 - }, - { - "epoch": 24.72, - "learning_rate": 2.0409090909090908e-06, - "loss": 0.3923, - "step": 28530 - }, - { - "epoch": 24.73, - "learning_rate": 2.0402097902097903e-06, - "loss": 0.3526, - "step": 28540 - }, - { - "epoch": 24.74, - "learning_rate": 2.0395104895104893e-06, - "loss": 0.3825, - "step": 28550 - }, - { - "epoch": 24.75, - "learning_rate": 2.038811188811189e-06, - "loss": 0.3442, - "step": 28560 - }, - { - "epoch": 24.76, - "learning_rate": 2.0381118881118883e-06, - "loss": 0.4184, - "step": 28570 - }, - { - "epoch": 24.77, - "learning_rate": 2.037412587412587e-06, - "loss": 0.3586, - "step": 28580 - }, - { - "epoch": 24.77, - "learning_rate": 2.0367132867132865e-06, - "loss": 0.361, - "step": 28590 - }, - { - "epoch": 24.78, - "learning_rate": 2.036013986013986e-06, - "loss": 0.3993, - "step": 28600 - }, - { - "epoch": 24.79, - "learning_rate": 2.0353146853146855e-06, - "loss": 0.392, - "step": 28610 - }, - { - "epoch": 24.8, - "learning_rate": 2.0346153846153846e-06, - "loss": 0.3895, - "step": 28620 - }, - { - "epoch": 24.81, - "learning_rate": 2.0339160839160836e-06, - "loss": 0.3679, - "step": 28630 - }, - { - "epoch": 24.82, - "learning_rate": 2.033216783216783e-06, - "loss": 0.3637, - "step": 28640 - }, - { - "epoch": 24.83, - "learning_rate": 2.032517482517482e-06, - "loss": 0.3761, - "step": 28650 - }, - { - "epoch": 24.83, - "learning_rate": 2.0318181818181817e-06, - "loss": 0.3866, - "step": 28660 - }, - { - "epoch": 24.84, - "learning_rate": 2.031118881118881e-06, - "loss": 0.4122, - "step": 28670 - }, - { - "epoch": 24.85, - "learning_rate": 2.0304195804195807e-06, - "loss": 0.3918, - "step": 28680 - }, - { - "epoch": 24.86, - "learning_rate": 2.0297202797202793e-06, - "loss": 0.3436, - "step": 28690 - }, - { - "epoch": 24.87, - "learning_rate": 2.029020979020979e-06, - "loss": 0.396, - "step": 28700 - }, - { - "epoch": 24.88, - "learning_rate": 2.0283216783216783e-06, - "loss": 0.3699, - "step": 28710 - }, - { - "epoch": 24.89, - "learning_rate": 2.0276223776223774e-06, - "loss": 0.3412, - "step": 28720 - }, - { - "epoch": 24.9, - "learning_rate": 2.026923076923077e-06, - "loss": 0.3594, - "step": 28730 - }, - { - "epoch": 24.9, - "learning_rate": 2.026223776223776e-06, - "loss": 0.4354, - "step": 28740 - }, - { - "epoch": 24.91, - "learning_rate": 2.0255244755244755e-06, - "loss": 0.3387, - "step": 28750 - }, - { - "epoch": 24.92, - "learning_rate": 2.0248251748251745e-06, - "loss": 0.3553, - "step": 28760 - }, - { - "epoch": 24.93, - "learning_rate": 2.024125874125874e-06, - "loss": 0.3067, - "step": 28770 - }, - { - "epoch": 24.94, - "learning_rate": 2.0234265734265735e-06, - "loss": 0.3769, - "step": 28780 - }, - { - "epoch": 24.95, - "learning_rate": 2.022727272727273e-06, - "loss": 0.4394, - "step": 28790 - }, - { - "epoch": 24.96, - "learning_rate": 2.0220279720279717e-06, - "loss": 0.4139, - "step": 28800 - }, - { - "epoch": 24.96, - "learning_rate": 2.021328671328671e-06, - "loss": 0.3479, - "step": 28810 - }, - { - "epoch": 24.97, - "learning_rate": 2.0206293706293707e-06, - "loss": 0.3557, - "step": 28820 - }, - { - "epoch": 24.98, - "learning_rate": 2.0199300699300698e-06, - "loss": 0.4021, - "step": 28830 - }, - { - "epoch": 24.99, - "learning_rate": 2.0192307692307692e-06, - "loss": 0.407, - "step": 28840 - }, - { - "epoch": 25.0, - "learning_rate": 2.0185314685314683e-06, - "loss": 0.3938, - "step": 28850 - }, - { - "epoch": 25.0, - "eval_loss": 0.5533283352851868, - "eval_runtime": 134.8549, - "eval_samples_per_second": 3.945, - "eval_steps_per_second": 1.972, - "eval_wer": 0.2540978337725783, - "step": 28850 - }, - { - "epoch": 25.01, - "learning_rate": 2.017832167832168e-06, - "loss": 0.3985, - "step": 28860 - }, - { - "epoch": 25.02, - "learning_rate": 2.017132867132867e-06, - "loss": 0.3684, - "step": 28870 - }, - { - "epoch": 25.03, - "learning_rate": 2.0164335664335664e-06, - "loss": 0.3493, - "step": 28880 - }, - { - "epoch": 25.03, - "learning_rate": 2.015734265734266e-06, - "loss": 0.3979, - "step": 28890 - }, - { - "epoch": 25.04, - "learning_rate": 2.0150349650349645e-06, - "loss": 0.3724, - "step": 28900 - }, - { - "epoch": 25.05, - "learning_rate": 2.014335664335664e-06, - "loss": 0.3743, - "step": 28910 - }, - { - "epoch": 25.06, - "learning_rate": 2.0136363636363635e-06, - "loss": 0.3506, - "step": 28920 - }, - { - "epoch": 25.07, - "learning_rate": 2.012937062937063e-06, - "loss": 0.3633, - "step": 28930 - }, - { - "epoch": 25.08, - "learning_rate": 2.012237762237762e-06, - "loss": 0.3833, - "step": 28940 - }, - { - "epoch": 25.09, - "learning_rate": 2.0115384615384616e-06, - "loss": 0.3936, - "step": 28950 - }, - { - "epoch": 25.1, - "learning_rate": 2.0108391608391607e-06, - "loss": 0.4143, - "step": 28960 - }, - { - "epoch": 25.1, - "learning_rate": 2.01013986013986e-06, - "loss": 0.3808, - "step": 28970 - }, - { - "epoch": 25.11, - "learning_rate": 2.0094405594405592e-06, - "loss": 0.3896, - "step": 28980 - }, - { - "epoch": 25.12, - "learning_rate": 2.0087412587412587e-06, - "loss": 0.443, - "step": 28990 - }, - { - "epoch": 25.13, - "learning_rate": 2.0080419580419582e-06, - "loss": 0.4138, - "step": 29000 - }, - { - "epoch": 25.14, - "learning_rate": 2.007342657342657e-06, - "loss": 0.3609, - "step": 29010 - }, - { - "epoch": 25.15, - "learning_rate": 2.0066433566433564e-06, - "loss": 0.3322, - "step": 29020 - }, - { - "epoch": 25.16, - "learning_rate": 2.005944055944056e-06, - "loss": 0.3868, - "step": 29030 - }, - { - "epoch": 25.16, - "learning_rate": 2.0052447552447554e-06, - "loss": 0.3576, - "step": 29040 - }, - { - "epoch": 25.17, - "learning_rate": 2.0045454545454544e-06, - "loss": 0.4285, - "step": 29050 - }, - { - "epoch": 25.18, - "learning_rate": 2.003846153846154e-06, - "loss": 0.3718, - "step": 29060 - }, - { - "epoch": 25.19, - "learning_rate": 2.003146853146853e-06, - "loss": 0.3549, - "step": 29070 - }, - { - "epoch": 25.2, - "learning_rate": 2.002447552447552e-06, - "loss": 0.3326, - "step": 29080 - }, - { - "epoch": 25.21, - "learning_rate": 2.0017482517482516e-06, - "loss": 0.3645, - "step": 29090 - }, - { - "epoch": 25.22, - "learning_rate": 2.001048951048951e-06, - "loss": 0.4107, - "step": 29100 - }, - { - "epoch": 25.23, - "learning_rate": 2.0003496503496506e-06, - "loss": 0.379, - "step": 29110 - }, - { - "epoch": 25.23, - "learning_rate": 1.9996503496503497e-06, - "loss": 0.4511, - "step": 29120 - }, - { - "epoch": 25.24, - "learning_rate": 1.9989510489510487e-06, - "loss": 0.2738, - "step": 29130 - }, - { - "epoch": 25.25, - "learning_rate": 1.9982517482517482e-06, - "loss": 0.3324, - "step": 29140 - }, - { - "epoch": 25.26, - "learning_rate": 1.9975524475524473e-06, - "loss": 0.3471, - "step": 29150 - }, - { - "epoch": 25.27, - "learning_rate": 1.996853146853147e-06, - "loss": 0.3251, - "step": 29160 - }, - { - "epoch": 25.28, - "learning_rate": 1.996153846153846e-06, - "loss": 0.3745, - "step": 29170 - }, - { - "epoch": 25.29, - "learning_rate": 1.9954545454545454e-06, - "loss": 0.3525, - "step": 29180 - }, - { - "epoch": 25.29, - "learning_rate": 1.994755244755245e-06, - "loss": 0.4024, - "step": 29190 - }, - { - "epoch": 25.3, - "learning_rate": 1.994055944055944e-06, - "loss": 0.3859, - "step": 29200 - }, - { - "epoch": 25.31, - "learning_rate": 1.9933566433566434e-06, - "loss": 0.3689, - "step": 29210 - }, - { - "epoch": 25.32, - "learning_rate": 1.9926573426573425e-06, - "loss": 0.3818, - "step": 29220 - }, - { - "epoch": 25.33, - "learning_rate": 1.991958041958042e-06, - "loss": 0.392, - "step": 29230 - }, - { - "epoch": 25.34, - "learning_rate": 1.991258741258741e-06, - "loss": 0.4117, - "step": 29240 - }, - { - "epoch": 25.35, - "learning_rate": 1.99055944055944e-06, - "loss": 0.3697, - "step": 29250 - }, - { - "epoch": 25.36, - "learning_rate": 1.9898601398601397e-06, - "loss": 0.4136, - "step": 29260 - }, - { - "epoch": 25.36, - "learning_rate": 1.989160839160839e-06, - "loss": 0.3876, - "step": 29270 - }, - { - "epoch": 25.37, - "learning_rate": 1.9884615384615382e-06, - "loss": 0.4172, - "step": 29280 - }, - { - "epoch": 25.38, - "learning_rate": 1.9877622377622377e-06, - "loss": 0.4208, - "step": 29290 - }, - { - "epoch": 25.39, - "learning_rate": 1.9870629370629372e-06, - "loss": 0.3257, - "step": 29300 - }, - { - "epoch": 25.4, - "learning_rate": 1.9863636363636363e-06, - "loss": 0.3967, - "step": 29310 - }, - { - "epoch": 25.41, - "learning_rate": 1.9856643356643358e-06, - "loss": 0.4194, - "step": 29320 - }, - { - "epoch": 25.42, - "learning_rate": 1.984965034965035e-06, - "loss": 0.3644, - "step": 29330 - }, - { - "epoch": 25.42, - "learning_rate": 1.984265734265734e-06, - "loss": 0.439, - "step": 29340 - }, - { - "epoch": 25.43, - "learning_rate": 1.9835664335664334e-06, - "loss": 0.4496, - "step": 29350 - }, - { - "epoch": 25.44, - "learning_rate": 1.9828671328671325e-06, - "loss": 0.3671, - "step": 29360 - }, - { - "epoch": 25.45, - "learning_rate": 1.982167832167832e-06, - "loss": 0.3465, - "step": 29370 - }, - { - "epoch": 25.46, - "learning_rate": 1.9814685314685315e-06, - "loss": 0.3648, - "step": 29380 - }, - { - "epoch": 25.47, - "learning_rate": 1.9807692307692306e-06, - "loss": 0.3448, - "step": 29390 - }, - { - "epoch": 25.48, - "learning_rate": 1.98006993006993e-06, - "loss": 0.366, - "step": 29400 - }, - { - "epoch": 25.49, - "learning_rate": 1.9793706293706296e-06, - "loss": 0.4236, - "step": 29410 - }, - { - "epoch": 25.49, - "learning_rate": 1.9786713286713286e-06, - "loss": 0.3443, - "step": 29420 - }, - { - "epoch": 25.5, - "learning_rate": 1.9779720279720277e-06, - "loss": 0.3399, - "step": 29430 - }, - { - "epoch": 25.51, - "learning_rate": 1.977272727272727e-06, - "loss": 0.3953, - "step": 29440 - }, - { - "epoch": 25.52, - "learning_rate": 1.9765734265734263e-06, - "loss": 0.3883, - "step": 29450 - }, - { - "epoch": 25.53, - "learning_rate": 1.9758741258741258e-06, - "loss": 0.3768, - "step": 29460 - }, - { - "epoch": 25.54, - "learning_rate": 1.975174825174825e-06, - "loss": 0.3587, - "step": 29470 - }, - { - "epoch": 25.55, - "learning_rate": 1.9744755244755243e-06, - "loss": 0.3948, - "step": 29480 - }, - { - "epoch": 25.55, - "learning_rate": 1.973776223776224e-06, - "loss": 0.3911, - "step": 29490 - }, - { - "epoch": 25.56, - "learning_rate": 1.973076923076923e-06, - "loss": 0.4282, - "step": 29500 - }, - { - "epoch": 25.57, - "learning_rate": 1.9723776223776224e-06, - "loss": 0.3315, - "step": 29510 - }, - { - "epoch": 25.58, - "learning_rate": 1.9716783216783215e-06, - "loss": 0.3706, - "step": 29520 - }, - { - "epoch": 25.59, - "learning_rate": 1.970979020979021e-06, - "loss": 0.4202, - "step": 29530 - }, - { - "epoch": 25.6, - "learning_rate": 1.97027972027972e-06, - "loss": 0.3886, - "step": 29540 - }, - { - "epoch": 25.61, - "learning_rate": 1.9695804195804196e-06, - "loss": 0.3891, - "step": 29550 - }, - { - "epoch": 25.61, - "learning_rate": 1.9688811188811186e-06, - "loss": 0.3281, - "step": 29560 - }, - { - "epoch": 25.62, - "learning_rate": 1.968181818181818e-06, - "loss": 0.4184, - "step": 29570 - }, - { - "epoch": 25.63, - "learning_rate": 1.967482517482517e-06, - "loss": 0.3783, - "step": 29580 - }, - { - "epoch": 25.64, - "learning_rate": 1.9667832167832167e-06, - "loss": 0.3379, - "step": 29590 - }, - { - "epoch": 25.65, - "learning_rate": 1.966083916083916e-06, - "loss": 0.3912, - "step": 29600 - }, - { - "epoch": 25.66, - "learning_rate": 1.9653846153846153e-06, - "loss": 0.4055, - "step": 29610 - }, - { - "epoch": 25.67, - "learning_rate": 1.9646853146853148e-06, - "loss": 0.3494, - "step": 29620 - }, - { - "epoch": 25.68, - "learning_rate": 1.963986013986014e-06, - "loss": 0.3599, - "step": 29630 - }, - { - "epoch": 25.68, - "learning_rate": 1.9632867132867133e-06, - "loss": 0.4213, - "step": 29640 - }, - { - "epoch": 25.69, - "learning_rate": 1.9625874125874124e-06, - "loss": 0.3993, - "step": 29650 - }, - { - "epoch": 25.7, - "learning_rate": 1.961888111888112e-06, - "loss": 0.3751, - "step": 29660 - }, - { - "epoch": 25.71, - "learning_rate": 1.961188811188811e-06, - "loss": 0.3582, - "step": 29670 - }, - { - "epoch": 25.72, - "learning_rate": 1.9604895104895105e-06, - "loss": 0.3391, - "step": 29680 - }, - { - "epoch": 25.73, - "learning_rate": 1.9597902097902095e-06, - "loss": 0.3844, - "step": 29690 - }, - { - "epoch": 25.74, - "learning_rate": 1.959090909090909e-06, - "loss": 0.4644, - "step": 29700 - }, - { - "epoch": 25.74, - "learning_rate": 1.958391608391608e-06, - "loss": 0.3793, - "step": 29710 - }, - { - "epoch": 25.75, - "learning_rate": 1.9576923076923076e-06, - "loss": 0.438, - "step": 29720 - }, - { - "epoch": 25.76, - "learning_rate": 1.956993006993007e-06, - "loss": 0.3883, - "step": 29730 - }, - { - "epoch": 25.77, - "learning_rate": 1.956293706293706e-06, - "loss": 0.3923, - "step": 29740 - }, - { - "epoch": 25.78, - "learning_rate": 1.9555944055944057e-06, - "loss": 0.4291, - "step": 29750 - }, - { - "epoch": 25.79, - "learning_rate": 1.9548951048951048e-06, - "loss": 0.359, - "step": 29760 - }, - { - "epoch": 25.8, - "learning_rate": 1.9541958041958043e-06, - "loss": 0.4473, - "step": 29770 - }, - { - "epoch": 25.81, - "learning_rate": 1.9534965034965033e-06, - "loss": 0.3519, - "step": 29780 - }, - { - "epoch": 25.81, - "learning_rate": 1.952797202797203e-06, - "loss": 0.3373, - "step": 29790 - }, - { - "epoch": 25.82, - "learning_rate": 1.952097902097902e-06, - "loss": 0.3667, - "step": 29800 - }, - { - "epoch": 25.83, - "learning_rate": 1.9513986013986014e-06, - "loss": 0.3505, - "step": 29810 - }, - { - "epoch": 25.84, - "learning_rate": 1.9506993006993005e-06, - "loss": 0.3392, - "step": 29820 - }, - { - "epoch": 25.85, - "learning_rate": 1.95e-06, - "loss": 0.3719, - "step": 29830 - }, - { - "epoch": 25.86, - "learning_rate": 1.9493006993006995e-06, - "loss": 0.3555, - "step": 29840 - }, - { - "epoch": 25.87, - "learning_rate": 1.9486013986013985e-06, - "loss": 0.4009, - "step": 29850 - }, - { - "epoch": 25.87, - "learning_rate": 1.947902097902098e-06, - "loss": 0.3475, - "step": 29860 - }, - { - "epoch": 25.88, - "learning_rate": 1.947202797202797e-06, - "loss": 0.4121, - "step": 29870 - }, - { - "epoch": 25.89, - "learning_rate": 1.946503496503496e-06, - "loss": 0.37, - "step": 29880 - }, - { - "epoch": 25.9, - "learning_rate": 1.9458041958041957e-06, - "loss": 0.3507, - "step": 29890 - }, - { - "epoch": 25.91, - "learning_rate": 1.9451048951048947e-06, - "loss": 0.4051, - "step": 29900 - }, - { - "epoch": 25.92, - "learning_rate": 1.9444055944055942e-06, - "loss": 0.3669, - "step": 29910 - }, - { - "epoch": 25.93, - "learning_rate": 1.9437062937062937e-06, - "loss": 0.3776, - "step": 29920 - }, - { - "epoch": 25.94, - "learning_rate": 1.943006993006993e-06, - "loss": 0.3033, - "step": 29930 - }, - { - "epoch": 25.94, - "learning_rate": 1.9423076923076923e-06, - "loss": 0.4222, - "step": 29940 - }, - { - "epoch": 25.95, - "learning_rate": 1.941608391608392e-06, - "loss": 0.4284, - "step": 29950 - }, - { - "epoch": 25.96, - "learning_rate": 1.940979020979021e-06, - "loss": 0.3916, - "step": 29960 - }, - { - "epoch": 25.97, - "learning_rate": 1.94027972027972e-06, - "loss": 0.3203, - "step": 29970 - }, - { - "epoch": 25.98, - "learning_rate": 1.9395804195804194e-06, - "loss": 0.3179, - "step": 29980 - }, - { - "epoch": 25.99, - "learning_rate": 1.938881118881119e-06, - "loss": 0.4541, - "step": 29990 - }, - { - "epoch": 26.0, - "learning_rate": 1.938181818181818e-06, - "loss": 0.4509, - "step": 30000 - }, - { - "epoch": 26.0, - "eval_loss": 0.5566795468330383, - "eval_runtime": 137.3215, - "eval_samples_per_second": 3.874, - "eval_steps_per_second": 1.937, - "eval_wer": 0.24863405540914058, - "step": 30004 - }, - { - "epoch": 26.01, - "learning_rate": 1.9374825174825175e-06, - "loss": 0.331, - "step": 30010 - }, - { - "epoch": 26.01, - "learning_rate": 1.9367832167832166e-06, - "loss": 0.341, - "step": 30020 - }, - { - "epoch": 26.02, - "learning_rate": 1.936083916083916e-06, - "loss": 0.3829, - "step": 30030 - }, - { - "epoch": 26.03, - "learning_rate": 1.9353846153846156e-06, - "loss": 0.4277, - "step": 30040 - }, - { - "epoch": 26.04, - "learning_rate": 1.9346853146853146e-06, - "loss": 0.3695, - "step": 30050 - }, - { - "epoch": 26.05, - "learning_rate": 1.9339860139860137e-06, - "loss": 0.3736, - "step": 30060 - }, - { - "epoch": 26.06, - "learning_rate": 1.933286713286713e-06, - "loss": 0.3632, - "step": 30070 - }, - { - "epoch": 26.07, - "learning_rate": 1.9325874125874123e-06, - "loss": 0.3675, - "step": 30080 - }, - { - "epoch": 26.07, - "learning_rate": 1.9318881118881118e-06, - "loss": 0.3919, - "step": 30090 - }, - { - "epoch": 26.08, - "learning_rate": 1.931188811188811e-06, - "loss": 0.4781, - "step": 30100 - }, - { - "epoch": 26.09, - "learning_rate": 1.9304895104895103e-06, - "loss": 0.4024, - "step": 30110 - }, - { - "epoch": 26.1, - "learning_rate": 1.92979020979021e-06, - "loss": 0.3457, - "step": 30120 - }, - { - "epoch": 26.11, - "learning_rate": 1.929090909090909e-06, - "loss": 0.373, - "step": 30130 - }, - { - "epoch": 26.12, - "learning_rate": 1.9283916083916084e-06, - "loss": 0.4276, - "step": 30140 - }, - { - "epoch": 26.13, - "learning_rate": 1.9276923076923075e-06, - "loss": 0.3916, - "step": 30150 - }, - { - "epoch": 26.14, - "learning_rate": 1.926993006993007e-06, - "loss": 0.3897, - "step": 30160 - }, - { - "epoch": 26.14, - "learning_rate": 1.926293706293706e-06, - "loss": 0.3996, - "step": 30170 - }, - { - "epoch": 26.15, - "learning_rate": 1.9255944055944055e-06, - "loss": 0.3456, - "step": 30180 - }, - { - "epoch": 26.16, - "learning_rate": 1.9248951048951046e-06, - "loss": 0.3332, - "step": 30190 - }, - { - "epoch": 26.17, - "learning_rate": 1.924195804195804e-06, - "loss": 0.3873, - "step": 30200 - }, - { - "epoch": 26.18, - "learning_rate": 1.923496503496503e-06, - "loss": 0.3484, - "step": 30210 - }, - { - "epoch": 26.19, - "learning_rate": 1.9227972027972027e-06, - "loss": 0.3626, - "step": 30220 - }, - { - "epoch": 26.2, - "learning_rate": 1.922097902097902e-06, - "loss": 0.3595, - "step": 30230 - }, - { - "epoch": 26.2, - "learning_rate": 1.9213986013986013e-06, - "loss": 0.4079, - "step": 30240 - }, - { - "epoch": 26.21, - "learning_rate": 1.9206993006993008e-06, - "loss": 0.3836, - "step": 30250 - }, - { - "epoch": 26.22, - "learning_rate": 1.92e-06, - "loss": 0.4066, - "step": 30260 - }, - { - "epoch": 26.23, - "learning_rate": 1.9193006993006993e-06, - "loss": 0.3826, - "step": 30270 - }, - { - "epoch": 26.24, - "learning_rate": 1.9186013986013984e-06, - "loss": 0.3621, - "step": 30280 - }, - { - "epoch": 26.25, - "learning_rate": 1.917902097902098e-06, - "loss": 0.399, - "step": 30290 - }, - { - "epoch": 26.26, - "learning_rate": 1.917202797202797e-06, - "loss": 0.468, - "step": 30300 - }, - { - "epoch": 26.27, - "learning_rate": 1.9165034965034965e-06, - "loss": 0.3621, - "step": 30310 - }, - { - "epoch": 26.27, - "learning_rate": 1.9158041958041955e-06, - "loss": 0.4275, - "step": 30320 - }, - { - "epoch": 26.28, - "learning_rate": 1.915104895104895e-06, - "loss": 0.3894, - "step": 30330 - }, - { - "epoch": 26.29, - "learning_rate": 1.9144055944055945e-06, - "loss": 0.3466, - "step": 30340 - }, - { - "epoch": 26.3, - "learning_rate": 1.9137062937062936e-06, - "loss": 0.4006, - "step": 30350 - }, - { - "epoch": 26.31, - "learning_rate": 1.913006993006993e-06, - "loss": 0.3204, - "step": 30360 - }, - { - "epoch": 26.32, - "learning_rate": 1.912307692307692e-06, - "loss": 0.4006, - "step": 30370 - }, - { - "epoch": 26.33, - "learning_rate": 1.9116083916083917e-06, - "loss": 0.3396, - "step": 30380 - }, - { - "epoch": 26.33, - "learning_rate": 1.9109090909090907e-06, - "loss": 0.3836, - "step": 30390 - }, - { - "epoch": 26.34, - "learning_rate": 1.9102097902097902e-06, - "loss": 0.3941, - "step": 30400 - }, - { - "epoch": 26.35, - "learning_rate": 1.9095104895104893e-06, - "loss": 0.4129, - "step": 30410 - }, - { - "epoch": 26.36, - "learning_rate": 1.908811188811189e-06, - "loss": 0.4021, - "step": 30420 - }, - { - "epoch": 26.37, - "learning_rate": 1.908111888111888e-06, - "loss": 0.3448, - "step": 30430 - }, - { - "epoch": 26.38, - "learning_rate": 1.9074125874125874e-06, - "loss": 0.3963, - "step": 30440 - }, - { - "epoch": 26.39, - "learning_rate": 1.9067132867132867e-06, - "loss": 0.3782, - "step": 30450 - }, - { - "epoch": 26.39, - "learning_rate": 1.906013986013986e-06, - "loss": 0.3195, - "step": 30460 - }, - { - "epoch": 26.4, - "learning_rate": 1.9053146853146852e-06, - "loss": 0.4381, - "step": 30470 - }, - { - "epoch": 26.41, - "learning_rate": 1.9046153846153845e-06, - "loss": 0.3247, - "step": 30480 - }, - { - "epoch": 26.42, - "learning_rate": 1.903916083916084e-06, - "loss": 0.379, - "step": 30490 - }, - { - "epoch": 26.43, - "learning_rate": 1.903216783216783e-06, - "loss": 0.3943, - "step": 30500 - }, - { - "epoch": 26.44, - "learning_rate": 1.9025174825174824e-06, - "loss": 0.3868, - "step": 30510 - }, - { - "epoch": 26.45, - "learning_rate": 1.9018181818181817e-06, - "loss": 0.3622, - "step": 30520 - }, - { - "epoch": 26.46, - "learning_rate": 1.901118881118881e-06, - "loss": 0.4147, - "step": 30530 - }, - { - "epoch": 26.46, - "learning_rate": 1.9004195804195804e-06, - "loss": 0.4051, - "step": 30540 - }, - { - "epoch": 26.47, - "learning_rate": 1.8997202797202795e-06, - "loss": 0.3756, - "step": 30550 - }, - { - "epoch": 26.48, - "learning_rate": 1.899020979020979e-06, - "loss": 0.376, - "step": 30560 - }, - { - "epoch": 26.49, - "learning_rate": 1.8983216783216783e-06, - "loss": 0.364, - "step": 30570 - }, - { - "epoch": 26.5, - "learning_rate": 1.8976223776223776e-06, - "loss": 0.3638, - "step": 30580 - }, - { - "epoch": 26.51, - "learning_rate": 1.8969230769230769e-06, - "loss": 0.3573, - "step": 30590 - }, - { - "epoch": 26.52, - "learning_rate": 1.896223776223776e-06, - "loss": 0.3813, - "step": 30600 - }, - { - "epoch": 26.52, - "learning_rate": 1.8955244755244754e-06, - "loss": 0.3925, - "step": 30610 - }, - { - "epoch": 26.53, - "learning_rate": 1.8948251748251747e-06, - "loss": 0.3528, - "step": 30620 - }, - { - "epoch": 26.54, - "learning_rate": 1.894125874125874e-06, - "loss": 0.361, - "step": 30630 - }, - { - "epoch": 26.55, - "learning_rate": 1.8934265734265733e-06, - "loss": 0.3667, - "step": 30640 - }, - { - "epoch": 26.56, - "learning_rate": 1.8927272727272728e-06, - "loss": 0.3815, - "step": 30650 - }, - { - "epoch": 26.57, - "learning_rate": 1.8920279720279719e-06, - "loss": 0.4043, - "step": 30660 - }, - { - "epoch": 26.58, - "learning_rate": 1.8913286713286712e-06, - "loss": 0.3642, - "step": 30670 - }, - { - "epoch": 26.59, - "learning_rate": 1.8906293706293707e-06, - "loss": 0.3322, - "step": 30680 - }, - { - "epoch": 26.59, - "learning_rate": 1.8899300699300697e-06, - "loss": 0.4152, - "step": 30690 - }, - { - "epoch": 26.6, - "learning_rate": 1.8892307692307692e-06, - "loss": 0.4589, - "step": 30700 - }, - { - "epoch": 26.61, - "learning_rate": 1.8885314685314683e-06, - "loss": 0.3927, - "step": 30710 - }, - { - "epoch": 26.62, - "learning_rate": 1.8878321678321678e-06, - "loss": 0.3514, - "step": 30720 - }, - { - "epoch": 26.63, - "learning_rate": 1.887132867132867e-06, - "loss": 0.3987, - "step": 30730 - }, - { - "epoch": 26.64, - "learning_rate": 1.8864335664335664e-06, - "loss": 0.3924, - "step": 30740 - }, - { - "epoch": 26.65, - "learning_rate": 1.8857342657342656e-06, - "loss": 0.3721, - "step": 30750 - }, - { - "epoch": 26.65, - "learning_rate": 1.885034965034965e-06, - "loss": 0.4027, - "step": 30760 - }, - { - "epoch": 26.66, - "learning_rate": 1.8843356643356642e-06, - "loss": 0.3327, - "step": 30770 - }, - { - "epoch": 26.67, - "learning_rate": 1.8836363636363635e-06, - "loss": 0.3517, - "step": 30780 - }, - { - "epoch": 26.68, - "learning_rate": 1.8829370629370628e-06, - "loss": 0.3319, - "step": 30790 - }, - { - "epoch": 26.69, - "learning_rate": 1.882237762237762e-06, - "loss": 0.3603, - "step": 30800 - }, - { - "epoch": 26.7, - "learning_rate": 1.8815384615384616e-06, - "loss": 0.4292, - "step": 30810 - }, - { - "epoch": 26.71, - "learning_rate": 1.8808391608391606e-06, - "loss": 0.3922, - "step": 30820 - }, - { - "epoch": 26.72, - "learning_rate": 1.8801398601398601e-06, - "loss": 0.3476, - "step": 30830 - }, - { - "epoch": 26.72, - "learning_rate": 1.8794405594405594e-06, - "loss": 0.378, - "step": 30840 - }, - { - "epoch": 26.73, - "learning_rate": 1.8787412587412585e-06, - "loss": 0.4082, - "step": 30850 - }, - { - "epoch": 26.74, - "learning_rate": 1.878041958041958e-06, - "loss": 0.3795, - "step": 30860 - }, - { - "epoch": 26.75, - "learning_rate": 1.877342657342657e-06, - "loss": 0.3642, - "step": 30870 - }, - { - "epoch": 26.76, - "learning_rate": 1.8766433566433566e-06, - "loss": 0.3987, - "step": 30880 - }, - { - "epoch": 26.77, - "learning_rate": 1.8759440559440559e-06, - "loss": 0.3377, - "step": 30890 - }, - { - "epoch": 26.78, - "learning_rate": 1.8752447552447551e-06, - "loss": 0.4408, - "step": 30900 - }, - { - "epoch": 26.78, - "learning_rate": 1.8745454545454544e-06, - "loss": 0.3129, - "step": 30910 - }, - { - "epoch": 26.79, - "learning_rate": 1.873846153846154e-06, - "loss": 0.3814, - "step": 30920 - }, - { - "epoch": 26.8, - "learning_rate": 1.873146853146853e-06, - "loss": 0.3311, - "step": 30930 - }, - { - "epoch": 26.81, - "learning_rate": 1.8724475524475523e-06, - "loss": 0.3986, - "step": 30940 - }, - { - "epoch": 26.82, - "learning_rate": 1.8717482517482518e-06, - "loss": 0.3727, - "step": 30950 - }, - { - "epoch": 26.83, - "learning_rate": 1.8710489510489508e-06, - "loss": 0.3677, - "step": 30960 - }, - { - "epoch": 26.84, - "learning_rate": 1.8703496503496503e-06, - "loss": 0.3461, - "step": 30970 - }, - { - "epoch": 26.85, - "learning_rate": 1.8696503496503494e-06, - "loss": 0.3699, - "step": 30980 - }, - { - "epoch": 26.85, - "learning_rate": 1.868951048951049e-06, - "loss": 0.4387, - "step": 30990 - }, - { - "epoch": 26.86, - "learning_rate": 1.8682517482517482e-06, - "loss": 0.3552, - "step": 31000 - }, - { - "epoch": 26.87, - "learning_rate": 1.8675524475524475e-06, - "loss": 0.3734, - "step": 31010 - }, - { - "epoch": 26.88, - "learning_rate": 1.8668531468531468e-06, - "loss": 0.4173, - "step": 31020 - }, - { - "epoch": 26.89, - "learning_rate": 1.866153846153846e-06, - "loss": 0.3429, - "step": 31030 - }, - { - "epoch": 26.9, - "learning_rate": 1.8654545454545453e-06, - "loss": 0.4001, - "step": 31040 - }, - { - "epoch": 26.91, - "learning_rate": 1.8647552447552446e-06, - "loss": 0.3468, - "step": 31050 - }, - { - "epoch": 26.91, - "learning_rate": 1.864055944055944e-06, - "loss": 0.3783, - "step": 31060 - }, - { - "epoch": 26.92, - "learning_rate": 1.8633566433566432e-06, - "loss": 0.3875, - "step": 31070 - }, - { - "epoch": 26.93, - "learning_rate": 1.8626573426573427e-06, - "loss": 0.3293, - "step": 31080 - }, - { - "epoch": 26.94, - "learning_rate": 1.8619580419580418e-06, - "loss": 0.3913, - "step": 31090 - }, - { - "epoch": 26.95, - "learning_rate": 1.8612587412587413e-06, - "loss": 0.4083, - "step": 31100 - }, - { - "epoch": 26.96, - "learning_rate": 1.8605594405594406e-06, - "loss": 0.3357, - "step": 31110 - }, - { - "epoch": 26.97, - "learning_rate": 1.8598601398601396e-06, - "loss": 0.3768, - "step": 31120 - }, - { - "epoch": 26.98, - "learning_rate": 1.8591608391608391e-06, - "loss": 0.3425, - "step": 31130 - }, - { - "epoch": 26.98, - "learning_rate": 1.8584615384615384e-06, - "loss": 0.4, - "step": 31140 - }, - { - "epoch": 26.99, - "learning_rate": 1.8577622377622377e-06, - "loss": 0.3583, - "step": 31150 - }, - { - "epoch": 27.0, - "eval_loss": 0.5641392469406128, - "eval_runtime": 136.2547, - "eval_samples_per_second": 3.904, - "eval_steps_per_second": 1.952, - "eval_wer": 0.25229800089991644, - "step": 31158 - }, - { - "epoch": 27.0, - "learning_rate": 1.857062937062937e-06, - "loss": 0.4314, - "step": 31160 - }, - { - "epoch": 27.01, - "learning_rate": 1.8563636363636363e-06, - "loss": 0.4011, - "step": 31170 - }, - { - "epoch": 27.02, - "learning_rate": 1.8556643356643355e-06, - "loss": 0.3816, - "step": 31180 - }, - { - "epoch": 27.03, - "learning_rate": 1.854965034965035e-06, - "loss": 0.3846, - "step": 31190 - }, - { - "epoch": 27.04, - "learning_rate": 1.8542657342657341e-06, - "loss": 0.3608, - "step": 31200 - }, - { - "epoch": 27.05, - "learning_rate": 1.8535664335664334e-06, - "loss": 0.3791, - "step": 31210 - }, - { - "epoch": 27.05, - "learning_rate": 1.852867132867133e-06, - "loss": 0.4113, - "step": 31220 - }, - { - "epoch": 27.06, - "learning_rate": 1.852167832167832e-06, - "loss": 0.3469, - "step": 31230 - }, - { - "epoch": 27.07, - "learning_rate": 1.8514685314685315e-06, - "loss": 0.3932, - "step": 31240 - }, - { - "epoch": 27.08, - "learning_rate": 1.8507692307692305e-06, - "loss": 0.3928, - "step": 31250 - }, - { - "epoch": 27.09, - "learning_rate": 1.85006993006993e-06, - "loss": 0.328, - "step": 31260 - }, - { - "epoch": 27.1, - "learning_rate": 1.8493706293706293e-06, - "loss": 0.3303, - "step": 31270 - }, - { - "epoch": 27.11, - "learning_rate": 1.8486713286713286e-06, - "loss": 0.3637, - "step": 31280 - }, - { - "epoch": 27.11, - "learning_rate": 1.847972027972028e-06, - "loss": 0.3607, - "step": 31290 - }, - { - "epoch": 27.12, - "learning_rate": 1.8472727272727272e-06, - "loss": 0.394, - "step": 31300 - }, - { - "epoch": 27.13, - "learning_rate": 1.8465734265734265e-06, - "loss": 0.4039, - "step": 31310 - }, - { - "epoch": 27.14, - "learning_rate": 1.8458741258741258e-06, - "loss": 0.3861, - "step": 31320 - }, - { - "epoch": 27.15, - "learning_rate": 1.8451748251748252e-06, - "loss": 0.3385, - "step": 31330 - }, - { - "epoch": 27.16, - "learning_rate": 1.8444755244755243e-06, - "loss": 0.3482, - "step": 31340 - }, - { - "epoch": 27.17, - "learning_rate": 1.8437762237762238e-06, - "loss": 0.3543, - "step": 31350 - }, - { - "epoch": 27.17, - "learning_rate": 1.8430769230769229e-06, - "loss": 0.4551, - "step": 31360 - }, - { - "epoch": 27.18, - "learning_rate": 1.8423776223776224e-06, - "loss": 0.3558, - "step": 31370 - }, - { - "epoch": 27.19, - "learning_rate": 1.8416783216783217e-06, - "loss": 0.3725, - "step": 31380 - }, - { - "epoch": 27.2, - "learning_rate": 1.8409790209790207e-06, - "loss": 0.3708, - "step": 31390 - }, - { - "epoch": 27.21, - "learning_rate": 1.8402797202797202e-06, - "loss": 0.3762, - "step": 31400 - }, - { - "epoch": 27.22, - "learning_rate": 1.8395804195804195e-06, - "loss": 0.3454, - "step": 31410 - }, - { - "epoch": 27.23, - "learning_rate": 1.8388811188811188e-06, - "loss": 0.3676, - "step": 31420 - }, - { - "epoch": 27.24, - "learning_rate": 1.838181818181818e-06, - "loss": 0.3525, - "step": 31430 - }, - { - "epoch": 27.24, - "learning_rate": 1.8374825174825174e-06, - "loss": 0.369, - "step": 31440 - }, - { - "epoch": 27.25, - "learning_rate": 1.8367832167832167e-06, - "loss": 0.391, - "step": 31450 - }, - { - "epoch": 27.26, - "learning_rate": 1.8360839160839162e-06, - "loss": 0.3938, - "step": 31460 - }, - { - "epoch": 27.27, - "learning_rate": 1.8353846153846152e-06, - "loss": 0.3873, - "step": 31470 - }, - { - "epoch": 27.28, - "learning_rate": 1.8346853146853145e-06, - "loss": 0.3405, - "step": 31480 - }, - { - "epoch": 27.29, - "learning_rate": 1.833986013986014e-06, - "loss": 0.3682, - "step": 31490 - }, - { - "epoch": 27.3, - "learning_rate": 1.833286713286713e-06, - "loss": 0.3943, - "step": 31500 - }, - { - "epoch": 27.3, - "learning_rate": 1.8325874125874126e-06, - "loss": 0.3856, - "step": 31510 - }, - { - "epoch": 27.31, - "learning_rate": 1.8318881118881117e-06, - "loss": 0.416, - "step": 31520 - }, - { - "epoch": 27.32, - "learning_rate": 1.8311888111888112e-06, - "loss": 0.3424, - "step": 31530 - }, - { - "epoch": 27.33, - "learning_rate": 1.8304895104895104e-06, - "loss": 0.3573, - "step": 31540 - }, - { - "epoch": 27.34, - "learning_rate": 1.8297902097902097e-06, - "loss": 0.3489, - "step": 31550 - }, - { - "epoch": 27.35, - "learning_rate": 1.829090909090909e-06, - "loss": 0.4039, - "step": 31560 - }, - { - "epoch": 27.36, - "learning_rate": 1.8283916083916083e-06, - "loss": 0.3618, - "step": 31570 - }, - { - "epoch": 27.37, - "learning_rate": 1.8276923076923076e-06, - "loss": 0.3253, - "step": 31580 - }, - { - "epoch": 27.37, - "learning_rate": 1.8269930069930069e-06, - "loss": 0.3501, - "step": 31590 - }, - { - "epoch": 27.38, - "learning_rate": 1.8262937062937064e-06, - "loss": 0.3475, - "step": 31600 - }, - { - "epoch": 27.39, - "learning_rate": 1.8255944055944054e-06, - "loss": 0.3852, - "step": 31610 - }, - { - "epoch": 27.4, - "learning_rate": 1.824895104895105e-06, - "loss": 0.3352, - "step": 31620 - }, - { - "epoch": 27.41, - "learning_rate": 1.824195804195804e-06, - "loss": 0.3391, - "step": 31630 - }, - { - "epoch": 27.42, - "learning_rate": 1.8234965034965035e-06, - "loss": 0.3885, - "step": 31640 - }, - { - "epoch": 27.43, - "learning_rate": 1.8227972027972028e-06, - "loss": 0.358, - "step": 31650 - }, - { - "epoch": 27.43, - "learning_rate": 1.8220979020979019e-06, - "loss": 0.3604, - "step": 31660 - }, - { - "epoch": 27.44, - "learning_rate": 1.8213986013986014e-06, - "loss": 0.3526, - "step": 31670 - }, - { - "epoch": 27.45, - "learning_rate": 1.8206993006993007e-06, - "loss": 0.3765, - "step": 31680 - }, - { - "epoch": 27.46, - "learning_rate": 1.82e-06, - "loss": 0.3577, - "step": 31690 - }, - { - "epoch": 27.47, - "learning_rate": 1.8193006993006992e-06, - "loss": 0.3842, - "step": 31700 - }, - { - "epoch": 27.48, - "learning_rate": 1.8186013986013985e-06, - "loss": 0.3789, - "step": 31710 - }, - { - "epoch": 27.49, - "learning_rate": 1.8179020979020978e-06, - "loss": 0.4499, - "step": 31720 - }, - { - "epoch": 27.5, - "learning_rate": 1.817202797202797e-06, - "loss": 0.3503, - "step": 31730 - }, - { - "epoch": 27.5, - "learning_rate": 1.8165034965034964e-06, - "loss": 0.3301, - "step": 31740 - }, - { - "epoch": 27.51, - "learning_rate": 1.8158041958041956e-06, - "loss": 0.3902, - "step": 31750 - }, - { - "epoch": 27.52, - "learning_rate": 1.8151048951048951e-06, - "loss": 0.423, - "step": 31760 - }, - { - "epoch": 27.53, - "learning_rate": 1.8144055944055942e-06, - "loss": 0.4111, - "step": 31770 - }, - { - "epoch": 27.54, - "learning_rate": 1.8137062937062937e-06, - "loss": 0.3757, - "step": 31780 - }, - { - "epoch": 27.55, - "learning_rate": 1.8130069930069928e-06, - "loss": 0.3748, - "step": 31790 - }, - { - "epoch": 27.56, - "learning_rate": 1.8123076923076923e-06, - "loss": 0.3695, - "step": 31800 - }, - { - "epoch": 27.56, - "learning_rate": 1.8116083916083916e-06, - "loss": 0.3734, - "step": 31810 - }, - { - "epoch": 27.57, - "learning_rate": 1.8109090909090906e-06, - "loss": 0.3587, - "step": 31820 - }, - { - "epoch": 27.58, - "learning_rate": 1.8102097902097901e-06, - "loss": 0.366, - "step": 31830 - }, - { - "epoch": 27.59, - "learning_rate": 1.8095104895104894e-06, - "loss": 0.3811, - "step": 31840 - }, - { - "epoch": 27.6, - "learning_rate": 1.8088111888111887e-06, - "loss": 0.3845, - "step": 31850 - }, - { - "epoch": 27.61, - "learning_rate": 1.808111888111888e-06, - "loss": 0.3945, - "step": 31860 - }, - { - "epoch": 27.62, - "learning_rate": 1.8074125874125875e-06, - "loss": 0.4014, - "step": 31870 - }, - { - "epoch": 27.63, - "learning_rate": 1.8067132867132866e-06, - "loss": 0.3829, - "step": 31880 - }, - { - "epoch": 27.63, - "learning_rate": 1.806013986013986e-06, - "loss": 0.4039, - "step": 31890 - }, - { - "epoch": 27.64, - "learning_rate": 1.8053146853146851e-06, - "loss": 0.4097, - "step": 31900 - }, - { - "epoch": 27.65, - "learning_rate": 1.8046153846153844e-06, - "loss": 0.3733, - "step": 31910 - }, - { - "epoch": 27.66, - "learning_rate": 1.803916083916084e-06, - "loss": 0.3835, - "step": 31920 - }, - { - "epoch": 27.67, - "learning_rate": 1.803216783216783e-06, - "loss": 0.3801, - "step": 31930 - }, - { - "epoch": 27.68, - "learning_rate": 1.8025174825174825e-06, - "loss": 0.3225, - "step": 31940 - }, - { - "epoch": 27.69, - "learning_rate": 1.8018181818181818e-06, - "loss": 0.4131, - "step": 31950 - }, - { - "epoch": 27.69, - "learning_rate": 1.801118881118881e-06, - "loss": 0.3939, - "step": 31960 - }, - { - "epoch": 27.7, - "learning_rate": 1.8004195804195803e-06, - "loss": 0.341, - "step": 31970 - }, - { - "epoch": 27.71, - "learning_rate": 1.7997202797202796e-06, - "loss": 0.3937, - "step": 31980 - }, - { - "epoch": 27.72, - "learning_rate": 1.799020979020979e-06, - "loss": 0.3684, - "step": 31990 - }, - { - "epoch": 27.73, - "learning_rate": 1.7983216783216782e-06, - "loss": 0.3699, - "step": 32000 - }, - { - "epoch": 27.74, - "learning_rate": 1.7976223776223775e-06, - "loss": 0.3764, - "step": 32010 - }, - { - "epoch": 27.75, - "learning_rate": 1.7969230769230768e-06, - "loss": 0.3609, - "step": 32020 - }, - { - "epoch": 27.76, - "learning_rate": 1.7962237762237763e-06, - "loss": 0.3248, - "step": 32030 - }, - { - "epoch": 27.76, - "learning_rate": 1.7955244755244753e-06, - "loss": 0.4042, - "step": 32040 - }, - { - "epoch": 27.77, - "learning_rate": 1.7948251748251748e-06, - "loss": 0.4085, - "step": 32050 - }, - { - "epoch": 27.78, - "learning_rate": 1.794125874125874e-06, - "loss": 0.4023, - "step": 32060 - }, - { - "epoch": 27.79, - "learning_rate": 1.7934265734265734e-06, - "loss": 0.317, - "step": 32070 - }, - { - "epoch": 27.8, - "learning_rate": 1.7927272727272727e-06, - "loss": 0.3857, - "step": 32080 - }, - { - "epoch": 27.81, - "learning_rate": 1.7920279720279718e-06, - "loss": 0.3571, - "step": 32090 - }, - { - "epoch": 27.82, - "learning_rate": 1.7913286713286713e-06, - "loss": 0.4025, - "step": 32100 - }, - { - "epoch": 27.82, - "learning_rate": 1.7906293706293706e-06, - "loss": 0.3897, - "step": 32110 - }, - { - "epoch": 27.83, - "learning_rate": 1.7899300699300698e-06, - "loss": 0.4233, - "step": 32120 - }, - { - "epoch": 27.84, - "learning_rate": 1.7892307692307691e-06, - "loss": 0.373, - "step": 32130 - }, - { - "epoch": 27.85, - "learning_rate": 1.7885314685314686e-06, - "loss": 0.3689, - "step": 32140 - }, - { - "epoch": 27.86, - "learning_rate": 1.7878321678321677e-06, - "loss": 0.3384, - "step": 32150 - }, - { - "epoch": 27.87, - "learning_rate": 1.7871328671328672e-06, - "loss": 0.393, - "step": 32160 - }, - { - "epoch": 27.88, - "learning_rate": 1.7864335664335663e-06, - "loss": 0.3157, - "step": 32170 - }, - { - "epoch": 27.89, - "learning_rate": 1.7857342657342655e-06, - "loss": 0.4032, - "step": 32180 - }, - { - "epoch": 27.89, - "learning_rate": 1.785034965034965e-06, - "loss": 0.3611, - "step": 32190 - }, - { - "epoch": 27.9, - "learning_rate": 1.7843356643356641e-06, - "loss": 0.3538, - "step": 32200 - }, - { - "epoch": 27.91, - "learning_rate": 1.7836363636363636e-06, - "loss": 0.3398, - "step": 32210 - }, - { - "epoch": 27.92, - "learning_rate": 1.782937062937063e-06, - "loss": 0.3714, - "step": 32220 - }, - { - "epoch": 27.93, - "learning_rate": 1.7822377622377622e-06, - "loss": 0.3936, - "step": 32230 - }, - { - "epoch": 27.94, - "learning_rate": 1.7815384615384615e-06, - "loss": 0.3473, - "step": 32240 - }, - { - "epoch": 27.95, - "learning_rate": 1.7808391608391608e-06, - "loss": 0.4004, - "step": 32250 - }, - { - "epoch": 27.95, - "learning_rate": 1.78013986013986e-06, - "loss": 0.3311, - "step": 32260 - }, - { - "epoch": 27.96, - "learning_rate": 1.7794405594405593e-06, - "loss": 0.3644, - "step": 32270 - }, - { - "epoch": 27.97, - "learning_rate": 1.7787412587412586e-06, - "loss": 0.3806, - "step": 32280 - }, - { - "epoch": 27.98, - "learning_rate": 1.778041958041958e-06, - "loss": 0.3713, - "step": 32290 - }, - { - "epoch": 27.99, - "learning_rate": 1.7773426573426574e-06, - "loss": 0.3826, - "step": 32300 - }, - { - "epoch": 28.0, - "learning_rate": 1.7766433566433565e-06, - "loss": 0.4084, - "step": 32310 - }, - { - "epoch": 28.0, - "eval_loss": 0.568722128868103, - "eval_runtime": 137.4904, - "eval_samples_per_second": 3.869, - "eval_steps_per_second": 1.935, - "eval_wer": 0.2521051616635598, - "step": 32312 - }, - { - "epoch": 28.01, - "learning_rate": 1.775944055944056e-06, - "loss": 0.4081, - "step": 32320 - }, - { - "epoch": 28.02, - "learning_rate": 1.775244755244755e-06, - "loss": 0.3512, - "step": 32330 - }, - { - "epoch": 28.02, - "learning_rate": 1.7745454545454545e-06, - "loss": 0.351, - "step": 32340 - }, - { - "epoch": 28.03, - "learning_rate": 1.7738461538461538e-06, - "loss": 0.3402, - "step": 32350 - }, - { - "epoch": 28.04, - "learning_rate": 1.7731468531468529e-06, - "loss": 0.3992, - "step": 32360 - }, - { - "epoch": 28.05, - "learning_rate": 1.7724475524475524e-06, - "loss": 0.4322, - "step": 32370 - }, - { - "epoch": 28.06, - "learning_rate": 1.7717482517482517e-06, - "loss": 0.3604, - "step": 32380 - }, - { - "epoch": 28.07, - "learning_rate": 1.771048951048951e-06, - "loss": 0.3135, - "step": 32390 - }, - { - "epoch": 28.08, - "learning_rate": 1.7703496503496502e-06, - "loss": 0.3935, - "step": 32400 - }, - { - "epoch": 28.08, - "learning_rate": 1.7696503496503497e-06, - "loss": 0.3196, - "step": 32410 - }, - { - "epoch": 28.09, - "learning_rate": 1.7689510489510488e-06, - "loss": 0.3479, - "step": 32420 - }, - { - "epoch": 28.1, - "learning_rate": 1.7682517482517483e-06, - "loss": 0.4076, - "step": 32430 - }, - { - "epoch": 28.11, - "learning_rate": 1.7675524475524474e-06, - "loss": 0.3654, - "step": 32440 - }, - { - "epoch": 28.12, - "learning_rate": 1.7668531468531467e-06, - "loss": 0.3773, - "step": 32450 - }, - { - "epoch": 28.13, - "learning_rate": 1.7661538461538462e-06, - "loss": 0.3836, - "step": 32460 - }, - { - "epoch": 28.14, - "learning_rate": 1.7654545454545452e-06, - "loss": 0.3514, - "step": 32470 - }, - { - "epoch": 28.15, - "learning_rate": 1.7647552447552447e-06, - "loss": 0.4039, - "step": 32480 - }, - { - "epoch": 28.15, - "learning_rate": 1.764055944055944e-06, - "loss": 0.3392, - "step": 32490 - }, - { - "epoch": 28.16, - "learning_rate": 1.7633566433566433e-06, - "loss": 0.359, - "step": 32500 - }, - { - "epoch": 28.17, - "learning_rate": 1.7626573426573426e-06, - "loss": 0.3671, - "step": 32510 - }, - { - "epoch": 28.18, - "learning_rate": 1.7619580419580419e-06, - "loss": 0.3782, - "step": 32520 - }, - { - "epoch": 28.19, - "learning_rate": 1.7612587412587412e-06, - "loss": 0.3816, - "step": 32530 - }, - { - "epoch": 28.2, - "learning_rate": 1.7605594405594404e-06, - "loss": 0.3251, - "step": 32540 - }, - { - "epoch": 28.21, - "learning_rate": 1.7598601398601397e-06, - "loss": 0.3907, - "step": 32550 - }, - { - "epoch": 28.21, - "learning_rate": 1.759160839160839e-06, - "loss": 0.4064, - "step": 32560 - }, - { - "epoch": 28.22, - "learning_rate": 1.7584615384615385e-06, - "loss": 0.3726, - "step": 32570 - }, - { - "epoch": 28.23, - "learning_rate": 1.7577622377622376e-06, - "loss": 0.3508, - "step": 32580 - }, - { - "epoch": 28.24, - "learning_rate": 1.757062937062937e-06, - "loss": 0.3468, - "step": 32590 - }, - { - "epoch": 28.25, - "learning_rate": 1.7563636363636364e-06, - "loss": 0.4059, - "step": 32600 - }, - { - "epoch": 28.26, - "learning_rate": 1.7556643356643357e-06, - "loss": 0.4445, - "step": 32610 - }, - { - "epoch": 28.27, - "learning_rate": 1.754965034965035e-06, - "loss": 0.4066, - "step": 32620 - }, - { - "epoch": 28.28, - "learning_rate": 1.754265734265734e-06, - "loss": 0.3494, - "step": 32630 - }, - { - "epoch": 28.28, - "learning_rate": 1.7535664335664335e-06, - "loss": 0.3554, - "step": 32640 - }, - { - "epoch": 28.29, - "learning_rate": 1.7528671328671328e-06, - "loss": 0.3856, - "step": 32650 - }, - { - "epoch": 28.3, - "learning_rate": 1.752167832167832e-06, - "loss": 0.3978, - "step": 32660 - }, - { - "epoch": 28.31, - "learning_rate": 1.7514685314685314e-06, - "loss": 0.3472, - "step": 32670 - }, - { - "epoch": 28.32, - "learning_rate": 1.7507692307692309e-06, - "loss": 0.3697, - "step": 32680 - }, - { - "epoch": 28.33, - "learning_rate": 1.75006993006993e-06, - "loss": 0.3225, - "step": 32690 - }, - { - "epoch": 28.34, - "learning_rate": 1.7493706293706292e-06, - "loss": 0.3769, - "step": 32700 - }, - { - "epoch": 28.34, - "learning_rate": 1.7486713286713285e-06, - "loss": 0.3747, - "step": 32710 - }, - { - "epoch": 28.35, - "learning_rate": 1.7479720279720278e-06, - "loss": 0.3268, - "step": 32720 - }, - { - "epoch": 28.36, - "learning_rate": 1.7472727272727273e-06, - "loss": 0.4022, - "step": 32730 - }, - { - "epoch": 28.37, - "learning_rate": 1.7465734265734264e-06, - "loss": 0.3495, - "step": 32740 - }, - { - "epoch": 28.38, - "learning_rate": 1.7458741258741259e-06, - "loss": 0.4143, - "step": 32750 - }, - { - "epoch": 28.39, - "learning_rate": 1.7451748251748251e-06, - "loss": 0.3261, - "step": 32760 - }, - { - "epoch": 28.4, - "learning_rate": 1.7444755244755244e-06, - "loss": 0.3724, - "step": 32770 - }, - { - "epoch": 28.41, - "learning_rate": 1.7437762237762237e-06, - "loss": 0.3713, - "step": 32780 - }, - { - "epoch": 28.41, - "learning_rate": 1.7430769230769228e-06, - "loss": 0.4072, - "step": 32790 - }, - { - "epoch": 28.42, - "learning_rate": 1.7423776223776223e-06, - "loss": 0.3862, - "step": 32800 - }, - { - "epoch": 28.43, - "learning_rate": 1.7416783216783216e-06, - "loss": 0.4113, - "step": 32810 - }, - { - "epoch": 28.44, - "learning_rate": 1.7409790209790209e-06, - "loss": 0.3918, - "step": 32820 - }, - { - "epoch": 28.45, - "learning_rate": 1.7403496503496501e-06, - "loss": 0.369, - "step": 32830 - }, - { - "epoch": 28.46, - "learning_rate": 1.7396503496503496e-06, - "loss": 0.3563, - "step": 32840 - }, - { - "epoch": 28.47, - "learning_rate": 1.7389510489510489e-06, - "loss": 0.3593, - "step": 32850 - }, - { - "epoch": 28.47, - "learning_rate": 1.7382517482517482e-06, - "loss": 0.3922, - "step": 32860 - }, - { - "epoch": 28.48, - "learning_rate": 1.7375524475524475e-06, - "loss": 0.4448, - "step": 32870 - }, - { - "epoch": 28.49, - "learning_rate": 1.736853146853147e-06, - "loss": 0.3888, - "step": 32880 - }, - { - "epoch": 28.5, - "learning_rate": 1.736153846153846e-06, - "loss": 0.3244, - "step": 32890 - }, - { - "epoch": 28.51, - "learning_rate": 1.7354545454545453e-06, - "loss": 0.3501, - "step": 32900 - }, - { - "epoch": 28.52, - "learning_rate": 1.7347552447552446e-06, - "loss": 0.4159, - "step": 32910 - }, - { - "epoch": 28.53, - "learning_rate": 1.7340559440559439e-06, - "loss": 0.3692, - "step": 32920 - }, - { - "epoch": 28.54, - "learning_rate": 1.7333566433566434e-06, - "loss": 0.3711, - "step": 32930 - }, - { - "epoch": 28.54, - "learning_rate": 1.7326573426573425e-06, - "loss": 0.3636, - "step": 32940 - }, - { - "epoch": 28.55, - "learning_rate": 1.731958041958042e-06, - "loss": 0.3652, - "step": 32950 - }, - { - "epoch": 28.56, - "learning_rate": 1.7312587412587412e-06, - "loss": 0.4086, - "step": 32960 - }, - { - "epoch": 28.57, - "learning_rate": 1.7305594405594405e-06, - "loss": 0.3202, - "step": 32970 - }, - { - "epoch": 28.58, - "learning_rate": 1.7298601398601398e-06, - "loss": 0.33, - "step": 32980 - }, - { - "epoch": 28.59, - "learning_rate": 1.729160839160839e-06, - "loss": 0.371, - "step": 32990 - }, - { - "epoch": 28.6, - "learning_rate": 1.7284615384615384e-06, - "loss": 0.384, - "step": 33000 - }, - { - "epoch": 28.6, - "learning_rate": 1.7277622377622377e-06, - "loss": 0.3612, - "step": 33010 - }, - { - "epoch": 28.61, - "learning_rate": 1.727062937062937e-06, - "loss": 0.385, - "step": 33020 - }, - { - "epoch": 28.62, - "learning_rate": 1.7263636363636362e-06, - "loss": 0.3638, - "step": 33030 - }, - { - "epoch": 28.63, - "learning_rate": 1.7256643356643357e-06, - "loss": 0.3553, - "step": 33040 - }, - { - "epoch": 28.64, - "learning_rate": 1.7249650349650348e-06, - "loss": 0.4293, - "step": 33050 - }, - { - "epoch": 28.65, - "learning_rate": 1.7242657342657343e-06, - "loss": 0.385, - "step": 33060 - }, - { - "epoch": 28.66, - "learning_rate": 1.7235664335664336e-06, - "loss": 0.3787, - "step": 33070 - }, - { - "epoch": 28.67, - "learning_rate": 1.7228671328671327e-06, - "loss": 0.373, - "step": 33080 - }, - { - "epoch": 28.67, - "learning_rate": 1.7221678321678322e-06, - "loss": 0.3868, - "step": 33090 - }, - { - "epoch": 28.68, - "learning_rate": 1.7214685314685312e-06, - "loss": 0.3748, - "step": 33100 - }, - { - "epoch": 28.69, - "learning_rate": 1.7207692307692307e-06, - "loss": 0.3846, - "step": 33110 - }, - { - "epoch": 28.7, - "learning_rate": 1.72006993006993e-06, - "loss": 0.3777, - "step": 33120 - }, - { - "epoch": 28.71, - "learning_rate": 1.7193706293706293e-06, - "loss": 0.369, - "step": 33130 - }, - { - "epoch": 28.72, - "learning_rate": 1.7186713286713286e-06, - "loss": 0.3733, - "step": 33140 - }, - { - "epoch": 28.73, - "learning_rate": 1.717972027972028e-06, - "loss": 0.3676, - "step": 33150 - }, - { - "epoch": 28.73, - "learning_rate": 1.7172727272727272e-06, - "loss": 0.4108, - "step": 33160 - }, - { - "epoch": 28.74, - "learning_rate": 1.7165734265734264e-06, - "loss": 0.3825, - "step": 33170 - }, - { - "epoch": 28.75, - "learning_rate": 1.715874125874126e-06, - "loss": 0.3638, - "step": 33180 - }, - { - "epoch": 28.76, - "learning_rate": 1.715174825174825e-06, - "loss": 0.3664, - "step": 33190 - }, - { - "epoch": 28.77, - "learning_rate": 1.7144755244755245e-06, - "loss": 0.3941, - "step": 33200 - }, - { - "epoch": 28.78, - "learning_rate": 1.7137762237762236e-06, - "loss": 0.3873, - "step": 33210 - }, - { - "epoch": 28.79, - "learning_rate": 1.713076923076923e-06, - "loss": 0.3623, - "step": 33220 - }, - { - "epoch": 28.8, - "learning_rate": 1.7123776223776224e-06, - "loss": 0.3523, - "step": 33230 - }, - { - "epoch": 28.8, - "learning_rate": 1.7116783216783214e-06, - "loss": 0.3801, - "step": 33240 - }, - { - "epoch": 28.81, - "learning_rate": 1.710979020979021e-06, - "loss": 0.3508, - "step": 33250 - }, - { - "epoch": 28.82, - "learning_rate": 1.7102797202797202e-06, - "loss": 0.3487, - "step": 33260 - }, - { - "epoch": 28.83, - "learning_rate": 1.7095804195804195e-06, - "loss": 0.3378, - "step": 33270 - }, - { - "epoch": 28.84, - "learning_rate": 1.7088811188811188e-06, - "loss": 0.4113, - "step": 33280 - }, - { - "epoch": 28.85, - "learning_rate": 1.708181818181818e-06, - "loss": 0.3687, - "step": 33290 - }, - { - "epoch": 28.86, - "learning_rate": 1.7074825174825174e-06, - "loss": 0.3522, - "step": 33300 - }, - { - "epoch": 28.86, - "learning_rate": 1.7067832167832169e-06, - "loss": 0.3869, - "step": 33310 - }, - { - "epoch": 28.87, - "learning_rate": 1.706083916083916e-06, - "loss": 0.3857, - "step": 33320 - }, - { - "epoch": 28.88, - "learning_rate": 1.7053846153846152e-06, - "loss": 0.3923, - "step": 33330 - }, - { - "epoch": 28.89, - "learning_rate": 1.7046853146853147e-06, - "loss": 0.3645, - "step": 33340 - }, - { - "epoch": 28.9, - "learning_rate": 1.7039860139860138e-06, - "loss": 0.3899, - "step": 33350 - }, - { - "epoch": 28.91, - "learning_rate": 1.7032867132867133e-06, - "loss": 0.3523, - "step": 33360 - }, - { - "epoch": 28.92, - "learning_rate": 1.7025874125874124e-06, - "loss": 0.3441, - "step": 33370 - }, - { - "epoch": 28.93, - "learning_rate": 1.7018881118881119e-06, - "loss": 0.4076, - "step": 33380 - }, - { - "epoch": 28.93, - "learning_rate": 1.7011888111888111e-06, - "loss": 0.3111, - "step": 33390 - }, - { - "epoch": 28.94, - "learning_rate": 1.7004895104895104e-06, - "loss": 0.353, - "step": 33400 - }, - { - "epoch": 28.95, - "learning_rate": 1.6997902097902097e-06, - "loss": 0.4195, - "step": 33410 - }, - { - "epoch": 28.96, - "learning_rate": 1.699090909090909e-06, - "loss": 0.2943, - "step": 33420 - }, - { - "epoch": 28.97, - "learning_rate": 1.6983916083916083e-06, - "loss": 0.3757, - "step": 33430 - }, - { - "epoch": 28.98, - "learning_rate": 1.6976923076923076e-06, - "loss": 0.3184, - "step": 33440 - }, - { - "epoch": 28.99, - "learning_rate": 1.696993006993007e-06, - "loss": 0.4107, - "step": 33450 - }, - { - "epoch": 28.99, - "learning_rate": 1.6962937062937061e-06, - "loss": 0.3916, - "step": 33460 - }, - { - "epoch": 29.0, - "eval_loss": 0.5656043887138367, - "eval_runtime": 135.8464, - "eval_samples_per_second": 3.916, - "eval_steps_per_second": 1.958, - "eval_wer": 0.2494696921000193, - "step": 33466 - }, - { - "epoch": 29.0, - "learning_rate": 1.6955944055944056e-06, - "loss": 0.4027, - "step": 33470 - }, - { - "epoch": 29.01, - "learning_rate": 1.6948951048951047e-06, - "loss": 0.3603, - "step": 33480 - }, - { - "epoch": 29.02, - "learning_rate": 1.6941958041958042e-06, - "loss": 0.364, - "step": 33490 - }, - { - "epoch": 29.03, - "learning_rate": 1.6934965034965035e-06, - "loss": 0.3812, - "step": 33500 - }, - { - "epoch": 29.04, - "learning_rate": 1.6927972027972026e-06, - "loss": 0.3828, - "step": 33510 - }, - { - "epoch": 29.05, - "learning_rate": 1.692097902097902e-06, - "loss": 0.3753, - "step": 33520 - }, - { - "epoch": 29.06, - "learning_rate": 1.6913986013986013e-06, - "loss": 0.3995, - "step": 33530 - }, - { - "epoch": 29.06, - "learning_rate": 1.6906993006993006e-06, - "loss": 0.3793, - "step": 33540 - }, - { - "epoch": 29.07, - "learning_rate": 1.69e-06, - "loss": 0.4096, - "step": 33550 - }, - { - "epoch": 29.08, - "learning_rate": 1.6893006993006992e-06, - "loss": 0.3429, - "step": 33560 - }, - { - "epoch": 29.09, - "learning_rate": 1.6886013986013985e-06, - "loss": 0.3749, - "step": 33570 - }, - { - "epoch": 29.1, - "learning_rate": 1.687902097902098e-06, - "loss": 0.353, - "step": 33580 - }, - { - "epoch": 29.11, - "learning_rate": 1.687202797202797e-06, - "loss": 0.4113, - "step": 33590 - }, - { - "epoch": 29.12, - "learning_rate": 1.6865034965034963e-06, - "loss": 0.3883, - "step": 33600 - }, - { - "epoch": 29.12, - "learning_rate": 1.6858041958041958e-06, - "loss": 0.3624, - "step": 33610 - }, - { - "epoch": 29.13, - "learning_rate": 1.685104895104895e-06, - "loss": 0.3857, - "step": 33620 - }, - { - "epoch": 29.14, - "learning_rate": 1.6844055944055944e-06, - "loss": 0.3628, - "step": 33630 - }, - { - "epoch": 29.15, - "learning_rate": 1.6837062937062935e-06, - "loss": 0.3251, - "step": 33640 - }, - { - "epoch": 29.16, - "learning_rate": 1.683006993006993e-06, - "loss": 0.3287, - "step": 33650 - }, - { - "epoch": 29.17, - "learning_rate": 1.6823076923076923e-06, - "loss": 0.4003, - "step": 33660 - }, - { - "epoch": 29.18, - "learning_rate": 1.6816083916083915e-06, - "loss": 0.3441, - "step": 33670 - }, - { - "epoch": 29.19, - "learning_rate": 1.6809090909090908e-06, - "loss": 0.3336, - "step": 33680 - }, - { - "epoch": 29.19, - "learning_rate": 1.6802097902097901e-06, - "loss": 0.3581, - "step": 33690 - }, - { - "epoch": 29.2, - "learning_rate": 1.6795104895104894e-06, - "loss": 0.3547, - "step": 33700 - }, - { - "epoch": 29.21, - "learning_rate": 1.6788111888111887e-06, - "loss": 0.3512, - "step": 33710 - }, - { - "epoch": 29.22, - "learning_rate": 1.6781118881118882e-06, - "loss": 0.3349, - "step": 33720 - }, - { - "epoch": 29.23, - "learning_rate": 1.6774125874125873e-06, - "loss": 0.335, - "step": 33730 - }, - { - "epoch": 29.24, - "learning_rate": 1.6767132867132868e-06, - "loss": 0.3946, - "step": 33740 - }, - { - "epoch": 29.25, - "learning_rate": 1.6760139860139858e-06, - "loss": 0.3519, - "step": 33750 - }, - { - "epoch": 29.25, - "learning_rate": 1.6753146853146853e-06, - "loss": 0.3994, - "step": 33760 - }, - { - "epoch": 29.26, - "learning_rate": 1.6746153846153846e-06, - "loss": 0.4, - "step": 33770 - }, - { - "epoch": 29.27, - "learning_rate": 1.6739160839160837e-06, - "loss": 0.3892, - "step": 33780 - }, - { - "epoch": 29.28, - "learning_rate": 1.6732167832167832e-06, - "loss": 0.3496, - "step": 33790 - }, - { - "epoch": 29.29, - "learning_rate": 1.6725174825174825e-06, - "loss": 0.3959, - "step": 33800 - }, - { - "epoch": 29.3, - "learning_rate": 1.6718181818181818e-06, - "loss": 0.3793, - "step": 33810 - }, - { - "epoch": 29.31, - "learning_rate": 1.671118881118881e-06, - "loss": 0.3249, - "step": 33820 - }, - { - "epoch": 29.32, - "learning_rate": 1.6704195804195803e-06, - "loss": 0.3672, - "step": 33830 - }, - { - "epoch": 29.32, - "learning_rate": 1.6697202797202796e-06, - "loss": 0.4126, - "step": 33840 - }, - { - "epoch": 29.33, - "learning_rate": 1.669020979020979e-06, - "loss": 0.3912, - "step": 33850 - }, - { - "epoch": 29.34, - "learning_rate": 1.6683216783216782e-06, - "loss": 0.355, - "step": 33860 - }, - { - "epoch": 29.35, - "learning_rate": 1.6676223776223775e-06, - "loss": 0.3485, - "step": 33870 - }, - { - "epoch": 29.36, - "learning_rate": 1.666923076923077e-06, - "loss": 0.3303, - "step": 33880 - }, - { - "epoch": 29.37, - "learning_rate": 1.666223776223776e-06, - "loss": 0.3702, - "step": 33890 - }, - { - "epoch": 29.38, - "learning_rate": 1.6655244755244755e-06, - "loss": 0.3903, - "step": 33900 - }, - { - "epoch": 29.38, - "learning_rate": 1.6648251748251746e-06, - "loss": 0.3441, - "step": 33910 - }, - { - "epoch": 29.39, - "learning_rate": 1.664125874125874e-06, - "loss": 0.4614, - "step": 33920 - }, - { - "epoch": 29.4, - "learning_rate": 1.6634265734265734e-06, - "loss": 0.4162, - "step": 33930 - }, - { - "epoch": 29.41, - "learning_rate": 1.6627272727272727e-06, - "loss": 0.339, - "step": 33940 - }, - { - "epoch": 29.42, - "learning_rate": 1.662027972027972e-06, - "loss": 0.3922, - "step": 33950 - }, - { - "epoch": 29.43, - "learning_rate": 1.6613286713286712e-06, - "loss": 0.403, - "step": 33960 - }, - { - "epoch": 29.44, - "learning_rate": 1.6606293706293705e-06, - "loss": 0.4064, - "step": 33970 - }, - { - "epoch": 29.45, - "learning_rate": 1.6599300699300698e-06, - "loss": 0.3831, - "step": 33980 - }, - { - "epoch": 29.45, - "learning_rate": 1.6592307692307693e-06, - "loss": 0.4108, - "step": 33990 - }, - { - "epoch": 29.46, - "learning_rate": 1.6585314685314684e-06, - "loss": 0.3298, - "step": 34000 - }, - { - "epoch": 29.47, - "learning_rate": 1.6578321678321679e-06, - "loss": 0.3735, - "step": 34010 - }, - { - "epoch": 29.48, - "learning_rate": 1.657132867132867e-06, - "loss": 0.3878, - "step": 34020 - }, - { - "epoch": 29.49, - "learning_rate": 1.6564335664335664e-06, - "loss": 0.398, - "step": 34030 - }, - { - "epoch": 29.5, - "learning_rate": 1.6557342657342657e-06, - "loss": 0.362, - "step": 34040 - }, - { - "epoch": 29.51, - "learning_rate": 1.6550349650349648e-06, - "loss": 0.4029, - "step": 34050 - }, - { - "epoch": 29.51, - "learning_rate": 1.6543356643356643e-06, - "loss": 0.3755, - "step": 34060 - }, - { - "epoch": 29.52, - "learning_rate": 1.6536363636363636e-06, - "loss": 0.3183, - "step": 34070 - }, - { - "epoch": 29.53, - "learning_rate": 1.6529370629370629e-06, - "loss": 0.3432, - "step": 34080 - }, - { - "epoch": 29.54, - "learning_rate": 1.6522377622377622e-06, - "loss": 0.3807, - "step": 34090 - }, - { - "epoch": 29.55, - "learning_rate": 1.6515384615384614e-06, - "loss": 0.3386, - "step": 34100 - }, - { - "epoch": 29.56, - "learning_rate": 1.6508391608391607e-06, - "loss": 0.3606, - "step": 34110 - }, - { - "epoch": 29.57, - "learning_rate": 1.6501398601398602e-06, - "loss": 0.4485, - "step": 34120 - }, - { - "epoch": 29.58, - "learning_rate": 1.6494405594405593e-06, - "loss": 0.3701, - "step": 34130 - }, - { - "epoch": 29.58, - "learning_rate": 1.6487412587412586e-06, - "loss": 0.3498, - "step": 34140 - }, - { - "epoch": 29.59, - "learning_rate": 1.648041958041958e-06, - "loss": 0.3324, - "step": 34150 - }, - { - "epoch": 29.6, - "learning_rate": 1.6473426573426572e-06, - "loss": 0.3444, - "step": 34160 - }, - { - "epoch": 29.61, - "learning_rate": 1.6466433566433567e-06, - "loss": 0.3844, - "step": 34170 - }, - { - "epoch": 29.62, - "learning_rate": 1.6459440559440557e-06, - "loss": 0.3856, - "step": 34180 - }, - { - "epoch": 29.63, - "learning_rate": 1.6452447552447552e-06, - "loss": 0.3968, - "step": 34190 - }, - { - "epoch": 29.64, - "learning_rate": 1.6445454545454545e-06, - "loss": 0.3755, - "step": 34200 - }, - { - "epoch": 29.64, - "learning_rate": 1.6438461538461538e-06, - "loss": 0.4211, - "step": 34210 - }, - { - "epoch": 29.65, - "learning_rate": 1.643146853146853e-06, - "loss": 0.3817, - "step": 34220 - }, - { - "epoch": 29.66, - "learning_rate": 1.6424475524475524e-06, - "loss": 0.3811, - "step": 34230 - }, - { - "epoch": 29.67, - "learning_rate": 1.6417482517482516e-06, - "loss": 0.3229, - "step": 34240 - }, - { - "epoch": 29.68, - "learning_rate": 1.641048951048951e-06, - "loss": 0.421, - "step": 34250 - }, - { - "epoch": 29.69, - "learning_rate": 1.6403496503496504e-06, - "loss": 0.3709, - "step": 34260 - }, - { - "epoch": 29.7, - "learning_rate": 1.6396503496503495e-06, - "loss": 0.4524, - "step": 34270 - }, - { - "epoch": 29.71, - "learning_rate": 1.638951048951049e-06, - "loss": 0.3726, - "step": 34280 - }, - { - "epoch": 29.71, - "learning_rate": 1.638251748251748e-06, - "loss": 0.3111, - "step": 34290 - }, - { - "epoch": 29.72, - "learning_rate": 1.6375524475524474e-06, - "loss": 0.3639, - "step": 34300 - }, - { - "epoch": 29.73, - "learning_rate": 1.6368531468531469e-06, - "loss": 0.4219, - "step": 34310 - }, - { - "epoch": 29.74, - "learning_rate": 1.636153846153846e-06, - "loss": 0.3993, - "step": 34320 - }, - { - "epoch": 29.75, - "learning_rate": 1.6354545454545454e-06, - "loss": 0.3243, - "step": 34330 - }, - { - "epoch": 29.76, - "learning_rate": 1.6347552447552447e-06, - "loss": 0.4005, - "step": 34340 - }, - { - "epoch": 29.77, - "learning_rate": 1.634055944055944e-06, - "loss": 0.4288, - "step": 34350 - }, - { - "epoch": 29.77, - "learning_rate": 1.6333566433566433e-06, - "loss": 0.491, - "step": 34360 - }, - { - "epoch": 29.78, - "learning_rate": 1.6326573426573426e-06, - "loss": 0.4482, - "step": 34370 - }, - { - "epoch": 29.79, - "learning_rate": 1.6319580419580419e-06, - "loss": 0.4113, - "step": 34380 - }, - { - "epoch": 29.8, - "learning_rate": 1.6312587412587411e-06, - "loss": 0.35, - "step": 34390 - }, - { - "epoch": 29.81, - "learning_rate": 1.6305594405594404e-06, - "loss": 0.373, - "step": 34400 - }, - { - "epoch": 29.82, - "learning_rate": 1.6298601398601397e-06, - "loss": 0.3738, - "step": 34410 - }, - { - "epoch": 29.83, - "learning_rate": 1.6291608391608392e-06, - "loss": 0.3479, - "step": 34420 - }, - { - "epoch": 29.83, - "learning_rate": 1.6284615384615383e-06, - "loss": 0.3902, - "step": 34430 - }, - { - "epoch": 29.84, - "learning_rate": 1.6277622377622378e-06, - "loss": 0.377, - "step": 34440 - }, - { - "epoch": 29.85, - "learning_rate": 1.627062937062937e-06, - "loss": 0.3926, - "step": 34450 - }, - { - "epoch": 29.86, - "learning_rate": 1.6263636363636363e-06, - "loss": 0.3604, - "step": 34460 - }, - { - "epoch": 29.87, - "learning_rate": 1.6256643356643356e-06, - "loss": 0.367, - "step": 34470 - }, - { - "epoch": 29.88, - "learning_rate": 1.6249650349650347e-06, - "loss": 0.439, - "step": 34480 - }, - { - "epoch": 29.89, - "learning_rate": 1.6242657342657342e-06, - "loss": 0.4341, - "step": 34490 - }, - { - "epoch": 29.9, - "learning_rate": 1.6235664335664335e-06, - "loss": 0.3464, - "step": 34500 - }, - { - "epoch": 29.9, - "learning_rate": 1.6228671328671328e-06, - "loss": 0.3569, - "step": 34510 - }, - { - "epoch": 29.91, - "learning_rate": 1.622167832167832e-06, - "loss": 0.3835, - "step": 34520 - }, - { - "epoch": 29.92, - "learning_rate": 1.6215384615384615e-06, - "loss": 0.3977, - "step": 34530 - }, - { - "epoch": 29.93, - "learning_rate": 1.6208391608391608e-06, - "loss": 0.3297, - "step": 34540 - }, - { - "epoch": 29.94, - "learning_rate": 1.62013986013986e-06, - "loss": 0.3743, - "step": 34550 - }, - { - "epoch": 29.95, - "learning_rate": 1.6194405594405594e-06, - "loss": 0.4124, - "step": 34560 - }, - { - "epoch": 29.96, - "learning_rate": 1.6187412587412589e-06, - "loss": 0.3618, - "step": 34570 - }, - { - "epoch": 29.96, - "learning_rate": 1.618041958041958e-06, - "loss": 0.3684, - "step": 34580 - }, - { - "epoch": 29.97, - "learning_rate": 1.6173426573426572e-06, - "loss": 0.362, - "step": 34590 - }, - { - "epoch": 29.98, - "learning_rate": 1.6166433566433565e-06, - "loss": 0.3643, - "step": 34600 - }, - { - "epoch": 29.99, - "learning_rate": 1.6159440559440558e-06, - "loss": 0.351, - "step": 34610 - }, - { - "epoch": 30.0, - "learning_rate": 1.6152447552447553e-06, - "loss": 0.4298, - "step": 34620 - }, - { - "epoch": 30.0, - "eval_loss": 0.5718466639518738, - "eval_runtime": 137.3598, - "eval_samples_per_second": 3.873, - "eval_steps_per_second": 1.937, - "eval_wer": 0.24985537057273252, - "step": 34620 - }, - { - "epoch": 30.01, - "learning_rate": 1.6145454545454544e-06, - "loss": 0.4091, - "step": 34630 - }, - { - "epoch": 30.02, - "learning_rate": 1.6138461538461539e-06, - "loss": 0.3421, - "step": 34640 - }, - { - "epoch": 30.03, - "learning_rate": 1.6131468531468532e-06, - "loss": 0.3637, - "step": 34650 - }, - { - "epoch": 30.03, - "learning_rate": 1.6124475524475524e-06, - "loss": 0.3804, - "step": 34660 - }, - { - "epoch": 30.04, - "learning_rate": 1.6117482517482517e-06, - "loss": 0.3391, - "step": 34670 - }, - { - "epoch": 30.05, - "learning_rate": 1.6110489510489508e-06, - "loss": 0.3682, - "step": 34680 - }, - { - "epoch": 30.06, - "learning_rate": 1.6103496503496503e-06, - "loss": 0.4202, - "step": 34690 - }, - { - "epoch": 30.07, - "learning_rate": 1.6096503496503496e-06, - "loss": 0.3785, - "step": 34700 - }, - { - "epoch": 30.08, - "learning_rate": 1.6089510489510489e-06, - "loss": 0.424, - "step": 34710 - }, - { - "epoch": 30.09, - "learning_rate": 1.6082517482517482e-06, - "loss": 0.3877, - "step": 34720 - }, - { - "epoch": 30.1, - "learning_rate": 1.6075524475524476e-06, - "loss": 0.3444, - "step": 34730 - }, - { - "epoch": 30.1, - "learning_rate": 1.6068531468531467e-06, - "loss": 0.3997, - "step": 34740 - }, - { - "epoch": 30.11, - "learning_rate": 1.606153846153846e-06, - "loss": 0.3541, - "step": 34750 - }, - { - "epoch": 30.12, - "learning_rate": 1.6054545454545453e-06, - "loss": 0.3894, - "step": 34760 - }, - { - "epoch": 30.13, - "learning_rate": 1.6047552447552446e-06, - "loss": 0.3606, - "step": 34770 - }, - { - "epoch": 30.14, - "learning_rate": 1.604055944055944e-06, - "loss": 0.3636, - "step": 34780 - }, - { - "epoch": 30.15, - "learning_rate": 1.6033566433566431e-06, - "loss": 0.3572, - "step": 34790 - }, - { - "epoch": 30.16, - "learning_rate": 1.6026573426573426e-06, - "loss": 0.3856, - "step": 34800 - }, - { - "epoch": 30.16, - "learning_rate": 1.601958041958042e-06, - "loss": 0.3364, - "step": 34810 - }, - { - "epoch": 30.17, - "learning_rate": 1.6012587412587412e-06, - "loss": 0.3653, - "step": 34820 - }, - { - "epoch": 30.18, - "learning_rate": 1.6005594405594405e-06, - "loss": 0.3721, - "step": 34830 - }, - { - "epoch": 30.19, - "learning_rate": 1.5998601398601398e-06, - "loss": 0.3632, - "step": 34840 - }, - { - "epoch": 30.2, - "learning_rate": 1.599160839160839e-06, - "loss": 0.3592, - "step": 34850 - }, - { - "epoch": 30.21, - "learning_rate": 1.5984615384615384e-06, - "loss": 0.3721, - "step": 34860 - }, - { - "epoch": 30.22, - "learning_rate": 1.5977622377622376e-06, - "loss": 0.4172, - "step": 34870 - }, - { - "epoch": 30.23, - "learning_rate": 1.597062937062937e-06, - "loss": 0.3367, - "step": 34880 - }, - { - "epoch": 30.23, - "learning_rate": 1.5963636363636364e-06, - "loss": 0.3765, - "step": 34890 - }, - { - "epoch": 30.24, - "learning_rate": 1.5956643356643355e-06, - "loss": 0.3662, - "step": 34900 - }, - { - "epoch": 30.25, - "learning_rate": 1.594965034965035e-06, - "loss": 0.3884, - "step": 34910 - }, - { - "epoch": 30.26, - "learning_rate": 1.5942657342657343e-06, - "loss": 0.3728, - "step": 34920 - }, - { - "epoch": 30.27, - "learning_rate": 1.5935664335664334e-06, - "loss": 0.3489, - "step": 34930 - }, - { - "epoch": 30.28, - "learning_rate": 1.5928671328671328e-06, - "loss": 0.3379, - "step": 34940 - }, - { - "epoch": 30.29, - "learning_rate": 1.592167832167832e-06, - "loss": 0.3322, - "step": 34950 - }, - { - "epoch": 30.29, - "learning_rate": 1.5914685314685314e-06, - "loss": 0.3663, - "step": 34960 - }, - { - "epoch": 30.3, - "learning_rate": 1.5907692307692307e-06, - "loss": 0.4156, - "step": 34970 - }, - { - "epoch": 30.31, - "learning_rate": 1.59006993006993e-06, - "loss": 0.3471, - "step": 34980 - }, - { - "epoch": 30.32, - "learning_rate": 1.5893706293706293e-06, - "loss": 0.369, - "step": 34990 - }, - { - "epoch": 30.33, - "learning_rate": 1.5886713286713288e-06, - "loss": 0.3399, - "step": 35000 - }, - { - "epoch": 30.34, - "learning_rate": 1.5879720279720278e-06, - "loss": 0.3496, - "step": 35010 - }, - { - "epoch": 30.35, - "learning_rate": 1.5872727272727271e-06, - "loss": 0.3927, - "step": 35020 - }, - { - "epoch": 30.36, - "learning_rate": 1.5865734265734266e-06, - "loss": 0.3727, - "step": 35030 - }, - { - "epoch": 30.36, - "learning_rate": 1.5858741258741257e-06, - "loss": 0.358, - "step": 35040 - }, - { - "epoch": 30.37, - "learning_rate": 1.5851748251748252e-06, - "loss": 0.3672, - "step": 35050 - }, - { - "epoch": 30.38, - "learning_rate": 1.5844755244755243e-06, - "loss": 0.3451, - "step": 35060 - }, - { - "epoch": 30.39, - "learning_rate": 1.5837762237762238e-06, - "loss": 0.3325, - "step": 35070 - }, - { - "epoch": 30.4, - "learning_rate": 1.583076923076923e-06, - "loss": 0.3569, - "step": 35080 - }, - { - "epoch": 30.41, - "learning_rate": 1.5823776223776223e-06, - "loss": 0.371, - "step": 35090 - }, - { - "epoch": 30.42, - "learning_rate": 1.5816783216783216e-06, - "loss": 0.3603, - "step": 35100 - }, - { - "epoch": 30.42, - "learning_rate": 1.580979020979021e-06, - "loss": 0.3758, - "step": 35110 - }, - { - "epoch": 30.43, - "learning_rate": 1.5802797202797202e-06, - "loss": 0.3824, - "step": 35120 - }, - { - "epoch": 30.44, - "learning_rate": 1.5795804195804195e-06, - "loss": 0.3723, - "step": 35130 - }, - { - "epoch": 30.45, - "learning_rate": 1.5788811188811188e-06, - "loss": 0.4211, - "step": 35140 - }, - { - "epoch": 30.46, - "learning_rate": 1.578181818181818e-06, - "loss": 0.3785, - "step": 35150 - }, - { - "epoch": 30.47, - "learning_rate": 1.5774825174825175e-06, - "loss": 0.409, - "step": 35160 - }, - { - "epoch": 30.48, - "learning_rate": 1.5767832167832166e-06, - "loss": 0.4054, - "step": 35170 - }, - { - "epoch": 30.49, - "learning_rate": 1.5760839160839161e-06, - "loss": 0.3717, - "step": 35180 - }, - { - "epoch": 30.49, - "learning_rate": 1.5753846153846154e-06, - "loss": 0.4008, - "step": 35190 - }, - { - "epoch": 30.5, - "learning_rate": 1.5746853146853145e-06, - "loss": 0.3472, - "step": 35200 - }, - { - "epoch": 30.51, - "learning_rate": 1.573986013986014e-06, - "loss": 0.4362, - "step": 35210 - }, - { - "epoch": 30.52, - "learning_rate": 1.573286713286713e-06, - "loss": 0.4502, - "step": 35220 - }, - { - "epoch": 30.53, - "learning_rate": 1.5725874125874125e-06, - "loss": 0.3301, - "step": 35230 - }, - { - "epoch": 30.54, - "learning_rate": 1.5718881118881118e-06, - "loss": 0.3875, - "step": 35240 - }, - { - "epoch": 30.55, - "learning_rate": 1.5711888111888111e-06, - "loss": 0.352, - "step": 35250 - }, - { - "epoch": 30.55, - "learning_rate": 1.5704895104895104e-06, - "loss": 0.3891, - "step": 35260 - }, - { - "epoch": 30.56, - "learning_rate": 1.56979020979021e-06, - "loss": 0.4293, - "step": 35270 - }, - { - "epoch": 30.57, - "learning_rate": 1.569090909090909e-06, - "loss": 0.3905, - "step": 35280 - }, - { - "epoch": 30.58, - "learning_rate": 1.5683916083916083e-06, - "loss": 0.3849, - "step": 35290 - }, - { - "epoch": 30.59, - "learning_rate": 1.5676923076923078e-06, - "loss": 0.39, - "step": 35300 - }, - { - "epoch": 30.6, - "learning_rate": 1.5669930069930068e-06, - "loss": 0.396, - "step": 35310 - }, - { - "epoch": 30.61, - "learning_rate": 1.5662937062937063e-06, - "loss": 0.3906, - "step": 35320 - }, - { - "epoch": 30.61, - "learning_rate": 1.5655944055944054e-06, - "loss": 0.3884, - "step": 35330 - }, - { - "epoch": 30.62, - "learning_rate": 1.5648951048951049e-06, - "loss": 0.3665, - "step": 35340 - }, - { - "epoch": 30.63, - "learning_rate": 1.5641958041958042e-06, - "loss": 0.3593, - "step": 35350 - }, - { - "epoch": 30.64, - "learning_rate": 1.5634965034965035e-06, - "loss": 0.3586, - "step": 35360 - }, - { - "epoch": 30.65, - "learning_rate": 1.5627972027972027e-06, - "loss": 0.3464, - "step": 35370 - }, - { - "epoch": 30.66, - "learning_rate": 1.562097902097902e-06, - "loss": 0.3643, - "step": 35380 - }, - { - "epoch": 30.67, - "learning_rate": 1.5613986013986013e-06, - "loss": 0.3734, - "step": 35390 - }, - { - "epoch": 30.68, - "learning_rate": 1.5606993006993006e-06, - "loss": 0.3686, - "step": 35400 - }, - { - "epoch": 30.68, - "learning_rate": 1.5599999999999999e-06, - "loss": 0.3713, - "step": 35410 - }, - { - "epoch": 30.69, - "learning_rate": 1.5593006993006992e-06, - "loss": 0.3656, - "step": 35420 - }, - { - "epoch": 30.7, - "learning_rate": 1.5586013986013987e-06, - "loss": 0.3911, - "step": 35430 - }, - { - "epoch": 30.71, - "learning_rate": 1.5579020979020977e-06, - "loss": 0.3081, - "step": 35440 - }, - { - "epoch": 30.72, - "learning_rate": 1.5572027972027972e-06, - "loss": 0.3021, - "step": 35450 - }, - { - "epoch": 30.73, - "learning_rate": 1.5565034965034965e-06, - "loss": 0.4553, - "step": 35460 - }, - { - "epoch": 30.74, - "learning_rate": 1.5558041958041956e-06, - "loss": 0.3951, - "step": 35470 - }, - { - "epoch": 30.74, - "learning_rate": 1.555104895104895e-06, - "loss": 0.372, - "step": 35480 - }, - { - "epoch": 30.75, - "learning_rate": 1.5544055944055942e-06, - "loss": 0.37, - "step": 35490 - }, - { - "epoch": 30.76, - "learning_rate": 1.5537062937062937e-06, - "loss": 0.3266, - "step": 35500 - }, - { - "epoch": 30.77, - "learning_rate": 1.553006993006993e-06, - "loss": 0.3462, - "step": 35510 - }, - { - "epoch": 30.78, - "learning_rate": 1.5523076923076922e-06, - "loss": 0.3416, - "step": 35520 - }, - { - "epoch": 30.79, - "learning_rate": 1.5516083916083915e-06, - "loss": 0.355, - "step": 35530 - }, - { - "epoch": 30.8, - "learning_rate": 1.550909090909091e-06, - "loss": 0.3883, - "step": 35540 - }, - { - "epoch": 30.81, - "learning_rate": 1.55020979020979e-06, - "loss": 0.3916, - "step": 35550 - }, - { - "epoch": 30.81, - "learning_rate": 1.5495104895104894e-06, - "loss": 0.407, - "step": 35560 - }, - { - "epoch": 30.82, - "learning_rate": 1.5488111888111889e-06, - "loss": 0.3629, - "step": 35570 - }, - { - "epoch": 30.83, - "learning_rate": 1.548111888111888e-06, - "loss": 0.3844, - "step": 35580 - }, - { - "epoch": 30.84, - "learning_rate": 1.5474125874125874e-06, - "loss": 0.3713, - "step": 35590 - }, - { - "epoch": 30.85, - "learning_rate": 1.5467132867132865e-06, - "loss": 0.3512, - "step": 35600 - }, - { - "epoch": 30.86, - "learning_rate": 1.546013986013986e-06, - "loss": 0.3197, - "step": 35610 - }, - { - "epoch": 30.87, - "learning_rate": 1.5453146853146853e-06, - "loss": 0.3575, - "step": 35620 - }, - { - "epoch": 30.87, - "learning_rate": 1.5446153846153846e-06, - "loss": 0.3383, - "step": 35630 - }, - { - "epoch": 30.88, - "learning_rate": 1.5439160839160839e-06, - "loss": 0.3747, - "step": 35640 - }, - { - "epoch": 30.89, - "learning_rate": 1.5432167832167832e-06, - "loss": 0.3644, - "step": 35650 - }, - { - "epoch": 30.9, - "learning_rate": 1.5425174825174824e-06, - "loss": 0.3445, - "step": 35660 - }, - { - "epoch": 30.91, - "learning_rate": 1.5418181818181817e-06, - "loss": 0.3674, - "step": 35670 - }, - { - "epoch": 30.92, - "learning_rate": 1.541118881118881e-06, - "loss": 0.404, - "step": 35680 - }, - { - "epoch": 30.93, - "learning_rate": 1.5404195804195803e-06, - "loss": 0.3292, - "step": 35690 - }, - { - "epoch": 30.94, - "learning_rate": 1.5397202797202798e-06, - "loss": 0.3722, - "step": 35700 - }, - { - "epoch": 30.94, - "learning_rate": 1.5390209790209789e-06, - "loss": 0.3704, - "step": 35710 - }, - { - "epoch": 30.95, - "learning_rate": 1.5383216783216784e-06, - "loss": 0.4484, - "step": 35720 - }, - { - "epoch": 30.96, - "learning_rate": 1.5376223776223776e-06, - "loss": 0.3342, - "step": 35730 - }, - { - "epoch": 30.97, - "learning_rate": 1.5369230769230767e-06, - "loss": 0.3784, - "step": 35740 - }, - { - "epoch": 30.98, - "learning_rate": 1.5362237762237762e-06, - "loss": 0.3727, - "step": 35750 - }, - { - "epoch": 30.99, - "learning_rate": 1.5355244755244753e-06, - "loss": 0.3832, - "step": 35760 - }, - { - "epoch": 31.0, - "learning_rate": 1.5348251748251748e-06, - "loss": 0.3544, - "step": 35770 - }, - { - "epoch": 31.0, - "eval_loss": 0.5595405697822571, - "eval_runtime": 134.7991, - "eval_samples_per_second": 3.947, - "eval_steps_per_second": 1.973, - "eval_wer": 0.24445587195474705, - "step": 35774 - }, - { - "epoch": 31.01, - "learning_rate": 1.534125874125874e-06, - "loss": 0.3527, - "step": 35780 - }, - { - "epoch": 31.01, - "learning_rate": 1.5334265734265734e-06, - "loss": 0.3921, - "step": 35790 - }, - { - "epoch": 31.02, - "learning_rate": 1.5327272727272726e-06, - "loss": 0.354, - "step": 35800 - }, - { - "epoch": 31.03, - "learning_rate": 1.532027972027972e-06, - "loss": 0.3689, - "step": 35810 - }, - { - "epoch": 31.04, - "learning_rate": 1.5313286713286712e-06, - "loss": 0.3668, - "step": 35820 - }, - { - "epoch": 31.05, - "learning_rate": 1.5306293706293705e-06, - "loss": 0.3723, - "step": 35830 - }, - { - "epoch": 31.06, - "learning_rate": 1.52993006993007e-06, - "loss": 0.3158, - "step": 35840 - }, - { - "epoch": 31.07, - "learning_rate": 1.529230769230769e-06, - "loss": 0.3894, - "step": 35850 - }, - { - "epoch": 31.07, - "learning_rate": 1.5285314685314686e-06, - "loss": 0.3496, - "step": 35860 - }, - { - "epoch": 31.08, - "learning_rate": 1.5278321678321676e-06, - "loss": 0.3798, - "step": 35870 - }, - { - "epoch": 31.09, - "learning_rate": 1.5271328671328671e-06, - "loss": 0.4188, - "step": 35880 - }, - { - "epoch": 31.1, - "learning_rate": 1.5264335664335664e-06, - "loss": 0.4129, - "step": 35890 - }, - { - "epoch": 31.11, - "learning_rate": 1.5257342657342655e-06, - "loss": 0.3586, - "step": 35900 - }, - { - "epoch": 31.12, - "learning_rate": 1.525034965034965e-06, - "loss": 0.389, - "step": 35910 - }, - { - "epoch": 31.13, - "learning_rate": 1.5243356643356643e-06, - "loss": 0.3768, - "step": 35920 - }, - { - "epoch": 31.14, - "learning_rate": 1.5236363636363636e-06, - "loss": 0.3302, - "step": 35930 - }, - { - "epoch": 31.14, - "learning_rate": 1.5229370629370628e-06, - "loss": 0.3416, - "step": 35940 - }, - { - "epoch": 31.15, - "learning_rate": 1.5222377622377621e-06, - "loss": 0.3617, - "step": 35950 - }, - { - "epoch": 31.16, - "learning_rate": 1.5215384615384614e-06, - "loss": 0.347, - "step": 35960 - }, - { - "epoch": 31.17, - "learning_rate": 1.520839160839161e-06, - "loss": 0.4397, - "step": 35970 - }, - { - "epoch": 31.18, - "learning_rate": 1.52013986013986e-06, - "loss": 0.33, - "step": 35980 - }, - { - "epoch": 31.19, - "learning_rate": 1.5194405594405593e-06, - "loss": 0.3698, - "step": 35990 - }, - { - "epoch": 31.2, - "learning_rate": 1.5187412587412588e-06, - "loss": 0.2978, - "step": 36000 - }, - { - "epoch": 31.2, - "learning_rate": 1.5180419580419578e-06, - "loss": 0.3654, - "step": 36010 - }, - { - "epoch": 31.21, - "learning_rate": 1.5173426573426573e-06, - "loss": 0.3906, - "step": 36020 - }, - { - "epoch": 31.22, - "learning_rate": 1.5166433566433564e-06, - "loss": 0.4131, - "step": 36030 - }, - { - "epoch": 31.23, - "learning_rate": 1.515944055944056e-06, - "loss": 0.3378, - "step": 36040 - }, - { - "epoch": 31.24, - "learning_rate": 1.5152447552447552e-06, - "loss": 0.3822, - "step": 36050 - }, - { - "epoch": 31.25, - "learning_rate": 1.5145454545454545e-06, - "loss": 0.3885, - "step": 36060 - }, - { - "epoch": 31.26, - "learning_rate": 1.5138461538461538e-06, - "loss": 0.4119, - "step": 36070 - }, - { - "epoch": 31.27, - "learning_rate": 1.513146853146853e-06, - "loss": 0.4497, - "step": 36080 - }, - { - "epoch": 31.27, - "learning_rate": 1.5124475524475523e-06, - "loss": 0.386, - "step": 36090 - }, - { - "epoch": 31.28, - "learning_rate": 1.5117482517482516e-06, - "loss": 0.3351, - "step": 36100 - }, - { - "epoch": 31.29, - "learning_rate": 1.5110489510489511e-06, - "loss": 0.3998, - "step": 36110 - }, - { - "epoch": 31.3, - "learning_rate": 1.5103496503496502e-06, - "loss": 0.4054, - "step": 36120 - }, - { - "epoch": 31.31, - "learning_rate": 1.5096503496503497e-06, - "loss": 0.4027, - "step": 36130 - }, - { - "epoch": 31.32, - "learning_rate": 1.5089510489510488e-06, - "loss": 0.4144, - "step": 36140 - }, - { - "epoch": 31.33, - "learning_rate": 1.5082517482517483e-06, - "loss": 0.3257, - "step": 36150 - }, - { - "epoch": 31.33, - "learning_rate": 1.5075524475524475e-06, - "loss": 0.3145, - "step": 36160 - }, - { - "epoch": 31.34, - "learning_rate": 1.5068531468531466e-06, - "loss": 0.3325, - "step": 36170 - }, - { - "epoch": 31.35, - "learning_rate": 1.5061538461538461e-06, - "loss": 0.3591, - "step": 36180 - }, - { - "epoch": 31.36, - "learning_rate": 1.5054545454545454e-06, - "loss": 0.3613, - "step": 36190 - }, - { - "epoch": 31.37, - "learning_rate": 1.5047552447552447e-06, - "loss": 0.3663, - "step": 36200 - }, - { - "epoch": 31.38, - "learning_rate": 1.504055944055944e-06, - "loss": 0.3922, - "step": 36210 - }, - { - "epoch": 31.39, - "learning_rate": 1.5033566433566433e-06, - "loss": 0.349, - "step": 36220 - }, - { - "epoch": 31.39, - "learning_rate": 1.5026573426573425e-06, - "loss": 0.3971, - "step": 36230 - }, - { - "epoch": 31.4, - "learning_rate": 1.501958041958042e-06, - "loss": 0.3792, - "step": 36240 - }, - { - "epoch": 31.41, - "learning_rate": 1.5012587412587411e-06, - "loss": 0.3938, - "step": 36250 - }, - { - "epoch": 31.42, - "learning_rate": 1.5005594405594404e-06, - "loss": 0.3061, - "step": 36260 - }, - { - "epoch": 31.43, - "learning_rate": 1.49986013986014e-06, - "loss": 0.3731, - "step": 36270 - }, - { - "epoch": 31.44, - "learning_rate": 1.499160839160839e-06, - "loss": 0.3302, - "step": 36280 - }, - { - "epoch": 31.45, - "learning_rate": 1.4984615384615385e-06, - "loss": 0.3524, - "step": 36290 - }, - { - "epoch": 31.46, - "learning_rate": 1.4977622377622378e-06, - "loss": 0.3296, - "step": 36300 - }, - { - "epoch": 31.46, - "learning_rate": 1.497062937062937e-06, - "loss": 0.3934, - "step": 36310 - }, - { - "epoch": 31.47, - "learning_rate": 1.4963636363636363e-06, - "loss": 0.3872, - "step": 36320 - }, - { - "epoch": 31.48, - "learning_rate": 1.4956643356643356e-06, - "loss": 0.3328, - "step": 36330 - }, - { - "epoch": 31.49, - "learning_rate": 1.4949650349650349e-06, - "loss": 0.4192, - "step": 36340 - }, - { - "epoch": 31.5, - "learning_rate": 1.4942657342657342e-06, - "loss": 0.3213, - "step": 36350 - }, - { - "epoch": 31.51, - "learning_rate": 1.4935664335664335e-06, - "loss": 0.3741, - "step": 36360 - }, - { - "epoch": 31.52, - "learning_rate": 1.4928671328671327e-06, - "loss": 0.4464, - "step": 36370 - }, - { - "epoch": 31.52, - "learning_rate": 1.4921678321678322e-06, - "loss": 0.3015, - "step": 36380 - }, - { - "epoch": 31.53, - "learning_rate": 1.4914685314685313e-06, - "loss": 0.4096, - "step": 36390 - }, - { - "epoch": 31.54, - "learning_rate": 1.4907692307692308e-06, - "loss": 0.3798, - "step": 36400 - }, - { - "epoch": 31.55, - "learning_rate": 1.4900699300699299e-06, - "loss": 0.3412, - "step": 36410 - }, - { - "epoch": 31.56, - "learning_rate": 1.4893706293706294e-06, - "loss": 0.3456, - "step": 36420 - }, - { - "epoch": 31.57, - "learning_rate": 1.4886713286713287e-06, - "loss": 0.3703, - "step": 36430 - }, - { - "epoch": 31.58, - "learning_rate": 1.4879720279720277e-06, - "loss": 0.395, - "step": 36440 - }, - { - "epoch": 31.59, - "learning_rate": 1.4872727272727272e-06, - "loss": 0.3474, - "step": 36450 - }, - { - "epoch": 31.59, - "learning_rate": 1.4865734265734265e-06, - "loss": 0.3511, - "step": 36460 - }, - { - "epoch": 31.6, - "learning_rate": 1.4858741258741258e-06, - "loss": 0.3584, - "step": 36470 - }, - { - "epoch": 31.61, - "learning_rate": 1.485174825174825e-06, - "loss": 0.2995, - "step": 36480 - }, - { - "epoch": 31.62, - "learning_rate": 1.4844755244755246e-06, - "loss": 0.3691, - "step": 36490 - }, - { - "epoch": 31.63, - "learning_rate": 1.4837762237762237e-06, - "loss": 0.3622, - "step": 36500 - }, - { - "epoch": 31.64, - "learning_rate": 1.4830769230769232e-06, - "loss": 0.3831, - "step": 36510 - }, - { - "epoch": 31.65, - "learning_rate": 1.4823776223776222e-06, - "loss": 0.3504, - "step": 36520 - }, - { - "epoch": 31.65, - "learning_rate": 1.4816783216783215e-06, - "loss": 0.3921, - "step": 36530 - }, - { - "epoch": 31.66, - "learning_rate": 1.480979020979021e-06, - "loss": 0.3505, - "step": 36540 - }, - { - "epoch": 31.67, - "learning_rate": 1.48027972027972e-06, - "loss": 0.4103, - "step": 36550 - }, - { - "epoch": 31.68, - "learning_rate": 1.4795804195804196e-06, - "loss": 0.3525, - "step": 36560 - }, - { - "epoch": 31.69, - "learning_rate": 1.4788811188811189e-06, - "loss": 0.3725, - "step": 36570 - }, - { - "epoch": 31.7, - "learning_rate": 1.4781818181818182e-06, - "loss": 0.3332, - "step": 36580 - }, - { - "epoch": 31.71, - "learning_rate": 1.4774825174825174e-06, - "loss": 0.3543, - "step": 36590 - }, - { - "epoch": 31.72, - "learning_rate": 1.4767832167832167e-06, - "loss": 0.361, - "step": 36600 - }, - { - "epoch": 31.72, - "learning_rate": 1.476083916083916e-06, - "loss": 0.3543, - "step": 36610 - }, - { - "epoch": 31.73, - "learning_rate": 1.4753846153846153e-06, - "loss": 0.4512, - "step": 36620 - }, - { - "epoch": 31.74, - "learning_rate": 1.4746853146853146e-06, - "loss": 0.3457, - "step": 36630 - }, - { - "epoch": 31.75, - "learning_rate": 1.4739860139860139e-06, - "loss": 0.3774, - "step": 36640 - }, - { - "epoch": 31.76, - "learning_rate": 1.4732867132867134e-06, - "loss": 0.3264, - "step": 36650 - }, - { - "epoch": 31.77, - "learning_rate": 1.4725874125874124e-06, - "loss": 0.3726, - "step": 36660 - }, - { - "epoch": 31.78, - "learning_rate": 1.471888111888112e-06, - "loss": 0.3406, - "step": 36670 - }, - { - "epoch": 31.78, - "learning_rate": 1.471188811188811e-06, - "loss": 0.3768, - "step": 36680 - }, - { - "epoch": 31.79, - "learning_rate": 1.4704895104895105e-06, - "loss": 0.4042, - "step": 36690 - }, - { - "epoch": 31.8, - "learning_rate": 1.4697902097902098e-06, - "loss": 0.3551, - "step": 36700 - }, - { - "epoch": 31.81, - "learning_rate": 1.4690909090909089e-06, - "loss": 0.3684, - "step": 36710 - }, - { - "epoch": 31.82, - "learning_rate": 1.4683916083916084e-06, - "loss": 0.3271, - "step": 36720 - }, - { - "epoch": 31.83, - "learning_rate": 1.4676923076923076e-06, - "loss": 0.4142, - "step": 36730 - }, - { - "epoch": 31.84, - "learning_rate": 1.466993006993007e-06, - "loss": 0.3726, - "step": 36740 - }, - { - "epoch": 31.85, - "learning_rate": 1.4662937062937062e-06, - "loss": 0.3297, - "step": 36750 - }, - { - "epoch": 31.85, - "learning_rate": 1.4655944055944057e-06, - "loss": 0.3958, - "step": 36760 - }, - { - "epoch": 31.86, - "learning_rate": 1.4648951048951048e-06, - "loss": 0.4074, - "step": 36770 - }, - { - "epoch": 31.87, - "learning_rate": 1.464195804195804e-06, - "loss": 0.3892, - "step": 36780 - }, - { - "epoch": 31.88, - "learning_rate": 1.4634965034965034e-06, - "loss": 0.3234, - "step": 36790 - }, - { - "epoch": 31.89, - "learning_rate": 1.4627972027972026e-06, - "loss": 0.385, - "step": 36800 - }, - { - "epoch": 31.9, - "learning_rate": 1.4620979020979021e-06, - "loss": 0.3705, - "step": 36810 - }, - { - "epoch": 31.91, - "learning_rate": 1.4613986013986012e-06, - "loss": 0.3915, - "step": 36820 - }, - { - "epoch": 31.91, - "learning_rate": 1.4606993006993007e-06, - "loss": 0.339, - "step": 36830 - }, - { - "epoch": 31.92, - "learning_rate": 1.46e-06, - "loss": 0.3448, - "step": 36840 - }, - { - "epoch": 31.93, - "learning_rate": 1.4593006993006993e-06, - "loss": 0.3134, - "step": 36850 - }, - { - "epoch": 31.94, - "learning_rate": 1.4586013986013986e-06, - "loss": 0.4355, - "step": 36860 - }, - { - "epoch": 31.95, - "learning_rate": 1.4579020979020976e-06, - "loss": 0.4304, - "step": 36870 - }, - { - "epoch": 31.96, - "learning_rate": 1.4572027972027971e-06, - "loss": 0.3529, - "step": 36880 - }, - { - "epoch": 31.97, - "learning_rate": 1.4565034965034964e-06, - "loss": 0.3889, - "step": 36890 - }, - { - "epoch": 31.98, - "learning_rate": 1.4558041958041957e-06, - "loss": 0.3798, - "step": 36900 - }, - { - "epoch": 31.98, - "learning_rate": 1.455104895104895e-06, - "loss": 0.4097, - "step": 36910 - }, - { - "epoch": 31.99, - "learning_rate": 1.4544055944055945e-06, - "loss": 0.3748, - "step": 36920 - }, - { - "epoch": 32.0, - "eval_loss": 0.5464403033256531, - "eval_runtime": 135.0985, - "eval_samples_per_second": 3.938, - "eval_steps_per_second": 1.969, - "eval_wer": 0.24606286559105225, - "step": 36928 - }, - { - "epoch": 32.0, - "learning_rate": 1.4537062937062936e-06, - "loss": 0.4613, - "step": 36930 - }, - { - "epoch": 32.01, - "learning_rate": 1.453006993006993e-06, - "loss": 0.3701, - "step": 36940 - }, - { - "epoch": 32.02, - "learning_rate": 1.4523076923076921e-06, - "loss": 0.3776, - "step": 36950 - }, - { - "epoch": 32.03, - "learning_rate": 1.4516083916083914e-06, - "loss": 0.3505, - "step": 36960 - }, - { - "epoch": 32.04, - "learning_rate": 1.450909090909091e-06, - "loss": 0.383, - "step": 36970 - }, - { - "epoch": 32.05, - "learning_rate": 1.45020979020979e-06, - "loss": 0.3804, - "step": 36980 - }, - { - "epoch": 32.05, - "learning_rate": 1.4495104895104895e-06, - "loss": 0.4103, - "step": 36990 - }, - { - "epoch": 32.06, - "learning_rate": 1.4488111888111888e-06, - "loss": 0.3761, - "step": 37000 - }, - { - "epoch": 32.07, - "learning_rate": 1.448111888111888e-06, - "loss": 0.3826, - "step": 37010 - }, - { - "epoch": 32.08, - "learning_rate": 1.4474125874125873e-06, - "loss": 0.3426, - "step": 37020 - }, - { - "epoch": 32.09, - "learning_rate": 1.4467132867132868e-06, - "loss": 0.3708, - "step": 37030 - }, - { - "epoch": 32.1, - "learning_rate": 1.446013986013986e-06, - "loss": 0.3203, - "step": 37040 - }, - { - "epoch": 32.11, - "learning_rate": 1.4453146853146852e-06, - "loss": 0.3502, - "step": 37050 - }, - { - "epoch": 32.11, - "learning_rate": 1.4446153846153845e-06, - "loss": 0.3708, - "step": 37060 - }, - { - "epoch": 32.12, - "learning_rate": 1.4439160839160838e-06, - "loss": 0.3684, - "step": 37070 - }, - { - "epoch": 32.13, - "learning_rate": 1.4432167832167833e-06, - "loss": 0.4255, - "step": 37080 - }, - { - "epoch": 32.14, - "learning_rate": 1.4425174825174823e-06, - "loss": 0.4371, - "step": 37090 - }, - { - "epoch": 32.15, - "learning_rate": 1.4418181818181818e-06, - "loss": 0.3368, - "step": 37100 - }, - { - "epoch": 32.16, - "learning_rate": 1.4411188811188811e-06, - "loss": 0.3647, - "step": 37110 - }, - { - "epoch": 32.17, - "learning_rate": 1.4404195804195804e-06, - "loss": 0.3978, - "step": 37120 - }, - { - "epoch": 32.17, - "learning_rate": 1.4397202797202797e-06, - "loss": 0.4447, - "step": 37130 - }, - { - "epoch": 32.18, - "learning_rate": 1.4390209790209788e-06, - "loss": 0.3897, - "step": 37140 - }, - { - "epoch": 32.19, - "learning_rate": 1.4383216783216783e-06, - "loss": 0.3766, - "step": 37150 - }, - { - "epoch": 32.2, - "learning_rate": 1.4376223776223775e-06, - "loss": 0.3374, - "step": 37160 - }, - { - "epoch": 32.21, - "learning_rate": 1.4369230769230768e-06, - "loss": 0.3705, - "step": 37170 - }, - { - "epoch": 32.22, - "learning_rate": 1.4362237762237761e-06, - "loss": 0.4111, - "step": 37180 - }, - { - "epoch": 32.23, - "learning_rate": 1.4355244755244756e-06, - "loss": 0.359, - "step": 37190 - }, - { - "epoch": 32.24, - "learning_rate": 1.4348251748251747e-06, - "loss": 0.353, - "step": 37200 - }, - { - "epoch": 32.24, - "learning_rate": 1.4341258741258742e-06, - "loss": 0.3253, - "step": 37210 - }, - { - "epoch": 32.25, - "learning_rate": 1.4334265734265733e-06, - "loss": 0.3938, - "step": 37220 - }, - { - "epoch": 32.26, - "learning_rate": 1.4327272727272725e-06, - "loss": 0.3608, - "step": 37230 - }, - { - "epoch": 32.27, - "learning_rate": 1.432027972027972e-06, - "loss": 0.352, - "step": 37240 - }, - { - "epoch": 32.28, - "learning_rate": 1.4313286713286711e-06, - "loss": 0.3894, - "step": 37250 - }, - { - "epoch": 32.29, - "learning_rate": 1.4306293706293706e-06, - "loss": 0.3467, - "step": 37260 - }, - { - "epoch": 32.3, - "learning_rate": 1.42993006993007e-06, - "loss": 0.3469, - "step": 37270 - }, - { - "epoch": 32.3, - "learning_rate": 1.4292307692307692e-06, - "loss": 0.3764, - "step": 37280 - }, - { - "epoch": 32.31, - "learning_rate": 1.4285314685314685e-06, - "loss": 0.3941, - "step": 37290 - }, - { - "epoch": 32.32, - "learning_rate": 1.427832167832168e-06, - "loss": 0.3929, - "step": 37300 - }, - { - "epoch": 32.33, - "learning_rate": 1.427132867132867e-06, - "loss": 0.38, - "step": 37310 - }, - { - "epoch": 32.34, - "learning_rate": 1.4264335664335663e-06, - "loss": 0.3292, - "step": 37320 - }, - { - "epoch": 32.35, - "learning_rate": 1.4257342657342656e-06, - "loss": 0.3435, - "step": 37330 - }, - { - "epoch": 32.36, - "learning_rate": 1.4250349650349649e-06, - "loss": 0.4315, - "step": 37340 - }, - { - "epoch": 32.37, - "learning_rate": 1.4243356643356644e-06, - "loss": 0.3478, - "step": 37350 - }, - { - "epoch": 32.37, - "learning_rate": 1.4236363636363635e-06, - "loss": 0.4144, - "step": 37360 - }, - { - "epoch": 32.38, - "learning_rate": 1.422937062937063e-06, - "loss": 0.3293, - "step": 37370 - }, - { - "epoch": 32.39, - "learning_rate": 1.4222377622377622e-06, - "loss": 0.3359, - "step": 37380 - }, - { - "epoch": 32.4, - "learning_rate": 1.4215384615384615e-06, - "loss": 0.3422, - "step": 37390 - }, - { - "epoch": 32.41, - "learning_rate": 1.4208391608391608e-06, - "loss": 0.369, - "step": 37400 - }, - { - "epoch": 32.42, - "learning_rate": 1.4201398601398599e-06, - "loss": 0.3224, - "step": 37410 - }, - { - "epoch": 32.43, - "learning_rate": 1.4194405594405594e-06, - "loss": 0.4373, - "step": 37420 - }, - { - "epoch": 32.43, - "learning_rate": 1.4187412587412587e-06, - "loss": 0.3844, - "step": 37430 - }, - { - "epoch": 32.44, - "learning_rate": 1.418041958041958e-06, - "loss": 0.3759, - "step": 37440 - }, - { - "epoch": 32.45, - "learning_rate": 1.4173426573426572e-06, - "loss": 0.3449, - "step": 37450 - }, - { - "epoch": 32.46, - "learning_rate": 1.4166433566433567e-06, - "loss": 0.4016, - "step": 37460 - }, - { - "epoch": 32.47, - "learning_rate": 1.4159440559440558e-06, - "loss": 0.3822, - "step": 37470 - }, - { - "epoch": 32.48, - "learning_rate": 1.4152447552447553e-06, - "loss": 0.3682, - "step": 37480 - }, - { - "epoch": 32.49, - "learning_rate": 1.4145454545454544e-06, - "loss": 0.3673, - "step": 37490 - }, - { - "epoch": 32.5, - "learning_rate": 1.4138461538461537e-06, - "loss": 0.2964, - "step": 37500 - }, - { - "epoch": 32.5, - "learning_rate": 1.4131468531468532e-06, - "loss": 0.3916, - "step": 37510 - }, - { - "epoch": 32.51, - "learning_rate": 1.4124475524475522e-06, - "loss": 0.4394, - "step": 37520 - }, - { - "epoch": 32.52, - "learning_rate": 1.4117482517482517e-06, - "loss": 0.4339, - "step": 37530 - }, - { - "epoch": 32.53, - "learning_rate": 1.411048951048951e-06, - "loss": 0.3407, - "step": 37540 - }, - { - "epoch": 32.54, - "learning_rate": 1.4103496503496503e-06, - "loss": 0.3609, - "step": 37550 - }, - { - "epoch": 32.55, - "learning_rate": 1.4096503496503496e-06, - "loss": 0.3607, - "step": 37560 - }, - { - "epoch": 32.56, - "learning_rate": 1.408951048951049e-06, - "loss": 0.3941, - "step": 37570 - }, - { - "epoch": 32.56, - "learning_rate": 1.4082517482517482e-06, - "loss": 0.3341, - "step": 37580 - }, - { - "epoch": 32.57, - "learning_rate": 1.4075524475524474e-06, - "loss": 0.3668, - "step": 37590 - }, - { - "epoch": 32.58, - "learning_rate": 1.4068531468531467e-06, - "loss": 0.3347, - "step": 37600 - }, - { - "epoch": 32.59, - "learning_rate": 1.406153846153846e-06, - "loss": 0.322, - "step": 37610 - }, - { - "epoch": 32.6, - "learning_rate": 1.4054545454545455e-06, - "loss": 0.3625, - "step": 37620 - }, - { - "epoch": 32.61, - "learning_rate": 1.4047552447552446e-06, - "loss": 0.3698, - "step": 37630 - }, - { - "epoch": 32.62, - "learning_rate": 1.404055944055944e-06, - "loss": 0.3135, - "step": 37640 - }, - { - "epoch": 32.63, - "learning_rate": 1.4033566433566434e-06, - "loss": 0.4204, - "step": 37650 - }, - { - "epoch": 32.63, - "learning_rate": 1.4026573426573427e-06, - "loss": 0.4076, - "step": 37660 - }, - { - "epoch": 32.64, - "learning_rate": 1.401958041958042e-06, - "loss": 0.3556, - "step": 37670 - }, - { - "epoch": 32.65, - "learning_rate": 1.401258741258741e-06, - "loss": 0.3814, - "step": 37680 - }, - { - "epoch": 32.66, - "learning_rate": 1.4005594405594405e-06, - "loss": 0.3562, - "step": 37690 - }, - { - "epoch": 32.67, - "learning_rate": 1.3998601398601398e-06, - "loss": 0.3452, - "step": 37700 - }, - { - "epoch": 32.68, - "learning_rate": 1.399160839160839e-06, - "loss": 0.3243, - "step": 37710 - }, - { - "epoch": 32.69, - "learning_rate": 1.3984615384615384e-06, - "loss": 0.4003, - "step": 37720 - }, - { - "epoch": 32.69, - "learning_rate": 1.3978321678321678e-06, - "loss": 0.3779, - "step": 37730 - }, - { - "epoch": 32.7, - "learning_rate": 1.3971328671328671e-06, - "loss": 0.4263, - "step": 37740 - }, - { - "epoch": 32.71, - "learning_rate": 1.3964335664335664e-06, - "loss": 0.3623, - "step": 37750 - }, - { - "epoch": 32.72, - "learning_rate": 1.3957342657342657e-06, - "loss": 0.3627, - "step": 37760 - }, - { - "epoch": 32.73, - "learning_rate": 1.395034965034965e-06, - "loss": 0.3887, - "step": 37770 - }, - { - "epoch": 32.74, - "learning_rate": 1.3943356643356643e-06, - "loss": 0.3845, - "step": 37780 - }, - { - "epoch": 32.75, - "learning_rate": 1.3936363636363635e-06, - "loss": 0.4599, - "step": 37790 - }, - { - "epoch": 32.76, - "learning_rate": 1.3929370629370628e-06, - "loss": 0.3522, - "step": 37800 - }, - { - "epoch": 32.76, - "learning_rate": 1.3922377622377621e-06, - "loss": 0.3465, - "step": 37810 - }, - { - "epoch": 32.77, - "learning_rate": 1.3915384615384616e-06, - "loss": 0.4008, - "step": 37820 - }, - { - "epoch": 32.78, - "learning_rate": 1.3908391608391607e-06, - "loss": 0.3572, - "step": 37830 - }, - { - "epoch": 32.79, - "learning_rate": 1.3901398601398602e-06, - "loss": 0.329, - "step": 37840 - }, - { - "epoch": 32.8, - "learning_rate": 1.3894405594405595e-06, - "loss": 0.4115, - "step": 37850 - }, - { - "epoch": 32.81, - "learning_rate": 1.3887412587412585e-06, - "loss": 0.3476, - "step": 37860 - }, - { - "epoch": 32.82, - "learning_rate": 1.388041958041958e-06, - "loss": 0.4221, - "step": 37870 - }, - { - "epoch": 32.82, - "learning_rate": 1.387342657342657e-06, - "loss": 0.3899, - "step": 37880 - }, - { - "epoch": 32.83, - "learning_rate": 1.3866433566433566e-06, - "loss": 0.4039, - "step": 37890 - }, - { - "epoch": 32.84, - "learning_rate": 1.3859440559440559e-06, - "loss": 0.3687, - "step": 37900 - }, - { - "epoch": 32.85, - "learning_rate": 1.3852447552447552e-06, - "loss": 0.3789, - "step": 37910 - }, - { - "epoch": 32.86, - "learning_rate": 1.3845454545454545e-06, - "loss": 0.3715, - "step": 37920 - }, - { - "epoch": 32.87, - "learning_rate": 1.383846153846154e-06, - "loss": 0.3709, - "step": 37930 - }, - { - "epoch": 32.88, - "learning_rate": 1.383146853146853e-06, - "loss": 0.3607, - "step": 37940 - }, - { - "epoch": 32.89, - "learning_rate": 1.3824475524475523e-06, - "loss": 0.3614, - "step": 37950 - }, - { - "epoch": 32.89, - "learning_rate": 1.3817482517482518e-06, - "loss": 0.3373, - "step": 37960 - }, - { - "epoch": 32.9, - "learning_rate": 1.3810489510489509e-06, - "loss": 0.3845, - "step": 37970 - }, - { - "epoch": 32.91, - "learning_rate": 1.3803496503496504e-06, - "loss": 0.3576, - "step": 37980 - }, - { - "epoch": 32.92, - "learning_rate": 1.3796503496503495e-06, - "loss": 0.3313, - "step": 37990 - }, - { - "epoch": 32.93, - "learning_rate": 1.378951048951049e-06, - "loss": 0.3453, - "step": 38000 - }, - { - "epoch": 32.94, - "learning_rate": 1.3782517482517482e-06, - "loss": 0.3868, - "step": 38010 - }, - { - "epoch": 32.95, - "learning_rate": 1.3775524475524475e-06, - "loss": 0.367, - "step": 38020 - }, - { - "epoch": 32.95, - "learning_rate": 1.3768531468531468e-06, - "loss": 0.3803, - "step": 38030 - }, - { - "epoch": 32.96, - "learning_rate": 1.376153846153846e-06, - "loss": 0.3532, - "step": 38040 - }, - { - "epoch": 32.97, - "learning_rate": 1.3754545454545454e-06, - "loss": 0.3733, - "step": 38050 - }, - { - "epoch": 32.98, - "learning_rate": 1.3747552447552447e-06, - "loss": 0.2842, - "step": 38060 - }, - { - "epoch": 32.99, - "learning_rate": 1.374055944055944e-06, - "loss": 0.3842, - "step": 38070 - }, - { - "epoch": 33.0, - "learning_rate": 1.3733566433566432e-06, - "loss": 0.3839, - "step": 38080 - }, - { - "epoch": 33.0, - "eval_loss": 0.5652355551719666, - "eval_runtime": 135.8769, - "eval_samples_per_second": 3.915, - "eval_steps_per_second": 1.958, - "eval_wer": 0.24747701999100083, - "step": 38082 - }, - { - "epoch": 33.01, - "learning_rate": 1.3726573426573427e-06, - "loss": 0.3689, - "step": 38090 - }, - { - "epoch": 33.02, - "learning_rate": 1.3719580419580418e-06, - "loss": 0.3708, - "step": 38100 - }, - { - "epoch": 33.02, - "learning_rate": 1.3712587412587413e-06, - "loss": 0.3431, - "step": 38110 - }, - { - "epoch": 33.03, - "learning_rate": 1.3705594405594406e-06, - "loss": 0.4184, - "step": 38120 - }, - { - "epoch": 33.04, - "learning_rate": 1.3698601398601397e-06, - "loss": 0.3241, - "step": 38130 - }, - { - "epoch": 33.05, - "learning_rate": 1.3691608391608392e-06, - "loss": 0.3318, - "step": 38140 - }, - { - "epoch": 33.06, - "learning_rate": 1.3684615384615384e-06, - "loss": 0.3082, - "step": 38150 - }, - { - "epoch": 33.07, - "learning_rate": 1.3677622377622377e-06, - "loss": 0.3692, - "step": 38160 - }, - { - "epoch": 33.08, - "learning_rate": 1.367062937062937e-06, - "loss": 0.3644, - "step": 38170 - }, - { - "epoch": 33.08, - "learning_rate": 1.3663636363636363e-06, - "loss": 0.3386, - "step": 38180 - }, - { - "epoch": 33.09, - "learning_rate": 1.3656643356643356e-06, - "loss": 0.415, - "step": 38190 - }, - { - "epoch": 33.1, - "learning_rate": 1.364965034965035e-06, - "loss": 0.3905, - "step": 38200 - }, - { - "epoch": 33.11, - "learning_rate": 1.3642657342657342e-06, - "loss": 0.3808, - "step": 38210 - }, - { - "epoch": 33.12, - "learning_rate": 1.3635664335664334e-06, - "loss": 0.4146, - "step": 38220 - }, - { - "epoch": 33.13, - "learning_rate": 1.362867132867133e-06, - "loss": 0.3925, - "step": 38230 - }, - { - "epoch": 33.14, - "learning_rate": 1.362167832167832e-06, - "loss": 0.4243, - "step": 38240 - }, - { - "epoch": 33.15, - "learning_rate": 1.3614685314685315e-06, - "loss": 0.3465, - "step": 38250 - }, - { - "epoch": 33.15, - "learning_rate": 1.3607692307692306e-06, - "loss": 0.3833, - "step": 38260 - }, - { - "epoch": 33.16, - "learning_rate": 1.36006993006993e-06, - "loss": 0.4024, - "step": 38270 - }, - { - "epoch": 33.17, - "learning_rate": 1.3593706293706294e-06, - "loss": 0.3583, - "step": 38280 - }, - { - "epoch": 33.18, - "learning_rate": 1.3586713286713286e-06, - "loss": 0.3401, - "step": 38290 - }, - { - "epoch": 33.19, - "learning_rate": 1.357972027972028e-06, - "loss": 0.3555, - "step": 38300 - }, - { - "epoch": 33.2, - "learning_rate": 1.3572727272727272e-06, - "loss": 0.3101, - "step": 38310 - }, - { - "epoch": 33.21, - "learning_rate": 1.3565734265734265e-06, - "loss": 0.3485, - "step": 38320 - }, - { - "epoch": 33.21, - "learning_rate": 1.3558741258741258e-06, - "loss": 0.4575, - "step": 38330 - }, - { - "epoch": 33.22, - "learning_rate": 1.3551748251748253e-06, - "loss": 0.4007, - "step": 38340 - }, - { - "epoch": 33.23, - "learning_rate": 1.3544755244755244e-06, - "loss": 0.3453, - "step": 38350 - }, - { - "epoch": 33.24, - "learning_rate": 1.3537762237762239e-06, - "loss": 0.387, - "step": 38360 - }, - { - "epoch": 33.25, - "learning_rate": 1.353076923076923e-06, - "loss": 0.3606, - "step": 38370 - }, - { - "epoch": 33.26, - "learning_rate": 1.3523776223776222e-06, - "loss": 0.3628, - "step": 38380 - }, - { - "epoch": 33.27, - "learning_rate": 1.3516783216783217e-06, - "loss": 0.345, - "step": 38390 - }, - { - "epoch": 33.28, - "learning_rate": 1.3509790209790208e-06, - "loss": 0.431, - "step": 38400 - }, - { - "epoch": 33.28, - "learning_rate": 1.3502797202797203e-06, - "loss": 0.373, - "step": 38410 - }, - { - "epoch": 33.29, - "learning_rate": 1.3495804195804196e-06, - "loss": 0.3685, - "step": 38420 - }, - { - "epoch": 33.3, - "learning_rate": 1.3488811188811188e-06, - "loss": 0.3631, - "step": 38430 - }, - { - "epoch": 33.31, - "learning_rate": 1.3481818181818181e-06, - "loss": 0.3509, - "step": 38440 - }, - { - "epoch": 33.32, - "learning_rate": 1.3474825174825174e-06, - "loss": 0.3536, - "step": 38450 - }, - { - "epoch": 33.33, - "learning_rate": 1.3467832167832167e-06, - "loss": 0.3496, - "step": 38460 - }, - { - "epoch": 33.34, - "learning_rate": 1.346083916083916e-06, - "loss": 0.3579, - "step": 38470 - }, - { - "epoch": 33.34, - "learning_rate": 1.3453846153846153e-06, - "loss": 0.3917, - "step": 38480 - }, - { - "epoch": 33.35, - "learning_rate": 1.3446853146853146e-06, - "loss": 0.3634, - "step": 38490 - }, - { - "epoch": 33.36, - "learning_rate": 1.343986013986014e-06, - "loss": 0.3654, - "step": 38500 - }, - { - "epoch": 33.37, - "learning_rate": 1.3432867132867131e-06, - "loss": 0.3681, - "step": 38510 - }, - { - "epoch": 33.38, - "learning_rate": 1.3425874125874126e-06, - "loss": 0.4137, - "step": 38520 - }, - { - "epoch": 33.39, - "learning_rate": 1.3418881118881117e-06, - "loss": 0.3998, - "step": 38530 - }, - { - "epoch": 33.4, - "learning_rate": 1.3411888111888112e-06, - "loss": 0.376, - "step": 38540 - }, - { - "epoch": 33.41, - "learning_rate": 1.3404895104895105e-06, - "loss": 0.3325, - "step": 38550 - }, - { - "epoch": 33.41, - "learning_rate": 1.3397902097902096e-06, - "loss": 0.3865, - "step": 38560 - }, - { - "epoch": 33.42, - "learning_rate": 1.339090909090909e-06, - "loss": 0.4339, - "step": 38570 - }, - { - "epoch": 33.43, - "learning_rate": 1.3383916083916083e-06, - "loss": 0.4056, - "step": 38580 - }, - { - "epoch": 33.44, - "learning_rate": 1.3376923076923076e-06, - "loss": 0.3689, - "step": 38590 - }, - { - "epoch": 33.45, - "learning_rate": 1.336993006993007e-06, - "loss": 0.3898, - "step": 38600 - }, - { - "epoch": 33.46, - "learning_rate": 1.3362937062937064e-06, - "loss": 0.3544, - "step": 38610 - }, - { - "epoch": 33.47, - "learning_rate": 1.3355944055944055e-06, - "loss": 0.3979, - "step": 38620 - }, - { - "epoch": 33.47, - "learning_rate": 1.334895104895105e-06, - "loss": 0.3858, - "step": 38630 - }, - { - "epoch": 33.48, - "learning_rate": 1.334195804195804e-06, - "loss": 0.4398, - "step": 38640 - }, - { - "epoch": 33.49, - "learning_rate": 1.3334965034965033e-06, - "loss": 0.3577, - "step": 38650 - }, - { - "epoch": 33.5, - "learning_rate": 1.3327972027972028e-06, - "loss": 0.3575, - "step": 38660 - }, - { - "epoch": 33.51, - "learning_rate": 1.332097902097902e-06, - "loss": 0.3101, - "step": 38670 - }, - { - "epoch": 33.52, - "learning_rate": 1.3313986013986014e-06, - "loss": 0.4451, - "step": 38680 - }, - { - "epoch": 33.53, - "learning_rate": 1.3306993006993007e-06, - "loss": 0.2943, - "step": 38690 - }, - { - "epoch": 33.54, - "learning_rate": 1.33e-06, - "loss": 0.3424, - "step": 38700 - }, - { - "epoch": 33.54, - "learning_rate": 1.3293006993006993e-06, - "loss": 0.3279, - "step": 38710 - }, - { - "epoch": 33.55, - "learning_rate": 1.3286013986013985e-06, - "loss": 0.3437, - "step": 38720 - }, - { - "epoch": 33.56, - "learning_rate": 1.3279020979020978e-06, - "loss": 0.36, - "step": 38730 - }, - { - "epoch": 33.57, - "learning_rate": 1.3272027972027971e-06, - "loss": 0.3833, - "step": 38740 - }, - { - "epoch": 33.58, - "learning_rate": 1.3265034965034964e-06, - "loss": 0.3473, - "step": 38750 - }, - { - "epoch": 33.59, - "learning_rate": 1.3258041958041957e-06, - "loss": 0.346, - "step": 38760 - }, - { - "epoch": 33.6, - "learning_rate": 1.3251048951048952e-06, - "loss": 0.3609, - "step": 38770 - }, - { - "epoch": 33.6, - "learning_rate": 1.3244055944055943e-06, - "loss": 0.3858, - "step": 38780 - }, - { - "epoch": 33.61, - "learning_rate": 1.3237062937062937e-06, - "loss": 0.3623, - "step": 38790 - }, - { - "epoch": 33.62, - "learning_rate": 1.3230069930069928e-06, - "loss": 0.3254, - "step": 38800 - }, - { - "epoch": 33.63, - "learning_rate": 1.3223076923076923e-06, - "loss": 0.3263, - "step": 38810 - }, - { - "epoch": 33.64, - "learning_rate": 1.3216083916083916e-06, - "loss": 0.3892, - "step": 38820 - }, - { - "epoch": 33.65, - "learning_rate": 1.3209090909090907e-06, - "loss": 0.3618, - "step": 38830 - }, - { - "epoch": 33.66, - "learning_rate": 1.3202097902097902e-06, - "loss": 0.3106, - "step": 38840 - }, - { - "epoch": 33.67, - "learning_rate": 1.3195104895104895e-06, - "loss": 0.3613, - "step": 38850 - }, - { - "epoch": 33.67, - "learning_rate": 1.3188111888111887e-06, - "loss": 0.3396, - "step": 38860 - }, - { - "epoch": 33.68, - "learning_rate": 1.318111888111888e-06, - "loss": 0.356, - "step": 38870 - }, - { - "epoch": 33.69, - "learning_rate": 1.3174125874125875e-06, - "loss": 0.4044, - "step": 38880 - }, - { - "epoch": 33.7, - "learning_rate": 1.3167132867132866e-06, - "loss": 0.3763, - "step": 38890 - }, - { - "epoch": 33.71, - "learning_rate": 1.316013986013986e-06, - "loss": 0.3754, - "step": 38900 - }, - { - "epoch": 33.72, - "learning_rate": 1.3153146853146852e-06, - "loss": 0.3176, - "step": 38910 - }, - { - "epoch": 33.73, - "learning_rate": 1.3146153846153845e-06, - "loss": 0.3711, - "step": 38920 - }, - { - "epoch": 33.73, - "learning_rate": 1.313916083916084e-06, - "loss": 0.3626, - "step": 38930 - }, - { - "epoch": 33.74, - "learning_rate": 1.313216783216783e-06, - "loss": 0.3064, - "step": 38940 - }, - { - "epoch": 33.75, - "learning_rate": 1.3125174825174825e-06, - "loss": 0.4134, - "step": 38950 - }, - { - "epoch": 33.76, - "learning_rate": 1.3118181818181818e-06, - "loss": 0.3612, - "step": 38960 - }, - { - "epoch": 33.77, - "learning_rate": 1.311118881118881e-06, - "loss": 0.4237, - "step": 38970 - }, - { - "epoch": 33.78, - "learning_rate": 1.3104195804195804e-06, - "loss": 0.3579, - "step": 38980 - }, - { - "epoch": 33.79, - "learning_rate": 1.3097202797202797e-06, - "loss": 0.3854, - "step": 38990 - }, - { - "epoch": 33.8, - "learning_rate": 1.309020979020979e-06, - "loss": 0.3347, - "step": 39000 - }, - { - "epoch": 33.8, - "learning_rate": 1.3083216783216782e-06, - "loss": 0.3272, - "step": 39010 - }, - { - "epoch": 33.81, - "learning_rate": 1.3076223776223775e-06, - "loss": 0.387, - "step": 39020 - }, - { - "epoch": 33.82, - "learning_rate": 1.3069230769230768e-06, - "loss": 0.4064, - "step": 39030 - }, - { - "epoch": 33.83, - "learning_rate": 1.3062237762237763e-06, - "loss": 0.3116, - "step": 39040 - }, - { - "epoch": 33.84, - "learning_rate": 1.3055244755244754e-06, - "loss": 0.3533, - "step": 39050 - }, - { - "epoch": 33.85, - "learning_rate": 1.3048251748251749e-06, - "loss": 0.3612, - "step": 39060 - }, - { - "epoch": 33.86, - "learning_rate": 1.304125874125874e-06, - "loss": 0.388, - "step": 39070 - }, - { - "epoch": 33.86, - "learning_rate": 1.3034265734265734e-06, - "loss": 0.4011, - "step": 39080 - }, - { - "epoch": 33.87, - "learning_rate": 1.3027272727272727e-06, - "loss": 0.3565, - "step": 39090 - }, - { - "epoch": 33.88, - "learning_rate": 1.3020279720279718e-06, - "loss": 0.3031, - "step": 39100 - }, - { - "epoch": 33.89, - "learning_rate": 1.3013286713286713e-06, - "loss": 0.3112, - "step": 39110 - }, - { - "epoch": 33.9, - "learning_rate": 1.3006293706293706e-06, - "loss": 0.3636, - "step": 39120 - }, - { - "epoch": 33.91, - "learning_rate": 1.2999300699300699e-06, - "loss": 0.3724, - "step": 39130 - }, - { - "epoch": 33.92, - "learning_rate": 1.2992307692307692e-06, - "loss": 0.3513, - "step": 39140 - }, - { - "epoch": 33.93, - "learning_rate": 1.2985314685314687e-06, - "loss": 0.4349, - "step": 39150 - }, - { - "epoch": 33.93, - "learning_rate": 1.2978321678321677e-06, - "loss": 0.3918, - "step": 39160 - }, - { - "epoch": 33.94, - "learning_rate": 1.2971328671328672e-06, - "loss": 0.4047, - "step": 39170 - }, - { - "epoch": 33.95, - "learning_rate": 1.2964335664335663e-06, - "loss": 0.3356, - "step": 39180 - }, - { - "epoch": 33.96, - "learning_rate": 1.2957342657342656e-06, - "loss": 0.4049, - "step": 39190 - }, - { - "epoch": 33.97, - "learning_rate": 1.295034965034965e-06, - "loss": 0.3867, - "step": 39200 - }, - { - "epoch": 33.98, - "learning_rate": 1.2943356643356642e-06, - "loss": 0.3492, - "step": 39210 - }, - { - "epoch": 33.99, - "learning_rate": 1.2936363636363636e-06, - "loss": 0.4248, - "step": 39220 - }, - { - "epoch": 33.99, - "learning_rate": 1.292937062937063e-06, - "loss": 0.3691, - "step": 39230 - }, - { - "epoch": 34.0, - "eval_loss": 0.5551154017448425, - "eval_runtime": 137.8613, - "eval_samples_per_second": 3.859, - "eval_steps_per_second": 1.929, - "eval_wer": 0.24278459857298965, - "step": 39236 - }, - { - "epoch": 34.0, - "learning_rate": 1.2922377622377622e-06, - "loss": 0.4403, - "step": 39240 - }, - { - "epoch": 34.01, - "learning_rate": 1.2915384615384615e-06, - "loss": 0.3549, - "step": 39250 - }, - { - "epoch": 34.02, - "learning_rate": 1.2908391608391608e-06, - "loss": 0.3839, - "step": 39260 - }, - { - "epoch": 34.03, - "learning_rate": 1.29013986013986e-06, - "loss": 0.351, - "step": 39270 - }, - { - "epoch": 34.04, - "learning_rate": 1.2894405594405594e-06, - "loss": 0.3648, - "step": 39280 - }, - { - "epoch": 34.05, - "learning_rate": 1.2887412587412586e-06, - "loss": 0.3786, - "step": 39290 - }, - { - "epoch": 34.06, - "learning_rate": 1.288041958041958e-06, - "loss": 0.3918, - "step": 39300 - }, - { - "epoch": 34.06, - "learning_rate": 1.2873426573426574e-06, - "loss": 0.3271, - "step": 39310 - }, - { - "epoch": 34.07, - "learning_rate": 1.2866433566433565e-06, - "loss": 0.3704, - "step": 39320 - }, - { - "epoch": 34.08, - "learning_rate": 1.285944055944056e-06, - "loss": 0.3887, - "step": 39330 - }, - { - "epoch": 34.09, - "learning_rate": 1.285244755244755e-06, - "loss": 0.3977, - "step": 39340 - }, - { - "epoch": 34.1, - "learning_rate": 1.2845454545454544e-06, - "loss": 0.3211, - "step": 39350 - }, - { - "epoch": 34.11, - "learning_rate": 1.2838461538461539e-06, - "loss": 0.4011, - "step": 39360 - }, - { - "epoch": 34.12, - "learning_rate": 1.283146853146853e-06, - "loss": 0.4222, - "step": 39370 - }, - { - "epoch": 34.12, - "learning_rate": 1.2824475524475524e-06, - "loss": 0.4083, - "step": 39380 - }, - { - "epoch": 34.13, - "learning_rate": 1.2817482517482517e-06, - "loss": 0.3787, - "step": 39390 - }, - { - "epoch": 34.14, - "learning_rate": 1.281048951048951e-06, - "loss": 0.4088, - "step": 39400 - }, - { - "epoch": 34.15, - "learning_rate": 1.2803496503496503e-06, - "loss": 0.3065, - "step": 39410 - }, - { - "epoch": 34.16, - "learning_rate": 1.2796503496503498e-06, - "loss": 0.3769, - "step": 39420 - }, - { - "epoch": 34.17, - "learning_rate": 1.2789510489510488e-06, - "loss": 0.4346, - "step": 39430 - }, - { - "epoch": 34.18, - "learning_rate": 1.2782517482517481e-06, - "loss": 0.2899, - "step": 39440 - }, - { - "epoch": 34.19, - "learning_rate": 1.2775524475524474e-06, - "loss": 0.3924, - "step": 39450 - }, - { - "epoch": 34.19, - "learning_rate": 1.2768531468531467e-06, - "loss": 0.3546, - "step": 39460 - }, - { - "epoch": 34.2, - "learning_rate": 1.2761538461538462e-06, - "loss": 0.3824, - "step": 39470 - }, - { - "epoch": 34.21, - "learning_rate": 1.2754545454545453e-06, - "loss": 0.3687, - "step": 39480 - }, - { - "epoch": 34.22, - "learning_rate": 1.2747552447552448e-06, - "loss": 0.3505, - "step": 39490 - }, - { - "epoch": 34.23, - "learning_rate": 1.274055944055944e-06, - "loss": 0.3921, - "step": 39500 - }, - { - "epoch": 34.24, - "learning_rate": 1.2733566433566433e-06, - "loss": 0.3381, - "step": 39510 - }, - { - "epoch": 34.25, - "learning_rate": 1.2726573426573426e-06, - "loss": 0.3819, - "step": 39520 - }, - { - "epoch": 34.25, - "learning_rate": 1.2719580419580417e-06, - "loss": 0.3564, - "step": 39530 - }, - { - "epoch": 34.26, - "learning_rate": 1.2712587412587412e-06, - "loss": 0.3359, - "step": 39540 - }, - { - "epoch": 34.27, - "learning_rate": 1.2705594405594405e-06, - "loss": 0.3467, - "step": 39550 - }, - { - "epoch": 34.28, - "learning_rate": 1.2698601398601398e-06, - "loss": 0.3431, - "step": 39560 - }, - { - "epoch": 34.29, - "learning_rate": 1.269160839160839e-06, - "loss": 0.3082, - "step": 39570 - }, - { - "epoch": 34.3, - "learning_rate": 1.2684615384615385e-06, - "loss": 0.4237, - "step": 39580 - }, - { - "epoch": 34.31, - "learning_rate": 1.2677622377622376e-06, - "loss": 0.3363, - "step": 39590 - }, - { - "epoch": 34.32, - "learning_rate": 1.2670629370629371e-06, - "loss": 0.3542, - "step": 39600 - }, - { - "epoch": 34.32, - "learning_rate": 1.2663636363636364e-06, - "loss": 0.3788, - "step": 39610 - }, - { - "epoch": 34.33, - "learning_rate": 1.2656643356643355e-06, - "loss": 0.3864, - "step": 39620 - }, - { - "epoch": 34.34, - "learning_rate": 1.264965034965035e-06, - "loss": 0.4107, - "step": 39630 - }, - { - "epoch": 34.35, - "learning_rate": 1.264265734265734e-06, - "loss": 0.3733, - "step": 39640 - }, - { - "epoch": 34.36, - "learning_rate": 1.2635664335664335e-06, - "loss": 0.353, - "step": 39650 - }, - { - "epoch": 34.37, - "learning_rate": 1.2628671328671328e-06, - "loss": 0.4167, - "step": 39660 - }, - { - "epoch": 34.38, - "learning_rate": 1.2621678321678321e-06, - "loss": 0.35, - "step": 39670 - }, - { - "epoch": 34.38, - "learning_rate": 1.2614685314685314e-06, - "loss": 0.3884, - "step": 39680 - }, - { - "epoch": 34.39, - "learning_rate": 1.260769230769231e-06, - "loss": 0.308, - "step": 39690 - }, - { - "epoch": 34.4, - "learning_rate": 1.26006993006993e-06, - "loss": 0.3529, - "step": 39700 - }, - { - "epoch": 34.41, - "learning_rate": 1.2593706293706293e-06, - "loss": 0.3589, - "step": 39710 - }, - { - "epoch": 34.42, - "learning_rate": 1.2586713286713285e-06, - "loss": 0.3543, - "step": 39720 - }, - { - "epoch": 34.43, - "learning_rate": 1.2579720279720278e-06, - "loss": 0.3261, - "step": 39730 - }, - { - "epoch": 34.44, - "learning_rate": 1.2572727272727273e-06, - "loss": 0.3342, - "step": 39740 - }, - { - "epoch": 34.45, - "learning_rate": 1.2565734265734264e-06, - "loss": 0.3243, - "step": 39750 - }, - { - "epoch": 34.45, - "learning_rate": 1.255874125874126e-06, - "loss": 0.3558, - "step": 39760 - }, - { - "epoch": 34.46, - "learning_rate": 1.2551748251748252e-06, - "loss": 0.3326, - "step": 39770 - }, - { - "epoch": 34.47, - "learning_rate": 1.2544755244755245e-06, - "loss": 0.375, - "step": 39780 - }, - { - "epoch": 34.48, - "learning_rate": 1.2537762237762238e-06, - "loss": 0.4022, - "step": 39790 - }, - { - "epoch": 34.49, - "learning_rate": 1.2530769230769228e-06, - "loss": 0.3326, - "step": 39800 - }, - { - "epoch": 34.5, - "learning_rate": 1.2523776223776223e-06, - "loss": 0.3484, - "step": 39810 - }, - { - "epoch": 34.51, - "learning_rate": 1.2516783216783216e-06, - "loss": 0.3685, - "step": 39820 - }, - { - "epoch": 34.51, - "learning_rate": 1.2509790209790209e-06, - "loss": 0.3734, - "step": 39830 - }, - { - "epoch": 34.52, - "learning_rate": 1.2502797202797202e-06, - "loss": 0.3993, - "step": 39840 - }, - { - "epoch": 34.53, - "learning_rate": 1.2495804195804197e-06, - "loss": 0.3761, - "step": 39850 - }, - { - "epoch": 34.54, - "learning_rate": 1.2488811188811187e-06, - "loss": 0.3446, - "step": 39860 - }, - { - "epoch": 34.55, - "learning_rate": 1.2481818181818182e-06, - "loss": 0.3621, - "step": 39870 - }, - { - "epoch": 34.56, - "learning_rate": 1.2474825174825175e-06, - "loss": 0.3581, - "step": 39880 - }, - { - "epoch": 34.57, - "learning_rate": 1.2467832167832166e-06, - "loss": 0.3283, - "step": 39890 - }, - { - "epoch": 34.58, - "learning_rate": 1.246083916083916e-06, - "loss": 0.3868, - "step": 39900 - }, - { - "epoch": 34.58, - "learning_rate": 1.2453846153846152e-06, - "loss": 0.3612, - "step": 39910 - }, - { - "epoch": 34.59, - "learning_rate": 1.2446853146853147e-06, - "loss": 0.3328, - "step": 39920 - }, - { - "epoch": 34.6, - "learning_rate": 1.243986013986014e-06, - "loss": 0.3535, - "step": 39930 - }, - { - "epoch": 34.61, - "learning_rate": 1.2432867132867132e-06, - "loss": 0.3693, - "step": 39940 - }, - { - "epoch": 34.62, - "learning_rate": 1.2425874125874125e-06, - "loss": 0.3924, - "step": 39950 - }, - { - "epoch": 34.63, - "learning_rate": 1.241888111888112e-06, - "loss": 0.3339, - "step": 39960 - }, - { - "epoch": 34.64, - "learning_rate": 1.241188811188811e-06, - "loss": 0.3502, - "step": 39970 - }, - { - "epoch": 34.64, - "learning_rate": 1.2404895104895104e-06, - "loss": 0.416, - "step": 39980 - }, - { - "epoch": 34.65, - "learning_rate": 1.2397902097902097e-06, - "loss": 0.3613, - "step": 39990 - }, - { - "epoch": 34.66, - "learning_rate": 1.239090909090909e-06, - "loss": 0.3711, - "step": 40000 - }, - { - "epoch": 34.67, - "learning_rate": 1.2383916083916084e-06, - "loss": 0.3933, - "step": 40010 - }, - { - "epoch": 34.68, - "learning_rate": 1.2376923076923075e-06, - "loss": 0.3666, - "step": 40020 - }, - { - "epoch": 34.69, - "learning_rate": 1.236993006993007e-06, - "loss": 0.3581, - "step": 40030 - }, - { - "epoch": 34.7, - "learning_rate": 1.2362937062937063e-06, - "loss": 0.4526, - "step": 40040 - }, - { - "epoch": 34.71, - "learning_rate": 1.2355944055944056e-06, - "loss": 0.3394, - "step": 40050 - }, - { - "epoch": 34.71, - "learning_rate": 1.2348951048951049e-06, - "loss": 0.349, - "step": 40060 - }, - { - "epoch": 34.72, - "learning_rate": 1.234195804195804e-06, - "loss": 0.3608, - "step": 40070 - }, - { - "epoch": 34.73, - "learning_rate": 1.2334965034965034e-06, - "loss": 0.4293, - "step": 40080 - }, - { - "epoch": 34.74, - "learning_rate": 1.2327972027972027e-06, - "loss": 0.4366, - "step": 40090 - }, - { - "epoch": 34.75, - "learning_rate": 1.232097902097902e-06, - "loss": 0.3568, - "step": 40100 - }, - { - "epoch": 34.76, - "learning_rate": 1.2313986013986013e-06, - "loss": 0.2909, - "step": 40110 - }, - { - "epoch": 34.77, - "learning_rate": 1.2306993006993008e-06, - "loss": 0.3152, - "step": 40120 - }, - { - "epoch": 34.77, - "learning_rate": 1.2299999999999999e-06, - "loss": 0.3114, - "step": 40130 - }, - { - "epoch": 34.78, - "learning_rate": 1.2293006993006994e-06, - "loss": 0.3518, - "step": 40140 - }, - { - "epoch": 34.79, - "learning_rate": 1.2286013986013987e-06, - "loss": 0.3207, - "step": 40150 - }, - { - "epoch": 34.8, - "learning_rate": 1.2279020979020977e-06, - "loss": 0.348, - "step": 40160 - }, - { - "epoch": 34.81, - "learning_rate": 1.2272027972027972e-06, - "loss": 0.335, - "step": 40170 - }, - { - "epoch": 34.82, - "learning_rate": 1.2265034965034963e-06, - "loss": 0.3758, - "step": 40180 - }, - { - "epoch": 34.83, - "learning_rate": 1.2258041958041958e-06, - "loss": 0.3648, - "step": 40190 - }, - { - "epoch": 34.83, - "learning_rate": 1.225104895104895e-06, - "loss": 0.4195, - "step": 40200 - }, - { - "epoch": 34.84, - "learning_rate": 1.2244055944055944e-06, - "loss": 0.3287, - "step": 40210 - }, - { - "epoch": 34.85, - "learning_rate": 1.2237062937062936e-06, - "loss": 0.388, - "step": 40220 - }, - { - "epoch": 34.86, - "learning_rate": 1.2230069930069931e-06, - "loss": 0.3598, - "step": 40230 - }, - { - "epoch": 34.87, - "learning_rate": 1.2223076923076922e-06, - "loss": 0.3694, - "step": 40240 - }, - { - "epoch": 34.88, - "learning_rate": 1.2216083916083915e-06, - "loss": 0.3836, - "step": 40250 - }, - { - "epoch": 34.89, - "learning_rate": 1.2209090909090908e-06, - "loss": 0.3677, - "step": 40260 - }, - { - "epoch": 34.9, - "learning_rate": 1.22020979020979e-06, - "loss": 0.3912, - "step": 40270 - }, - { - "epoch": 34.9, - "learning_rate": 1.2195104895104896e-06, - "loss": 0.3673, - "step": 40280 - }, - { - "epoch": 34.91, - "learning_rate": 1.2188111888111886e-06, - "loss": 0.3944, - "step": 40290 - }, - { - "epoch": 34.92, - "learning_rate": 1.2181118881118881e-06, - "loss": 0.3404, - "step": 40300 - }, - { - "epoch": 34.93, - "learning_rate": 1.2174125874125874e-06, - "loss": 0.3558, - "step": 40310 - }, - { - "epoch": 34.94, - "learning_rate": 1.2167132867132867e-06, - "loss": 0.3658, - "step": 40320 - }, - { - "epoch": 34.95, - "learning_rate": 1.216013986013986e-06, - "loss": 0.3326, - "step": 40330 - }, - { - "epoch": 34.96, - "learning_rate": 1.215314685314685e-06, - "loss": 0.355, - "step": 40340 - }, - { - "epoch": 34.96, - "learning_rate": 1.2146153846153846e-06, - "loss": 0.3233, - "step": 40350 - }, - { - "epoch": 34.97, - "learning_rate": 1.2139160839160839e-06, - "loss": 0.3928, - "step": 40360 - }, - { - "epoch": 34.98, - "learning_rate": 1.2132167832167831e-06, - "loss": 0.342, - "step": 40370 - }, - { - "epoch": 34.99, - "learning_rate": 1.2125174825174824e-06, - "loss": 0.3841, - "step": 40380 - }, - { - "epoch": 35.0, - "learning_rate": 1.211818181818182e-06, - "loss": 0.3076, - "step": 40390 - }, - { - "epoch": 35.0, - "eval_loss": 0.555358350276947, - "eval_runtime": 136.1151, - "eval_samples_per_second": 3.908, - "eval_steps_per_second": 1.954, - "eval_wer": 0.24631998457286108, - "step": 40390 - }, - { - "epoch": 35.01, - "learning_rate": 1.211118881118881e-06, - "loss": 0.3906, - "step": 40400 - }, - { - "epoch": 35.02, - "learning_rate": 1.2104195804195803e-06, - "loss": 0.3476, - "step": 40410 - }, - { - "epoch": 35.03, - "learning_rate": 1.2097202797202798e-06, - "loss": 0.3169, - "step": 40420 - }, - { - "epoch": 35.03, - "learning_rate": 1.2090209790209788e-06, - "loss": 0.3608, - "step": 40430 - }, - { - "epoch": 35.04, - "learning_rate": 1.2083216783216783e-06, - "loss": 0.3543, - "step": 40440 - }, - { - "epoch": 35.05, - "learning_rate": 1.2076223776223774e-06, - "loss": 0.3396, - "step": 40450 - }, - { - "epoch": 35.06, - "learning_rate": 1.206923076923077e-06, - "loss": 0.3822, - "step": 40460 - }, - { - "epoch": 35.07, - "learning_rate": 1.2062237762237762e-06, - "loss": 0.368, - "step": 40470 - }, - { - "epoch": 35.08, - "learning_rate": 1.2055244755244755e-06, - "loss": 0.3727, - "step": 40480 - }, - { - "epoch": 35.09, - "learning_rate": 1.2048251748251748e-06, - "loss": 0.4509, - "step": 40490 - }, - { - "epoch": 35.1, - "learning_rate": 1.204125874125874e-06, - "loss": 0.3545, - "step": 40500 - }, - { - "epoch": 35.1, - "learning_rate": 1.2034265734265733e-06, - "loss": 0.3603, - "step": 40510 - }, - { - "epoch": 35.11, - "learning_rate": 1.2027272727272726e-06, - "loss": 0.3675, - "step": 40520 - }, - { - "epoch": 35.12, - "learning_rate": 1.202027972027972e-06, - "loss": 0.3915, - "step": 40530 - }, - { - "epoch": 35.13, - "learning_rate": 1.2013286713286712e-06, - "loss": 0.3879, - "step": 40540 - }, - { - "epoch": 35.14, - "learning_rate": 1.2006293706293707e-06, - "loss": 0.3236, - "step": 40550 - }, - { - "epoch": 35.15, - "learning_rate": 1.1999300699300698e-06, - "loss": 0.3697, - "step": 40560 - }, - { - "epoch": 35.16, - "learning_rate": 1.1992307692307693e-06, - "loss": 0.2743, - "step": 40570 - }, - { - "epoch": 35.16, - "learning_rate": 1.1985314685314686e-06, - "loss": 0.3614, - "step": 40580 - }, - { - "epoch": 35.17, - "learning_rate": 1.1978321678321676e-06, - "loss": 0.3894, - "step": 40590 - }, - { - "epoch": 35.18, - "learning_rate": 1.1971328671328671e-06, - "loss": 0.3921, - "step": 40600 - }, - { - "epoch": 35.19, - "learning_rate": 1.1964335664335662e-06, - "loss": 0.3577, - "step": 40610 - }, - { - "epoch": 35.2, - "learning_rate": 1.1957342657342657e-06, - "loss": 0.3331, - "step": 40620 - }, - { - "epoch": 35.21, - "learning_rate": 1.195034965034965e-06, - "loss": 0.3841, - "step": 40630 - }, - { - "epoch": 35.22, - "learning_rate": 1.1943356643356643e-06, - "loss": 0.337, - "step": 40640 - }, - { - "epoch": 35.23, - "learning_rate": 1.1936363636363635e-06, - "loss": 0.3891, - "step": 40650 - }, - { - "epoch": 35.23, - "learning_rate": 1.192937062937063e-06, - "loss": 0.3329, - "step": 40660 - }, - { - "epoch": 35.24, - "learning_rate": 1.1922377622377621e-06, - "loss": 0.3652, - "step": 40670 - }, - { - "epoch": 35.25, - "learning_rate": 1.1915384615384614e-06, - "loss": 0.3531, - "step": 40680 - }, - { - "epoch": 35.26, - "learning_rate": 1.190839160839161e-06, - "loss": 0.4004, - "step": 40690 - }, - { - "epoch": 35.27, - "learning_rate": 1.19013986013986e-06, - "loss": 0.3696, - "step": 40700 - }, - { - "epoch": 35.28, - "learning_rate": 1.1894405594405595e-06, - "loss": 0.3911, - "step": 40710 - }, - { - "epoch": 35.29, - "learning_rate": 1.1887412587412585e-06, - "loss": 0.4062, - "step": 40720 - }, - { - "epoch": 35.29, - "learning_rate": 1.188041958041958e-06, - "loss": 0.4332, - "step": 40730 - }, - { - "epoch": 35.3, - "learning_rate": 1.1873426573426573e-06, - "loss": 0.41, - "step": 40740 - }, - { - "epoch": 35.31, - "learning_rate": 1.1866433566433566e-06, - "loss": 0.3732, - "step": 40750 - }, - { - "epoch": 35.32, - "learning_rate": 1.185944055944056e-06, - "loss": 0.3851, - "step": 40760 - }, - { - "epoch": 35.33, - "learning_rate": 1.1852447552447552e-06, - "loss": 0.3678, - "step": 40770 - }, - { - "epoch": 35.34, - "learning_rate": 1.1845454545454545e-06, - "loss": 0.4117, - "step": 40780 - }, - { - "epoch": 35.35, - "learning_rate": 1.1838461538461538e-06, - "loss": 0.4182, - "step": 40790 - }, - { - "epoch": 35.36, - "learning_rate": 1.183146853146853e-06, - "loss": 0.4155, - "step": 40800 - }, - { - "epoch": 35.36, - "learning_rate": 1.1824475524475523e-06, - "loss": 0.3544, - "step": 40810 - }, - { - "epoch": 35.37, - "learning_rate": 1.1817482517482518e-06, - "loss": 0.3307, - "step": 40820 - }, - { - "epoch": 35.38, - "learning_rate": 1.1810489510489509e-06, - "loss": 0.341, - "step": 40830 - }, - { - "epoch": 35.39, - "learning_rate": 1.1803496503496504e-06, - "loss": 0.3709, - "step": 40840 - }, - { - "epoch": 35.4, - "learning_rate": 1.1796503496503497e-06, - "loss": 0.3244, - "step": 40850 - }, - { - "epoch": 35.41, - "learning_rate": 1.1789510489510487e-06, - "loss": 0.3738, - "step": 40860 - }, - { - "epoch": 35.42, - "learning_rate": 1.1782517482517482e-06, - "loss": 0.3641, - "step": 40870 - }, - { - "epoch": 35.42, - "learning_rate": 1.1775524475524475e-06, - "loss": 0.3363, - "step": 40880 - }, - { - "epoch": 35.43, - "learning_rate": 1.1768531468531468e-06, - "loss": 0.3307, - "step": 40890 - }, - { - "epoch": 35.44, - "learning_rate": 1.176153846153846e-06, - "loss": 0.4423, - "step": 40900 - }, - { - "epoch": 35.45, - "learning_rate": 1.1754545454545454e-06, - "loss": 0.3662, - "step": 40910 - }, - { - "epoch": 35.46, - "learning_rate": 1.1747552447552447e-06, - "loss": 0.3772, - "step": 40920 - }, - { - "epoch": 35.47, - "learning_rate": 1.1740559440559442e-06, - "loss": 0.415, - "step": 40930 - }, - { - "epoch": 35.48, - "learning_rate": 1.1733566433566432e-06, - "loss": 0.4153, - "step": 40940 - }, - { - "epoch": 35.49, - "learning_rate": 1.1726573426573425e-06, - "loss": 0.3248, - "step": 40950 - }, - { - "epoch": 35.49, - "learning_rate": 1.171958041958042e-06, - "loss": 0.3395, - "step": 40960 - }, - { - "epoch": 35.5, - "learning_rate": 1.171258741258741e-06, - "loss": 0.3559, - "step": 40970 - }, - { - "epoch": 35.51, - "learning_rate": 1.1705594405594406e-06, - "loss": 0.4002, - "step": 40980 - }, - { - "epoch": 35.52, - "learning_rate": 1.1698601398601397e-06, - "loss": 0.299, - "step": 40990 - }, - { - "epoch": 35.53, - "learning_rate": 1.1691608391608392e-06, - "loss": 0.39, - "step": 41000 - }, - { - "epoch": 35.54, - "learning_rate": 1.1684615384615384e-06, - "loss": 0.3827, - "step": 41010 - }, - { - "epoch": 35.55, - "learning_rate": 1.1677622377622377e-06, - "loss": 0.318, - "step": 41020 - }, - { - "epoch": 35.55, - "learning_rate": 1.167062937062937e-06, - "loss": 0.3562, - "step": 41030 - }, - { - "epoch": 35.56, - "learning_rate": 1.1663636363636363e-06, - "loss": 0.3558, - "step": 41040 - }, - { - "epoch": 35.57, - "learning_rate": 1.1656643356643356e-06, - "loss": 0.3021, - "step": 41050 - }, - { - "epoch": 35.58, - "learning_rate": 1.1649650349650349e-06, - "loss": 0.3554, - "step": 41060 - }, - { - "epoch": 35.59, - "learning_rate": 1.1642657342657344e-06, - "loss": 0.3894, - "step": 41070 - }, - { - "epoch": 35.6, - "learning_rate": 1.1635664335664334e-06, - "loss": 0.3829, - "step": 41080 - }, - { - "epoch": 35.61, - "learning_rate": 1.162867132867133e-06, - "loss": 0.3827, - "step": 41090 - }, - { - "epoch": 35.61, - "learning_rate": 1.162167832167832e-06, - "loss": 0.3726, - "step": 41100 - }, - { - "epoch": 35.62, - "learning_rate": 1.1614685314685315e-06, - "loss": 0.3703, - "step": 41110 - }, - { - "epoch": 35.63, - "learning_rate": 1.1607692307692308e-06, - "loss": 0.3142, - "step": 41120 - }, - { - "epoch": 35.64, - "learning_rate": 1.1600699300699299e-06, - "loss": 0.3549, - "step": 41130 - }, - { - "epoch": 35.65, - "learning_rate": 1.1593706293706294e-06, - "loss": 0.3436, - "step": 41140 - }, - { - "epoch": 35.66, - "learning_rate": 1.1586713286713287e-06, - "loss": 0.3383, - "step": 41150 - }, - { - "epoch": 35.67, - "learning_rate": 1.157972027972028e-06, - "loss": 0.3643, - "step": 41160 - }, - { - "epoch": 35.68, - "learning_rate": 1.1572727272727272e-06, - "loss": 0.3612, - "step": 41170 - }, - { - "epoch": 35.68, - "learning_rate": 1.1565734265734265e-06, - "loss": 0.3992, - "step": 41180 - }, - { - "epoch": 35.69, - "learning_rate": 1.1558741258741258e-06, - "loss": 0.428, - "step": 41190 - }, - { - "epoch": 35.7, - "learning_rate": 1.1551748251748253e-06, - "loss": 0.3955, - "step": 41200 - }, - { - "epoch": 35.71, - "learning_rate": 1.1544755244755244e-06, - "loss": 0.3796, - "step": 41210 - }, - { - "epoch": 35.72, - "learning_rate": 1.1537762237762236e-06, - "loss": 0.3313, - "step": 41220 - }, - { - "epoch": 35.73, - "learning_rate": 1.1530769230769231e-06, - "loss": 0.3473, - "step": 41230 - }, - { - "epoch": 35.74, - "learning_rate": 1.1523776223776222e-06, - "loss": 0.4113, - "step": 41240 - }, - { - "epoch": 35.74, - "learning_rate": 1.1516783216783217e-06, - "loss": 0.3303, - "step": 41250 - }, - { - "epoch": 35.75, - "learning_rate": 1.1509790209790208e-06, - "loss": 0.3426, - "step": 41260 - }, - { - "epoch": 35.76, - "learning_rate": 1.1502797202797203e-06, - "loss": 0.3911, - "step": 41270 - }, - { - "epoch": 35.77, - "learning_rate": 1.1495804195804196e-06, - "loss": 0.3745, - "step": 41280 - }, - { - "epoch": 35.78, - "learning_rate": 1.1488811188811189e-06, - "loss": 0.3718, - "step": 41290 - }, - { - "epoch": 35.79, - "learning_rate": 1.1481818181818181e-06, - "loss": 0.3834, - "step": 41300 - }, - { - "epoch": 35.8, - "learning_rate": 1.1474825174825174e-06, - "loss": 0.3581, - "step": 41310 - }, - { - "epoch": 35.81, - "learning_rate": 1.1467832167832167e-06, - "loss": 0.3344, - "step": 41320 - }, - { - "epoch": 35.81, - "learning_rate": 1.146083916083916e-06, - "loss": 0.3605, - "step": 41330 - }, - { - "epoch": 35.82, - "learning_rate": 1.1453846153846155e-06, - "loss": 0.3628, - "step": 41340 - }, - { - "epoch": 35.83, - "learning_rate": 1.1446853146853146e-06, - "loss": 0.3644, - "step": 41350 - }, - { - "epoch": 35.84, - "learning_rate": 1.143986013986014e-06, - "loss": 0.4126, - "step": 41360 - }, - { - "epoch": 35.85, - "learning_rate": 1.1432867132867131e-06, - "loss": 0.3505, - "step": 41370 - }, - { - "epoch": 35.86, - "learning_rate": 1.1425874125874124e-06, - "loss": 0.3332, - "step": 41380 - }, - { - "epoch": 35.87, - "learning_rate": 1.141888111888112e-06, - "loss": 0.3638, - "step": 41390 - }, - { - "epoch": 35.87, - "learning_rate": 1.141188811188811e-06, - "loss": 0.3721, - "step": 41400 - }, - { - "epoch": 35.88, - "learning_rate": 1.1404895104895105e-06, - "loss": 0.3965, - "step": 41410 - }, - { - "epoch": 35.89, - "learning_rate": 1.1397902097902098e-06, - "loss": 0.3817, - "step": 41420 - }, - { - "epoch": 35.9, - "learning_rate": 1.139090909090909e-06, - "loss": 0.3677, - "step": 41430 - }, - { - "epoch": 35.91, - "learning_rate": 1.1383916083916083e-06, - "loss": 0.3984, - "step": 41440 - }, - { - "epoch": 35.92, - "learning_rate": 1.1376923076923076e-06, - "loss": 0.3994, - "step": 41450 - }, - { - "epoch": 35.93, - "learning_rate": 1.136993006993007e-06, - "loss": 0.4064, - "step": 41460 - }, - { - "epoch": 35.94, - "learning_rate": 1.1362937062937062e-06, - "loss": 0.3398, - "step": 41470 - }, - { - "epoch": 35.94, - "learning_rate": 1.1355944055944055e-06, - "loss": 0.3784, - "step": 41480 - }, - { - "epoch": 35.95, - "learning_rate": 1.1348951048951048e-06, - "loss": 0.3623, - "step": 41490 - }, - { - "epoch": 35.96, - "learning_rate": 1.1341958041958043e-06, - "loss": 0.3722, - "step": 41500 - }, - { - "epoch": 35.97, - "learning_rate": 1.1334965034965033e-06, - "loss": 0.3532, - "step": 41510 - }, - { - "epoch": 35.98, - "learning_rate": 1.1327972027972028e-06, - "loss": 0.363, - "step": 41520 - }, - { - "epoch": 35.99, - "learning_rate": 1.132097902097902e-06, - "loss": 0.3761, - "step": 41530 - }, - { - "epoch": 36.0, - "learning_rate": 1.1313986013986014e-06, - "loss": 0.3886, - "step": 41540 - }, - { - "epoch": 36.0, - "eval_loss": 0.558751106262207, - "eval_runtime": 137.2985, - "eval_samples_per_second": 3.875, - "eval_steps_per_second": 1.937, - "eval_wer": 0.24612714533650445, - "step": 41544 - }, - { - "epoch": 36.01, - "learning_rate": 1.1306993006993007e-06, - "loss": 0.3106, - "step": 41550 - }, - { - "epoch": 36.01, - "learning_rate": 1.1299999999999998e-06, - "loss": 0.3924, - "step": 41560 - }, - { - "epoch": 36.02, - "learning_rate": 1.1293006993006993e-06, - "loss": 0.346, - "step": 41570 - }, - { - "epoch": 36.03, - "learning_rate": 1.1286013986013986e-06, - "loss": 0.3785, - "step": 41580 - }, - { - "epoch": 36.04, - "learning_rate": 1.1279020979020978e-06, - "loss": 0.3385, - "step": 41590 - }, - { - "epoch": 36.05, - "learning_rate": 1.1272027972027971e-06, - "loss": 0.3389, - "step": 41600 - }, - { - "epoch": 36.06, - "learning_rate": 1.1265034965034966e-06, - "loss": 0.3237, - "step": 41610 - }, - { - "epoch": 36.07, - "learning_rate": 1.1258041958041957e-06, - "loss": 0.3436, - "step": 41620 - }, - { - "epoch": 36.07, - "learning_rate": 1.1251048951048952e-06, - "loss": 0.3671, - "step": 41630 - }, - { - "epoch": 36.08, - "learning_rate": 1.1244055944055943e-06, - "loss": 0.4029, - "step": 41640 - }, - { - "epoch": 36.09, - "learning_rate": 1.1237062937062935e-06, - "loss": 0.3575, - "step": 41650 - }, - { - "epoch": 36.1, - "learning_rate": 1.123006993006993e-06, - "loss": 0.3549, - "step": 41660 - }, - { - "epoch": 36.11, - "learning_rate": 1.1223076923076921e-06, - "loss": 0.3174, - "step": 41670 - }, - { - "epoch": 36.12, - "learning_rate": 1.1216083916083916e-06, - "loss": 0.3726, - "step": 41680 - }, - { - "epoch": 36.13, - "learning_rate": 1.120909090909091e-06, - "loss": 0.3989, - "step": 41690 - }, - { - "epoch": 36.14, - "learning_rate": 1.1202097902097902e-06, - "loss": 0.3642, - "step": 41700 - }, - { - "epoch": 36.14, - "learning_rate": 1.1195104895104895e-06, - "loss": 0.3407, - "step": 41710 - }, - { - "epoch": 36.15, - "learning_rate": 1.1188111888111888e-06, - "loss": 0.3471, - "step": 41720 - }, - { - "epoch": 36.16, - "learning_rate": 1.118111888111888e-06, - "loss": 0.3973, - "step": 41730 - }, - { - "epoch": 36.17, - "learning_rate": 1.1174125874125873e-06, - "loss": 0.3655, - "step": 41740 - }, - { - "epoch": 36.18, - "learning_rate": 1.1167132867132866e-06, - "loss": 0.354, - "step": 41750 - }, - { - "epoch": 36.19, - "learning_rate": 1.116013986013986e-06, - "loss": 0.3486, - "step": 41760 - }, - { - "epoch": 36.2, - "learning_rate": 1.1153146853146854e-06, - "loss": 0.3796, - "step": 41770 - }, - { - "epoch": 36.2, - "learning_rate": 1.1146153846153845e-06, - "loss": 0.3631, - "step": 41780 - }, - { - "epoch": 36.21, - "learning_rate": 1.113916083916084e-06, - "loss": 0.3843, - "step": 41790 - }, - { - "epoch": 36.22, - "learning_rate": 1.113216783216783e-06, - "loss": 0.3272, - "step": 41800 - }, - { - "epoch": 36.23, - "learning_rate": 1.1125174825174825e-06, - "loss": 0.3259, - "step": 41810 - }, - { - "epoch": 36.24, - "learning_rate": 1.1118181818181818e-06, - "loss": 0.3588, - "step": 41820 - }, - { - "epoch": 36.25, - "learning_rate": 1.1111188811188809e-06, - "loss": 0.3609, - "step": 41830 - }, - { - "epoch": 36.26, - "learning_rate": 1.1104195804195804e-06, - "loss": 0.4064, - "step": 41840 - }, - { - "epoch": 36.27, - "learning_rate": 1.1097902097902096e-06, - "loss": 0.3674, - "step": 41850 - }, - { - "epoch": 36.27, - "learning_rate": 1.1090909090909091e-06, - "loss": 0.3626, - "step": 41860 - }, - { - "epoch": 36.28, - "learning_rate": 1.1083916083916082e-06, - "loss": 0.309, - "step": 41870 - }, - { - "epoch": 36.29, - "learning_rate": 1.1076923076923077e-06, - "loss": 0.3654, - "step": 41880 - }, - { - "epoch": 36.3, - "learning_rate": 1.106993006993007e-06, - "loss": 0.3853, - "step": 41890 - }, - { - "epoch": 36.31, - "learning_rate": 1.1062937062937063e-06, - "loss": 0.4294, - "step": 41900 - }, - { - "epoch": 36.32, - "learning_rate": 1.1055944055944056e-06, - "loss": 0.3728, - "step": 41910 - }, - { - "epoch": 36.33, - "learning_rate": 1.1048951048951046e-06, - "loss": 0.355, - "step": 41920 - }, - { - "epoch": 36.33, - "learning_rate": 1.1041958041958041e-06, - "loss": 0.3343, - "step": 41930 - }, - { - "epoch": 36.34, - "learning_rate": 1.1034965034965034e-06, - "loss": 0.3595, - "step": 41940 - }, - { - "epoch": 36.35, - "learning_rate": 1.1027972027972027e-06, - "loss": 0.3631, - "step": 41950 - }, - { - "epoch": 36.36, - "learning_rate": 1.102097902097902e-06, - "loss": 0.3551, - "step": 41960 - }, - { - "epoch": 36.37, - "learning_rate": 1.1013986013986015e-06, - "loss": 0.3313, - "step": 41970 - }, - { - "epoch": 36.38, - "learning_rate": 1.1006993006993006e-06, - "loss": 0.3695, - "step": 41980 - }, - { - "epoch": 36.39, - "learning_rate": 1.1e-06, - "loss": 0.3779, - "step": 41990 - }, - { - "epoch": 36.39, - "learning_rate": 1.0993006993006993e-06, - "loss": 0.3474, - "step": 42000 - }, - { - "epoch": 36.4, - "learning_rate": 1.0986013986013984e-06, - "loss": 0.3375, - "step": 42010 - }, - { - "epoch": 36.41, - "learning_rate": 1.097902097902098e-06, - "loss": 0.3587, - "step": 42020 - }, - { - "epoch": 36.42, - "learning_rate": 1.097202797202797e-06, - "loss": 0.366, - "step": 42030 - }, - { - "epoch": 36.43, - "learning_rate": 1.0965034965034965e-06, - "loss": 0.3674, - "step": 42040 - }, - { - "epoch": 36.44, - "learning_rate": 1.0958041958041958e-06, - "loss": 0.3443, - "step": 42050 - }, - { - "epoch": 36.45, - "learning_rate": 1.095104895104895e-06, - "loss": 0.3428, - "step": 42060 - }, - { - "epoch": 36.46, - "learning_rate": 1.0944055944055943e-06, - "loss": 0.3715, - "step": 42070 - }, - { - "epoch": 36.46, - "learning_rate": 1.0937062937062938e-06, - "loss": 0.3847, - "step": 42080 - }, - { - "epoch": 36.47, - "learning_rate": 1.093006993006993e-06, - "loss": 0.3805, - "step": 42090 - }, - { - "epoch": 36.48, - "learning_rate": 1.0923076923076922e-06, - "loss": 0.4727, - "step": 42100 - }, - { - "epoch": 36.49, - "learning_rate": 1.0916083916083915e-06, - "loss": 0.4032, - "step": 42110 - }, - { - "epoch": 36.5, - "learning_rate": 1.0909090909090908e-06, - "loss": 0.3729, - "step": 42120 - }, - { - "epoch": 36.51, - "learning_rate": 1.0902097902097903e-06, - "loss": 0.3935, - "step": 42130 - }, - { - "epoch": 36.52, - "learning_rate": 1.0895104895104893e-06, - "loss": 0.4142, - "step": 42140 - }, - { - "epoch": 36.52, - "learning_rate": 1.0888111888111888e-06, - "loss": 0.4086, - "step": 42150 - }, - { - "epoch": 36.53, - "learning_rate": 1.0881118881118881e-06, - "loss": 0.3511, - "step": 42160 - }, - { - "epoch": 36.54, - "learning_rate": 1.0874125874125874e-06, - "loss": 0.3229, - "step": 42170 - }, - { - "epoch": 36.55, - "learning_rate": 1.0867132867132867e-06, - "loss": 0.3741, - "step": 42180 - }, - { - "epoch": 36.56, - "learning_rate": 1.0860139860139858e-06, - "loss": 0.3672, - "step": 42190 - }, - { - "epoch": 36.57, - "learning_rate": 1.0853146853146853e-06, - "loss": 0.3957, - "step": 42200 - }, - { - "epoch": 36.58, - "learning_rate": 1.0846153846153845e-06, - "loss": 0.3929, - "step": 42210 - }, - { - "epoch": 36.59, - "learning_rate": 1.0839160839160838e-06, - "loss": 0.3221, - "step": 42220 - }, - { - "epoch": 36.59, - "learning_rate": 1.0832167832167831e-06, - "loss": 0.359, - "step": 42230 - }, - { - "epoch": 36.6, - "learning_rate": 1.0825174825174826e-06, - "loss": 0.31, - "step": 42240 - }, - { - "epoch": 36.61, - "learning_rate": 1.0818181818181817e-06, - "loss": 0.3487, - "step": 42250 - }, - { - "epoch": 36.62, - "learning_rate": 1.0811188811188812e-06, - "loss": 0.389, - "step": 42260 - }, - { - "epoch": 36.63, - "learning_rate": 1.0804195804195805e-06, - "loss": 0.3275, - "step": 42270 - }, - { - "epoch": 36.64, - "learning_rate": 1.0797202797202795e-06, - "loss": 0.3415, - "step": 42280 - }, - { - "epoch": 36.65, - "learning_rate": 1.079020979020979e-06, - "loss": 0.3731, - "step": 42290 - }, - { - "epoch": 36.65, - "learning_rate": 1.0783216783216781e-06, - "loss": 0.3501, - "step": 42300 - }, - { - "epoch": 36.66, - "learning_rate": 1.0776223776223776e-06, - "loss": 0.3296, - "step": 42310 - }, - { - "epoch": 36.67, - "learning_rate": 1.0769230769230769e-06, - "loss": 0.3729, - "step": 42320 - }, - { - "epoch": 36.68, - "learning_rate": 1.0762237762237762e-06, - "loss": 0.3756, - "step": 42330 - }, - { - "epoch": 36.69, - "learning_rate": 1.0755244755244755e-06, - "loss": 0.2828, - "step": 42340 - }, - { - "epoch": 36.7, - "learning_rate": 1.074825174825175e-06, - "loss": 0.3814, - "step": 42350 - }, - { - "epoch": 36.71, - "learning_rate": 1.074125874125874e-06, - "loss": 0.3449, - "step": 42360 - }, - { - "epoch": 36.72, - "learning_rate": 1.0734265734265733e-06, - "loss": 0.3393, - "step": 42370 - }, - { - "epoch": 36.72, - "learning_rate": 1.0727272727272726e-06, - "loss": 0.5535, - "step": 42380 - }, - { - "epoch": 36.73, - "learning_rate": 1.0720279720279719e-06, - "loss": 0.3223, - "step": 42390 - }, - { - "epoch": 36.74, - "learning_rate": 1.0713286713286714e-06, - "loss": 0.422, - "step": 42400 - }, - { - "epoch": 36.75, - "learning_rate": 1.0706293706293705e-06, - "loss": 0.3859, - "step": 42410 - }, - { - "epoch": 36.76, - "learning_rate": 1.06993006993007e-06, - "loss": 0.3511, - "step": 42420 - }, - { - "epoch": 36.77, - "learning_rate": 1.0692307692307692e-06, - "loss": 0.3707, - "step": 42430 - }, - { - "epoch": 36.78, - "learning_rate": 1.0685314685314685e-06, - "loss": 0.3629, - "step": 42440 - }, - { - "epoch": 36.78, - "learning_rate": 1.0678321678321678e-06, - "loss": 0.2954, - "step": 42450 - }, - { - "epoch": 36.79, - "learning_rate": 1.0671328671328669e-06, - "loss": 0.3542, - "step": 42460 - }, - { - "epoch": 36.8, - "learning_rate": 1.0664335664335664e-06, - "loss": 0.3539, - "step": 42470 - }, - { - "epoch": 36.81, - "learning_rate": 1.0657342657342657e-06, - "loss": 0.3929, - "step": 42480 - }, - { - "epoch": 36.82, - "learning_rate": 1.065034965034965e-06, - "loss": 0.4005, - "step": 42490 - }, - { - "epoch": 36.83, - "learning_rate": 1.0643356643356642e-06, - "loss": 0.3936, - "step": 42500 - }, - { - "epoch": 36.84, - "learning_rate": 1.0636363636363637e-06, - "loss": 0.3981, - "step": 42510 - }, - { - "epoch": 36.85, - "learning_rate": 1.0629370629370628e-06, - "loss": 0.3591, - "step": 42520 - }, - { - "epoch": 36.85, - "learning_rate": 1.0622377622377623e-06, - "loss": 0.3683, - "step": 42530 - }, - { - "epoch": 36.86, - "learning_rate": 1.0615384615384616e-06, - "loss": 0.3906, - "step": 42540 - }, - { - "epoch": 36.87, - "learning_rate": 1.0608391608391607e-06, - "loss": 0.3424, - "step": 42550 - }, - { - "epoch": 36.88, - "learning_rate": 1.0601398601398602e-06, - "loss": 0.4172, - "step": 42560 - }, - { - "epoch": 36.89, - "learning_rate": 1.0594405594405592e-06, - "loss": 0.2909, - "step": 42570 - }, - { - "epoch": 36.9, - "learning_rate": 1.0587412587412587e-06, - "loss": 0.3886, - "step": 42580 - }, - { - "epoch": 36.91, - "learning_rate": 1.058041958041958e-06, - "loss": 0.3914, - "step": 42590 - }, - { - "epoch": 36.91, - "learning_rate": 1.0573426573426573e-06, - "loss": 0.3627, - "step": 42600 - }, - { - "epoch": 36.92, - "learning_rate": 1.0566433566433566e-06, - "loss": 0.3297, - "step": 42610 - }, - { - "epoch": 36.93, - "learning_rate": 1.055944055944056e-06, - "loss": 0.4152, - "step": 42620 - }, - { - "epoch": 36.94, - "learning_rate": 1.0552447552447552e-06, - "loss": 0.3648, - "step": 42630 - }, - { - "epoch": 36.95, - "learning_rate": 1.0545454545454544e-06, - "loss": 0.3864, - "step": 42640 - }, - { - "epoch": 36.96, - "learning_rate": 1.0538461538461537e-06, - "loss": 0.345, - "step": 42650 - }, - { - "epoch": 36.97, - "learning_rate": 1.053146853146853e-06, - "loss": 0.3624, - "step": 42660 - }, - { - "epoch": 36.98, - "learning_rate": 1.0524475524475525e-06, - "loss": 0.3598, - "step": 42670 - }, - { - "epoch": 36.98, - "learning_rate": 1.0517482517482516e-06, - "loss": 0.3666, - "step": 42680 - }, - { - "epoch": 36.99, - "learning_rate": 1.051048951048951e-06, - "loss": 0.41, - "step": 42690 - }, - { - "epoch": 37.0, - "eval_loss": 0.5600542426109314, - "eval_runtime": 136.3308, - "eval_samples_per_second": 3.902, - "eval_steps_per_second": 1.951, - "eval_wer": 0.2506910072636112, - "step": 42698 - }, - { - "epoch": 37.0, - "learning_rate": 1.0503496503496504e-06, - "loss": 0.3753, - "step": 42700 - }, - { - "epoch": 37.01, - "learning_rate": 1.0496503496503496e-06, - "loss": 0.3875, - "step": 42710 - }, - { - "epoch": 37.02, - "learning_rate": 1.048951048951049e-06, - "loss": 0.3963, - "step": 42720 - }, - { - "epoch": 37.03, - "learning_rate": 1.0482517482517482e-06, - "loss": 0.3604, - "step": 42730 - }, - { - "epoch": 37.04, - "learning_rate": 1.0475524475524475e-06, - "loss": 0.4096, - "step": 42740 - }, - { - "epoch": 37.05, - "learning_rate": 1.0468531468531468e-06, - "loss": 0.3517, - "step": 42750 - }, - { - "epoch": 37.05, - "learning_rate": 1.046153846153846e-06, - "loss": 0.3432, - "step": 42760 - }, - { - "epoch": 37.06, - "learning_rate": 1.0454545454545454e-06, - "loss": 0.4349, - "step": 42770 - }, - { - "epoch": 37.07, - "learning_rate": 1.0447552447552449e-06, - "loss": 0.3735, - "step": 42780 - }, - { - "epoch": 37.08, - "learning_rate": 1.044055944055944e-06, - "loss": 0.407, - "step": 42790 - }, - { - "epoch": 37.09, - "learning_rate": 1.0433566433566434e-06, - "loss": 0.3428, - "step": 42800 - }, - { - "epoch": 37.1, - "learning_rate": 1.0426573426573427e-06, - "loss": 0.353, - "step": 42810 - }, - { - "epoch": 37.11, - "learning_rate": 1.0419580419580418e-06, - "loss": 0.3502, - "step": 42820 - }, - { - "epoch": 37.11, - "learning_rate": 1.0412587412587413e-06, - "loss": 0.3917, - "step": 42830 - }, - { - "epoch": 37.12, - "learning_rate": 1.0405594405594404e-06, - "loss": 0.4072, - "step": 42840 - }, - { - "epoch": 37.13, - "learning_rate": 1.0398601398601399e-06, - "loss": 0.3533, - "step": 42850 - }, - { - "epoch": 37.14, - "learning_rate": 1.0391608391608391e-06, - "loss": 0.3397, - "step": 42860 - }, - { - "epoch": 37.15, - "learning_rate": 1.0384615384615384e-06, - "loss": 0.394, - "step": 42870 - }, - { - "epoch": 37.16, - "learning_rate": 1.0377622377622377e-06, - "loss": 0.3791, - "step": 42880 - }, - { - "epoch": 37.17, - "learning_rate": 1.0370629370629372e-06, - "loss": 0.3509, - "step": 42890 - }, - { - "epoch": 37.17, - "learning_rate": 1.0363636363636363e-06, - "loss": 0.4394, - "step": 42900 - }, - { - "epoch": 37.18, - "learning_rate": 1.0356643356643356e-06, - "loss": 0.357, - "step": 42910 - }, - { - "epoch": 37.19, - "learning_rate": 1.034965034965035e-06, - "loss": 0.305, - "step": 42920 - }, - { - "epoch": 37.2, - "learning_rate": 1.0342657342657341e-06, - "loss": 0.3295, - "step": 42930 - }, - { - "epoch": 37.21, - "learning_rate": 1.0335664335664336e-06, - "loss": 0.4157, - "step": 42940 - }, - { - "epoch": 37.22, - "learning_rate": 1.0328671328671327e-06, - "loss": 0.386, - "step": 42950 - }, - { - "epoch": 37.23, - "learning_rate": 1.0321678321678322e-06, - "loss": 0.3664, - "step": 42960 - }, - { - "epoch": 37.24, - "learning_rate": 1.0314685314685315e-06, - "loss": 0.3553, - "step": 42970 - }, - { - "epoch": 37.24, - "learning_rate": 1.0307692307692306e-06, - "loss": 0.359, - "step": 42980 - }, - { - "epoch": 37.25, - "learning_rate": 1.03006993006993e-06, - "loss": 0.3668, - "step": 42990 - }, - { - "epoch": 37.26, - "learning_rate": 1.0293706293706293e-06, - "loss": 0.84, - "step": 43000 - }, - { - "epoch": 37.27, - "learning_rate": 1.0286713286713286e-06, - "loss": 0.4169, - "step": 43010 - }, - { - "epoch": 37.28, - "learning_rate": 1.027972027972028e-06, - "loss": 0.4215, - "step": 43020 - }, - { - "epoch": 37.29, - "learning_rate": 1.0272727272727272e-06, - "loss": 0.3693, - "step": 43030 - }, - { - "epoch": 37.3, - "learning_rate": 1.0265734265734265e-06, - "loss": 0.3395, - "step": 43040 - }, - { - "epoch": 37.3, - "learning_rate": 1.025874125874126e-06, - "loss": 0.3611, - "step": 43050 - }, - { - "epoch": 37.31, - "learning_rate": 1.025174825174825e-06, - "loss": 0.3396, - "step": 43060 - }, - { - "epoch": 37.32, - "learning_rate": 1.0244755244755243e-06, - "loss": 0.4121, - "step": 43070 - }, - { - "epoch": 37.33, - "learning_rate": 1.0237762237762238e-06, - "loss": 0.3261, - "step": 43080 - }, - { - "epoch": 37.34, - "learning_rate": 1.023076923076923e-06, - "loss": 0.3397, - "step": 43090 - }, - { - "epoch": 37.35, - "learning_rate": 1.0223776223776224e-06, - "loss": 0.2939, - "step": 43100 - }, - { - "epoch": 37.36, - "learning_rate": 1.0216783216783215e-06, - "loss": 0.3971, - "step": 43110 - }, - { - "epoch": 37.37, - "learning_rate": 1.020979020979021e-06, - "loss": 0.369, - "step": 43120 - }, - { - "epoch": 37.37, - "learning_rate": 1.0202797202797203e-06, - "loss": 0.367, - "step": 43130 - }, - { - "epoch": 37.38, - "learning_rate": 1.0195804195804195e-06, - "loss": 0.3512, - "step": 43140 - }, - { - "epoch": 37.39, - "learning_rate": 1.0188811188811188e-06, - "loss": 0.403, - "step": 43150 - }, - { - "epoch": 37.4, - "learning_rate": 1.0181818181818181e-06, - "loss": 0.3309, - "step": 43160 - }, - { - "epoch": 37.41, - "learning_rate": 1.0174825174825174e-06, - "loss": 0.3211, - "step": 43170 - }, - { - "epoch": 37.42, - "learning_rate": 1.0167832167832167e-06, - "loss": 0.3635, - "step": 43180 - }, - { - "epoch": 37.43, - "learning_rate": 1.0160839160839162e-06, - "loss": 0.3595, - "step": 43190 - }, - { - "epoch": 37.43, - "learning_rate": 1.0153846153846153e-06, - "loss": 0.3189, - "step": 43200 - }, - { - "epoch": 37.44, - "learning_rate": 1.0146853146853148e-06, - "loss": 0.3031, - "step": 43210 - }, - { - "epoch": 37.45, - "learning_rate": 1.0139860139860138e-06, - "loss": 0.3341, - "step": 43220 - }, - { - "epoch": 37.46, - "learning_rate": 1.0132867132867133e-06, - "loss": 0.3429, - "step": 43230 - }, - { - "epoch": 37.47, - "learning_rate": 1.0125874125874126e-06, - "loss": 0.3394, - "step": 43240 - }, - { - "epoch": 37.48, - "learning_rate": 1.0118881118881117e-06, - "loss": 0.3817, - "step": 43250 - }, - { - "epoch": 37.49, - "learning_rate": 1.0111888111888112e-06, - "loss": 0.3684, - "step": 43260 - }, - { - "epoch": 37.5, - "learning_rate": 1.0104895104895105e-06, - "loss": 0.3615, - "step": 43270 - }, - { - "epoch": 37.5, - "learning_rate": 1.0097902097902098e-06, - "loss": 0.364, - "step": 43280 - }, - { - "epoch": 37.51, - "learning_rate": 1.009090909090909e-06, - "loss": 0.44, - "step": 43290 - }, - { - "epoch": 37.52, - "learning_rate": 1.0083916083916083e-06, - "loss": 0.3402, - "step": 43300 - }, - { - "epoch": 37.53, - "learning_rate": 1.0076923076923076e-06, - "loss": 0.3225, - "step": 43310 - }, - { - "epoch": 37.54, - "learning_rate": 1.006993006993007e-06, - "loss": 0.3241, - "step": 43320 - }, - { - "epoch": 37.55, - "learning_rate": 1.0062937062937062e-06, - "loss": 0.3411, - "step": 43330 - }, - { - "epoch": 37.56, - "learning_rate": 1.0055944055944055e-06, - "loss": 0.35, - "step": 43340 - }, - { - "epoch": 37.56, - "learning_rate": 1.004895104895105e-06, - "loss": 0.3763, - "step": 43350 - }, - { - "epoch": 37.57, - "learning_rate": 1.004195804195804e-06, - "loss": 0.3327, - "step": 43360 - }, - { - "epoch": 37.58, - "learning_rate": 1.0034965034965035e-06, - "loss": 0.3849, - "step": 43370 - }, - { - "epoch": 37.59, - "learning_rate": 1.0027972027972026e-06, - "loss": 0.3767, - "step": 43380 - }, - { - "epoch": 37.6, - "learning_rate": 1.002097902097902e-06, - "loss": 0.4381, - "step": 43390 - }, - { - "epoch": 37.61, - "learning_rate": 1.0013986013986014e-06, - "loss": 0.4041, - "step": 43400 - }, - { - "epoch": 37.62, - "learning_rate": 1.0006993006993007e-06, - "loss": 0.3674, - "step": 43410 - }, - { - "epoch": 37.63, - "learning_rate": 1e-06, - "loss": 0.3349, - "step": 43420 - }, - { - "epoch": 37.63, - "learning_rate": 9.993006993006992e-07, - "loss": 0.344, - "step": 43430 - }, - { - "epoch": 37.64, - "learning_rate": 9.986013986013985e-07, - "loss": 0.3806, - "step": 43440 - }, - { - "epoch": 37.65, - "learning_rate": 9.979020979020978e-07, - "loss": 0.3198, - "step": 43450 - }, - { - "epoch": 37.66, - "learning_rate": 9.972027972027973e-07, - "loss": 0.3704, - "step": 43460 - }, - { - "epoch": 37.67, - "learning_rate": 9.965034965034964e-07, - "loss": 0.3334, - "step": 43470 - }, - { - "epoch": 37.68, - "learning_rate": 9.958041958041957e-07, - "loss": 0.3586, - "step": 43480 - }, - { - "epoch": 37.69, - "learning_rate": 9.95104895104895e-07, - "loss": 0.3963, - "step": 43490 - }, - { - "epoch": 37.69, - "learning_rate": 9.944055944055944e-07, - "loss": 0.3769, - "step": 43500 - }, - { - "epoch": 37.7, - "learning_rate": 9.937062937062937e-07, - "loss": 0.3593, - "step": 43510 - }, - { - "epoch": 37.71, - "learning_rate": 9.93006993006993e-07, - "loss": 0.3758, - "step": 43520 - }, - { - "epoch": 37.72, - "learning_rate": 9.923076923076923e-07, - "loss": 0.3967, - "step": 43530 - }, - { - "epoch": 37.73, - "learning_rate": 9.916083916083916e-07, - "loss": 0.3647, - "step": 43540 - }, - { - "epoch": 37.74, - "learning_rate": 9.909090909090909e-07, - "loss": 0.3461, - "step": 43550 - }, - { - "epoch": 37.75, - "learning_rate": 9.902097902097902e-07, - "loss": 0.3963, - "step": 43560 - }, - { - "epoch": 37.76, - "learning_rate": 9.895104895104894e-07, - "loss": 0.3842, - "step": 43570 - }, - { - "epoch": 37.76, - "learning_rate": 9.888111888111887e-07, - "loss": 0.3668, - "step": 43580 - }, - { - "epoch": 37.77, - "learning_rate": 9.88111888111888e-07, - "loss": 0.3835, - "step": 43590 - }, - { - "epoch": 37.78, - "learning_rate": 9.874125874125873e-07, - "loss": 0.3577, - "step": 43600 - }, - { - "epoch": 37.79, - "learning_rate": 9.867132867132866e-07, - "loss": 0.3185, - "step": 43610 - }, - { - "epoch": 37.8, - "learning_rate": 9.86013986013986e-07, - "loss": 0.3138, - "step": 43620 - }, - { - "epoch": 37.81, - "learning_rate": 9.853146853146854e-07, - "loss": 0.3538, - "step": 43630 - }, - { - "epoch": 37.82, - "learning_rate": 9.846153846153847e-07, - "loss": 0.3668, - "step": 43640 - }, - { - "epoch": 37.82, - "learning_rate": 9.839160839160837e-07, - "loss": 0.37, - "step": 43650 - }, - { - "epoch": 37.83, - "learning_rate": 9.832167832167832e-07, - "loss": 0.3803, - "step": 43660 - }, - { - "epoch": 37.84, - "learning_rate": 9.825174825174825e-07, - "loss": 0.3459, - "step": 43670 - }, - { - "epoch": 37.85, - "learning_rate": 9.818181818181818e-07, - "loss": 0.4266, - "step": 43680 - }, - { - "epoch": 37.86, - "learning_rate": 9.81118881118881e-07, - "loss": 0.3547, - "step": 43690 - }, - { - "epoch": 37.87, - "learning_rate": 9.804195804195804e-07, - "loss": 0.3848, - "step": 43700 - }, - { - "epoch": 37.88, - "learning_rate": 9.797202797202796e-07, - "loss": 0.3814, - "step": 43710 - }, - { - "epoch": 37.89, - "learning_rate": 9.79020979020979e-07, - "loss": 0.3339, - "step": 43720 - }, - { - "epoch": 37.89, - "learning_rate": 9.783216783216782e-07, - "loss": 0.3518, - "step": 43730 - }, - { - "epoch": 37.9, - "learning_rate": 9.776223776223775e-07, - "loss": 0.3501, - "step": 43740 - }, - { - "epoch": 37.91, - "learning_rate": 9.769230769230768e-07, - "loss": 0.4146, - "step": 43750 - }, - { - "epoch": 37.92, - "learning_rate": 9.76223776223776e-07, - "loss": 0.3855, - "step": 43760 - }, - { - "epoch": 37.93, - "learning_rate": 9.755244755244756e-07, - "loss": 0.3061, - "step": 43770 - }, - { - "epoch": 37.94, - "learning_rate": 9.748251748251749e-07, - "loss": 0.3929, - "step": 43780 - }, - { - "epoch": 37.95, - "learning_rate": 9.741258741258741e-07, - "loss": 0.3627, - "step": 43790 - }, - { - "epoch": 37.95, - "learning_rate": 9.734265734265734e-07, - "loss": 0.3824, - "step": 43800 - }, - { - "epoch": 37.96, - "learning_rate": 9.727272727272727e-07, - "loss": 0.3575, - "step": 43810 - }, - { - "epoch": 37.97, - "learning_rate": 9.72027972027972e-07, - "loss": 0.3515, - "step": 43820 - }, - { - "epoch": 37.98, - "learning_rate": 9.713286713286713e-07, - "loss": 0.3463, - "step": 43830 - }, - { - "epoch": 37.99, - "learning_rate": 9.706293706293706e-07, - "loss": 0.3723, - "step": 43840 - }, - { - "epoch": 38.0, - "learning_rate": 9.699300699300699e-07, - "loss": 0.3595, - "step": 43850 - }, - { - "epoch": 38.0, - "eval_loss": 0.5644901990890503, - "eval_runtime": 138.0216, - "eval_samples_per_second": 3.854, - "eval_steps_per_second": 1.927, - "eval_wer": 0.24252747959118082, - "step": 43852 - }, - { - "epoch": 38.01, - "learning_rate": 9.692307692307691e-07, - "loss": 0.3875, - "step": 43860 - }, - { - "epoch": 38.02, - "learning_rate": 9.685314685314684e-07, - "loss": 0.3265, - "step": 43870 - }, - { - "epoch": 38.02, - "learning_rate": 9.678321678321677e-07, - "loss": 0.3206, - "step": 43880 - }, - { - "epoch": 38.03, - "learning_rate": 9.671328671328672e-07, - "loss": 0.3687, - "step": 43890 - }, - { - "epoch": 38.04, - "learning_rate": 9.664335664335665e-07, - "loss": 0.3597, - "step": 43900 - }, - { - "epoch": 38.05, - "learning_rate": 9.657342657342656e-07, - "loss": 0.3749, - "step": 43910 - }, - { - "epoch": 38.06, - "learning_rate": 9.650349650349648e-07, - "loss": 0.4115, - "step": 43920 - }, - { - "epoch": 38.07, - "learning_rate": 9.643356643356643e-07, - "loss": 0.3816, - "step": 43930 - }, - { - "epoch": 38.08, - "learning_rate": 9.636363636363636e-07, - "loss": 0.3347, - "step": 43940 - }, - { - "epoch": 38.08, - "learning_rate": 9.62937062937063e-07, - "loss": 0.3663, - "step": 43950 - }, - { - "epoch": 38.09, - "learning_rate": 9.622377622377622e-07, - "loss": 0.3175, - "step": 43960 - }, - { - "epoch": 38.1, - "learning_rate": 9.615384615384615e-07, - "loss": 0.4146, - "step": 43970 - }, - { - "epoch": 38.11, - "learning_rate": 9.608391608391608e-07, - "loss": 0.3256, - "step": 43980 - }, - { - "epoch": 38.12, - "learning_rate": 9.6013986013986e-07, - "loss": 0.3867, - "step": 43990 - }, - { - "epoch": 38.13, - "learning_rate": 9.594405594405593e-07, - "loss": 0.3616, - "step": 44000 - }, - { - "epoch": 38.14, - "learning_rate": 9.587412587412586e-07, - "loss": 0.382, - "step": 44010 - }, - { - "epoch": 38.15, - "learning_rate": 9.58041958041958e-07, - "loss": 0.368, - "step": 44020 - }, - { - "epoch": 38.15, - "learning_rate": 9.573426573426572e-07, - "loss": 0.387, - "step": 44030 - }, - { - "epoch": 38.16, - "learning_rate": 9.566433566433567e-07, - "loss": 0.3909, - "step": 44040 - }, - { - "epoch": 38.17, - "learning_rate": 9.55944055944056e-07, - "loss": 0.3383, - "step": 44050 - }, - { - "epoch": 38.18, - "learning_rate": 9.552447552447553e-07, - "loss": 0.338, - "step": 44060 - }, - { - "epoch": 38.19, - "learning_rate": 9.545454545454546e-07, - "loss": 0.3665, - "step": 44070 - }, - { - "epoch": 38.2, - "learning_rate": 9.538461538461538e-07, - "loss": 0.3143, - "step": 44080 - }, - { - "epoch": 38.21, - "learning_rate": 9.53146853146853e-07, - "loss": 0.357, - "step": 44090 - }, - { - "epoch": 38.21, - "learning_rate": 9.524475524475524e-07, - "loss": 0.361, - "step": 44100 - }, - { - "epoch": 38.22, - "learning_rate": 9.517482517482517e-07, - "loss": 0.3403, - "step": 44110 - }, - { - "epoch": 38.23, - "learning_rate": 9.51048951048951e-07, - "loss": 0.4304, - "step": 44120 - }, - { - "epoch": 38.24, - "learning_rate": 9.503496503496503e-07, - "loss": 0.3789, - "step": 44130 - }, - { - "epoch": 38.25, - "learning_rate": 9.496503496503497e-07, - "loss": 0.4432, - "step": 44140 - }, - { - "epoch": 38.26, - "learning_rate": 9.489510489510489e-07, - "loss": 0.3962, - "step": 44150 - }, - { - "epoch": 38.27, - "learning_rate": 9.482517482517482e-07, - "loss": 0.3889, - "step": 44160 - }, - { - "epoch": 38.28, - "learning_rate": 9.475524475524476e-07, - "loss": 0.3886, - "step": 44170 - }, - { - "epoch": 38.28, - "learning_rate": 9.468531468531468e-07, - "loss": 0.3698, - "step": 44180 - }, - { - "epoch": 38.29, - "learning_rate": 9.461538461538461e-07, - "loss": 0.363, - "step": 44190 - }, - { - "epoch": 38.3, - "learning_rate": 9.454545454545454e-07, - "loss": 0.3795, - "step": 44200 - }, - { - "epoch": 38.31, - "learning_rate": 9.447552447552448e-07, - "loss": 0.3191, - "step": 44210 - }, - { - "epoch": 38.32, - "learning_rate": 9.44055944055944e-07, - "loss": 0.3204, - "step": 44220 - }, - { - "epoch": 38.33, - "learning_rate": 9.433566433566433e-07, - "loss": 0.3443, - "step": 44230 - }, - { - "epoch": 38.34, - "learning_rate": 9.426573426573426e-07, - "loss": 0.3001, - "step": 44240 - }, - { - "epoch": 38.34, - "learning_rate": 9.41958041958042e-07, - "loss": 0.3616, - "step": 44250 - }, - { - "epoch": 38.35, - "learning_rate": 9.412587412587412e-07, - "loss": 0.3068, - "step": 44260 - }, - { - "epoch": 38.36, - "learning_rate": 9.405594405594405e-07, - "loss": 0.3636, - "step": 44270 - }, - { - "epoch": 38.37, - "learning_rate": 9.398601398601398e-07, - "loss": 0.3701, - "step": 44280 - }, - { - "epoch": 38.38, - "learning_rate": 9.391608391608391e-07, - "loss": 0.3862, - "step": 44290 - }, - { - "epoch": 38.39, - "learning_rate": 9.384615384615384e-07, - "loss": 0.4033, - "step": 44300 - }, - { - "epoch": 38.4, - "learning_rate": 9.377622377622377e-07, - "loss": 0.3917, - "step": 44310 - }, - { - "epoch": 38.41, - "learning_rate": 9.37062937062937e-07, - "loss": 0.3281, - "step": 44320 - }, - { - "epoch": 38.41, - "learning_rate": 9.363636363636364e-07, - "loss": 0.3073, - "step": 44330 - }, - { - "epoch": 38.42, - "learning_rate": 9.356643356643357e-07, - "loss": 0.3964, - "step": 44340 - }, - { - "epoch": 38.43, - "learning_rate": 9.349650349650349e-07, - "loss": 0.3475, - "step": 44350 - }, - { - "epoch": 38.44, - "learning_rate": 9.342657342657341e-07, - "loss": 0.3904, - "step": 44360 - }, - { - "epoch": 38.45, - "learning_rate": 9.335664335664335e-07, - "loss": 0.3616, - "step": 44370 - }, - { - "epoch": 38.46, - "learning_rate": 9.328671328671328e-07, - "loss": 0.3734, - "step": 44380 - }, - { - "epoch": 38.47, - "learning_rate": 9.321678321678321e-07, - "loss": 0.3758, - "step": 44390 - }, - { - "epoch": 38.47, - "learning_rate": 9.314685314685314e-07, - "loss": 0.3554, - "step": 44400 - }, - { - "epoch": 38.48, - "learning_rate": 9.307692307692308e-07, - "loss": 0.3412, - "step": 44410 - }, - { - "epoch": 38.49, - "learning_rate": 9.300699300699301e-07, - "loss": 0.3786, - "step": 44420 - }, - { - "epoch": 38.5, - "learning_rate": 9.293706293706293e-07, - "loss": 0.329, - "step": 44430 - }, - { - "epoch": 38.51, - "learning_rate": 9.286713286713286e-07, - "loss": 0.3826, - "step": 44440 - }, - { - "epoch": 38.52, - "learning_rate": 9.279720279720279e-07, - "loss": 0.382, - "step": 44450 - }, - { - "epoch": 38.53, - "learning_rate": 9.272727272727272e-07, - "loss": 0.345, - "step": 44460 - }, - { - "epoch": 38.54, - "learning_rate": 9.265734265734265e-07, - "loss": 0.4207, - "step": 44470 - }, - { - "epoch": 38.54, - "learning_rate": 9.258741258741259e-07, - "loss": 0.3646, - "step": 44480 - }, - { - "epoch": 38.55, - "learning_rate": 9.251748251748252e-07, - "loss": 0.3903, - "step": 44490 - }, - { - "epoch": 38.56, - "learning_rate": 9.244755244755244e-07, - "loss": 0.3991, - "step": 44500 - }, - { - "epoch": 38.57, - "learning_rate": 9.237762237762237e-07, - "loss": 0.3537, - "step": 44510 - }, - { - "epoch": 38.58, - "learning_rate": 9.230769230769231e-07, - "loss": 0.355, - "step": 44520 - }, - { - "epoch": 38.59, - "learning_rate": 9.223776223776223e-07, - "loss": 0.3738, - "step": 44530 - }, - { - "epoch": 38.6, - "learning_rate": 9.216783216783216e-07, - "loss": 0.3995, - "step": 44540 - }, - { - "epoch": 38.6, - "learning_rate": 9.209790209790209e-07, - "loss": 0.3621, - "step": 44550 - }, - { - "epoch": 38.61, - "learning_rate": 9.202797202797203e-07, - "loss": 0.3447, - "step": 44560 - }, - { - "epoch": 38.62, - "learning_rate": 9.195804195804196e-07, - "loss": 0.3588, - "step": 44570 - }, - { - "epoch": 38.63, - "learning_rate": 9.188811188811188e-07, - "loss": 0.3549, - "step": 44580 - }, - { - "epoch": 38.64, - "learning_rate": 9.181818181818181e-07, - "loss": 0.3609, - "step": 44590 - }, - { - "epoch": 38.65, - "learning_rate": 9.174825174825175e-07, - "loss": 0.3788, - "step": 44600 - }, - { - "epoch": 38.66, - "learning_rate": 9.167832167832168e-07, - "loss": 0.3588, - "step": 44610 - }, - { - "epoch": 38.67, - "learning_rate": 9.16083916083916e-07, - "loss": 0.3362, - "step": 44620 - }, - { - "epoch": 38.67, - "learning_rate": 9.153846153846153e-07, - "loss": 0.3101, - "step": 44630 - }, - { - "epoch": 38.68, - "learning_rate": 9.146853146853147e-07, - "loss": 0.3447, - "step": 44640 - }, - { - "epoch": 38.69, - "learning_rate": 9.139860139860139e-07, - "loss": 0.4118, - "step": 44650 - }, - { - "epoch": 38.7, - "learning_rate": 9.132867132867132e-07, - "loss": 0.3416, - "step": 44660 - }, - { - "epoch": 38.71, - "learning_rate": 9.125874125874126e-07, - "loss": 0.324, - "step": 44670 - }, - { - "epoch": 38.72, - "learning_rate": 9.118881118881119e-07, - "loss": 0.2899, - "step": 44680 - }, - { - "epoch": 38.73, - "learning_rate": 9.111888111888112e-07, - "loss": 0.4077, - "step": 44690 - }, - { - "epoch": 38.73, - "learning_rate": 9.104895104895104e-07, - "loss": 0.3471, - "step": 44700 - }, - { - "epoch": 38.74, - "learning_rate": 9.097902097902098e-07, - "loss": 0.4073, - "step": 44710 - }, - { - "epoch": 38.75, - "learning_rate": 9.09090909090909e-07, - "loss": 0.3735, - "step": 44720 - }, - { - "epoch": 38.76, - "learning_rate": 9.083916083916083e-07, - "loss": 0.383, - "step": 44730 - }, - { - "epoch": 38.77, - "learning_rate": 9.076923076923076e-07, - "loss": 0.3692, - "step": 44740 - }, - { - "epoch": 38.78, - "learning_rate": 9.06993006993007e-07, - "loss": 0.3726, - "step": 44750 - }, - { - "epoch": 38.79, - "learning_rate": 9.062937062937063e-07, - "loss": 0.419, - "step": 44760 - }, - { - "epoch": 38.8, - "learning_rate": 9.055944055944056e-07, - "loss": 0.3219, - "step": 44770 - }, - { - "epoch": 38.8, - "learning_rate": 9.048951048951049e-07, - "loss": 0.333, - "step": 44780 - }, - { - "epoch": 38.81, - "learning_rate": 9.041958041958041e-07, - "loss": 0.3529, - "step": 44790 - }, - { - "epoch": 38.82, - "learning_rate": 9.034965034965034e-07, - "loss": 0.3975, - "step": 44800 - }, - { - "epoch": 38.83, - "learning_rate": 9.027972027972027e-07, - "loss": 0.3833, - "step": 44810 - }, - { - "epoch": 38.84, - "learning_rate": 9.02097902097902e-07, - "loss": 0.3765, - "step": 44820 - }, - { - "epoch": 38.85, - "learning_rate": 9.013986013986014e-07, - "loss": 0.3236, - "step": 44830 - }, - { - "epoch": 38.86, - "learning_rate": 9.006993006993007e-07, - "loss": 0.3945, - "step": 44840 - }, - { - "epoch": 38.86, - "learning_rate": 9e-07, - "loss": 0.3876, - "step": 44850 - }, - { - "epoch": 38.87, - "learning_rate": 8.993006993006992e-07, - "loss": 0.3197, - "step": 44860 - }, - { - "epoch": 38.88, - "learning_rate": 8.986013986013986e-07, - "loss": 0.3528, - "step": 44870 - }, - { - "epoch": 38.89, - "learning_rate": 8.979020979020978e-07, - "loss": 0.3329, - "step": 44880 - }, - { - "epoch": 38.9, - "learning_rate": 8.972027972027971e-07, - "loss": 0.378, - "step": 44890 - }, - { - "epoch": 38.91, - "learning_rate": 8.965034965034964e-07, - "loss": 0.3684, - "step": 44900 - }, - { - "epoch": 38.92, - "learning_rate": 8.958041958041958e-07, - "loss": 0.3379, - "step": 44910 - }, - { - "epoch": 38.93, - "learning_rate": 8.951048951048951e-07, - "loss": 0.4082, - "step": 44920 - }, - { - "epoch": 38.93, - "learning_rate": 8.944055944055943e-07, - "loss": 0.4096, - "step": 44930 - }, - { - "epoch": 38.94, - "learning_rate": 8.937062937062937e-07, - "loss": 0.3939, - "step": 44940 - }, - { - "epoch": 38.95, - "learning_rate": 8.93006993006993e-07, - "loss": 0.3941, - "step": 44950 - }, - { - "epoch": 38.96, - "learning_rate": 8.923076923076923e-07, - "loss": 0.3486, - "step": 44960 - }, - { - "epoch": 38.97, - "learning_rate": 8.916083916083915e-07, - "loss": 0.365, - "step": 44970 - }, - { - "epoch": 38.98, - "learning_rate": 8.909090909090909e-07, - "loss": 0.3748, - "step": 44980 - }, - { - "epoch": 38.99, - "learning_rate": 8.902097902097902e-07, - "loss": 0.3601, - "step": 44990 - }, - { - "epoch": 38.99, - "learning_rate": 8.895104895104894e-07, - "loss": 0.4174, - "step": 45000 - }, - { - "epoch": 39.0, - "eval_loss": 0.5560790300369263, - "eval_runtime": 134.861, - "eval_samples_per_second": 3.945, - "eval_steps_per_second": 1.972, - "eval_wer": 0.2422060808639198, - "step": 45006 - }, - { - "epoch": 39.0, - "learning_rate": 8.888111888111887e-07, - "loss": 0.3254, - "step": 45010 - }, - { - "epoch": 39.01, - "learning_rate": 8.881118881118881e-07, - "loss": 0.3612, - "step": 45020 - }, - { - "epoch": 39.02, - "learning_rate": 8.874125874125874e-07, - "loss": 0.3244, - "step": 45030 - }, - { - "epoch": 39.03, - "learning_rate": 8.867132867132867e-07, - "loss": 0.3464, - "step": 45040 - }, - { - "epoch": 39.04, - "learning_rate": 8.86013986013986e-07, - "loss": 0.3929, - "step": 45050 - }, - { - "epoch": 39.05, - "learning_rate": 8.853146853146853e-07, - "loss": 0.3325, - "step": 45060 - }, - { - "epoch": 39.06, - "learning_rate": 8.846153846153846e-07, - "loss": 0.3727, - "step": 45070 - }, - { - "epoch": 39.06, - "learning_rate": 8.839160839160838e-07, - "loss": 0.3336, - "step": 45080 - }, - { - "epoch": 39.07, - "learning_rate": 8.832167832167831e-07, - "loss": 0.365, - "step": 45090 - }, - { - "epoch": 39.08, - "learning_rate": 8.825174825174825e-07, - "loss": 0.3776, - "step": 45100 - }, - { - "epoch": 39.09, - "learning_rate": 8.818181818181818e-07, - "loss": 0.3349, - "step": 45110 - }, - { - "epoch": 39.1, - "learning_rate": 8.811188811188811e-07, - "loss": 0.3766, - "step": 45120 - }, - { - "epoch": 39.11, - "learning_rate": 8.804195804195805e-07, - "loss": 0.3304, - "step": 45130 - }, - { - "epoch": 39.12, - "learning_rate": 8.797202797202798e-07, - "loss": 0.3559, - "step": 45140 - }, - { - "epoch": 39.12, - "learning_rate": 8.790209790209789e-07, - "loss": 0.3789, - "step": 45150 - }, - { - "epoch": 39.13, - "learning_rate": 8.783216783216782e-07, - "loss": 0.3489, - "step": 45160 - }, - { - "epoch": 39.14, - "learning_rate": 8.776223776223776e-07, - "loss": 0.3391, - "step": 45170 - }, - { - "epoch": 39.15, - "learning_rate": 8.769230769230769e-07, - "loss": 0.3677, - "step": 45180 - }, - { - "epoch": 39.16, - "learning_rate": 8.762237762237762e-07, - "loss": 0.3268, - "step": 45190 - }, - { - "epoch": 39.17, - "learning_rate": 8.755244755244755e-07, - "loss": 0.3579, - "step": 45200 - }, - { - "epoch": 39.18, - "learning_rate": 8.748251748251749e-07, - "loss": 0.3822, - "step": 45210 - }, - { - "epoch": 39.19, - "learning_rate": 8.741258741258741e-07, - "loss": 0.3721, - "step": 45220 - }, - { - "epoch": 39.19, - "learning_rate": 8.734265734265733e-07, - "loss": 0.3749, - "step": 45230 - }, - { - "epoch": 39.2, - "learning_rate": 8.727272727272726e-07, - "loss": 0.3774, - "step": 45240 - }, - { - "epoch": 39.21, - "learning_rate": 8.72027972027972e-07, - "loss": 0.4054, - "step": 45250 - }, - { - "epoch": 39.22, - "learning_rate": 8.713286713286713e-07, - "loss": 0.3563, - "step": 45260 - }, - { - "epoch": 39.23, - "learning_rate": 8.706293706293706e-07, - "loss": 0.3177, - "step": 45270 - }, - { - "epoch": 39.24, - "learning_rate": 8.699300699300699e-07, - "loss": 0.3767, - "step": 45280 - }, - { - "epoch": 39.25, - "learning_rate": 8.692307692307692e-07, - "loss": 0.3558, - "step": 45290 - }, - { - "epoch": 39.25, - "learning_rate": 8.685314685314685e-07, - "loss": 0.367, - "step": 45300 - }, - { - "epoch": 39.26, - "learning_rate": 8.678321678321678e-07, - "loss": 0.3671, - "step": 45310 - }, - { - "epoch": 39.27, - "learning_rate": 8.67132867132867e-07, - "loss": 0.3949, - "step": 45320 - }, - { - "epoch": 39.28, - "learning_rate": 8.664335664335664e-07, - "loss": 0.3387, - "step": 45330 - }, - { - "epoch": 39.29, - "learning_rate": 8.657342657342657e-07, - "loss": 0.3181, - "step": 45340 - }, - { - "epoch": 39.3, - "learning_rate": 8.65034965034965e-07, - "loss": 0.4401, - "step": 45350 - }, - { - "epoch": 39.31, - "learning_rate": 8.644055944055943e-07, - "loss": 1.004, - "step": 45360 - }, - { - "epoch": 39.32, - "learning_rate": 8.637062937062937e-07, - "loss": 0.3415, - "step": 45370 - }, - { - "epoch": 39.32, - "learning_rate": 8.63006993006993e-07, - "loss": 0.3209, - "step": 45380 - }, - { - "epoch": 39.33, - "learning_rate": 8.623076923076923e-07, - "loss": 0.3658, - "step": 45390 - }, - { - "epoch": 39.34, - "learning_rate": 8.616083916083916e-07, - "loss": 0.3934, - "step": 45400 - }, - { - "epoch": 39.35, - "learning_rate": 8.60909090909091e-07, - "loss": 0.3391, - "step": 45410 - }, - { - "epoch": 39.36, - "learning_rate": 8.602097902097901e-07, - "loss": 0.3803, - "step": 45420 - }, - { - "epoch": 39.37, - "learning_rate": 8.595104895104894e-07, - "loss": 0.3205, - "step": 45430 - }, - { - "epoch": 39.38, - "learning_rate": 8.588111888111887e-07, - "loss": 0.3482, - "step": 45440 - }, - { - "epoch": 39.38, - "learning_rate": 8.581118881118881e-07, - "loss": 0.327, - "step": 45450 - }, - { - "epoch": 39.39, - "learning_rate": 8.574125874125874e-07, - "loss": 0.3618, - "step": 45460 - }, - { - "epoch": 39.4, - "learning_rate": 8.567132867132867e-07, - "loss": 0.2993, - "step": 45470 - }, - { - "epoch": 39.41, - "learning_rate": 8.56013986013986e-07, - "loss": 0.3172, - "step": 45480 - }, - { - "epoch": 39.42, - "learning_rate": 8.553146853146853e-07, - "loss": 0.3522, - "step": 45490 - }, - { - "epoch": 39.43, - "learning_rate": 8.546153846153846e-07, - "loss": 0.4131, - "step": 45500 - }, - { - "epoch": 39.44, - "learning_rate": 8.539160839160838e-07, - "loss": 0.3244, - "step": 45510 - }, - { - "epoch": 39.45, - "learning_rate": 8.532167832167831e-07, - "loss": 0.4001, - "step": 45520 - }, - { - "epoch": 39.45, - "learning_rate": 8.525174825174825e-07, - "loss": 0.3875, - "step": 45530 - }, - { - "epoch": 39.46, - "learning_rate": 8.518181818181818e-07, - "loss": 0.3784, - "step": 45540 - }, - { - "epoch": 39.47, - "learning_rate": 8.51118881118881e-07, - "loss": 0.3371, - "step": 45550 - }, - { - "epoch": 39.48, - "learning_rate": 8.504195804195804e-07, - "loss": 0.3874, - "step": 45560 - }, - { - "epoch": 39.49, - "learning_rate": 8.497202797202797e-07, - "loss": 0.4045, - "step": 45570 - }, - { - "epoch": 39.5, - "learning_rate": 8.49020979020979e-07, - "loss": 0.3472, - "step": 45580 - }, - { - "epoch": 39.51, - "learning_rate": 8.483216783216783e-07, - "loss": 0.3323, - "step": 45590 - }, - { - "epoch": 39.51, - "learning_rate": 8.476223776223776e-07, - "loss": 0.3584, - "step": 45600 - }, - { - "epoch": 39.52, - "learning_rate": 8.469230769230769e-07, - "loss": 0.3508, - "step": 45610 - }, - { - "epoch": 39.53, - "learning_rate": 8.462237762237762e-07, - "loss": 0.3475, - "step": 45620 - }, - { - "epoch": 39.54, - "learning_rate": 8.455244755244754e-07, - "loss": 0.3261, - "step": 45630 - }, - { - "epoch": 39.55, - "learning_rate": 8.448251748251748e-07, - "loss": 0.3484, - "step": 45640 - }, - { - "epoch": 39.56, - "learning_rate": 8.441258741258741e-07, - "loss": 0.3232, - "step": 45650 - }, - { - "epoch": 39.57, - "learning_rate": 8.434265734265734e-07, - "loss": 0.3817, - "step": 45660 - }, - { - "epoch": 39.58, - "learning_rate": 8.427272727272727e-07, - "loss": 0.3977, - "step": 45670 - }, - { - "epoch": 39.58, - "learning_rate": 8.420279720279721e-07, - "loss": 0.3844, - "step": 45680 - }, - { - "epoch": 39.59, - "learning_rate": 8.413286713286713e-07, - "loss": 0.4122, - "step": 45690 - }, - { - "epoch": 39.6, - "learning_rate": 8.406293706293705e-07, - "loss": 0.3463, - "step": 45700 - }, - { - "epoch": 39.61, - "learning_rate": 8.399300699300698e-07, - "loss": 0.3676, - "step": 45710 - }, - { - "epoch": 39.62, - "learning_rate": 8.392307692307692e-07, - "loss": 0.3153, - "step": 45720 - }, - { - "epoch": 39.63, - "learning_rate": 8.385314685314685e-07, - "loss": 0.3782, - "step": 45730 - }, - { - "epoch": 39.64, - "learning_rate": 8.378321678321678e-07, - "loss": 0.3946, - "step": 45740 - }, - { - "epoch": 39.64, - "learning_rate": 8.371328671328672e-07, - "loss": 0.337, - "step": 45750 - }, - { - "epoch": 39.65, - "learning_rate": 8.364335664335665e-07, - "loss": 0.343, - "step": 45760 - }, - { - "epoch": 39.66, - "learning_rate": 8.357342657342656e-07, - "loss": 0.4086, - "step": 45770 - }, - { - "epoch": 39.67, - "learning_rate": 8.350349650349649e-07, - "loss": 0.3289, - "step": 45780 - }, - { - "epoch": 39.68, - "learning_rate": 8.343356643356643e-07, - "loss": 0.3764, - "step": 45790 - }, - { - "epoch": 39.69, - "learning_rate": 8.336363636363636e-07, - "loss": 0.4078, - "step": 45800 - }, - { - "epoch": 39.7, - "learning_rate": 8.329370629370629e-07, - "loss": 0.3649, - "step": 45810 - }, - { - "epoch": 39.71, - "learning_rate": 8.322377622377622e-07, - "loss": 0.3192, - "step": 45820 - }, - { - "epoch": 39.71, - "learning_rate": 8.315384615384616e-07, - "loss": 0.3186, - "step": 45830 - }, - { - "epoch": 39.72, - "learning_rate": 8.308391608391609e-07, - "loss": 0.3843, - "step": 45840 - }, - { - "epoch": 39.73, - "learning_rate": 8.301398601398601e-07, - "loss": 0.4289, - "step": 45850 - }, - { - "epoch": 39.74, - "learning_rate": 8.294405594405593e-07, - "loss": 0.3832, - "step": 45860 - }, - { - "epoch": 39.75, - "learning_rate": 8.287412587412587e-07, - "loss": 0.3709, - "step": 45870 - }, - { - "epoch": 39.76, - "learning_rate": 8.28041958041958e-07, - "loss": 0.3485, - "step": 45880 - }, - { - "epoch": 39.77, - "learning_rate": 8.273426573426573e-07, - "loss": 0.4107, - "step": 45890 - }, - { - "epoch": 39.77, - "learning_rate": 8.266433566433566e-07, - "loss": 0.3506, - "step": 45900 - }, - { - "epoch": 39.78, - "learning_rate": 8.25944055944056e-07, - "loss": 0.3926, - "step": 45910 - }, - { - "epoch": 39.79, - "learning_rate": 8.252447552447552e-07, - "loss": 0.3188, - "step": 45920 - }, - { - "epoch": 39.8, - "learning_rate": 8.245454545454545e-07, - "loss": 0.3841, - "step": 45930 - }, - { - "epoch": 39.81, - "learning_rate": 8.238461538461538e-07, - "loss": 0.33, - "step": 45940 - }, - { - "epoch": 39.82, - "learning_rate": 8.231468531468531e-07, - "loss": 0.4078, - "step": 45950 - }, - { - "epoch": 39.83, - "learning_rate": 8.224475524475524e-07, - "loss": 0.3734, - "step": 45960 - }, - { - "epoch": 39.83, - "learning_rate": 8.217482517482517e-07, - "loss": 0.433, - "step": 45970 - }, - { - "epoch": 39.84, - "learning_rate": 8.21048951048951e-07, - "loss": 0.3371, - "step": 45980 - }, - { - "epoch": 39.85, - "learning_rate": 8.203496503496503e-07, - "loss": 0.3286, - "step": 45990 - }, - { - "epoch": 39.86, - "learning_rate": 8.196503496503496e-07, - "loss": 0.3165, - "step": 46000 - }, - { - "epoch": 39.87, - "learning_rate": 8.189510489510489e-07, - "loss": 0.3681, - "step": 46010 - }, - { - "epoch": 39.88, - "learning_rate": 8.182517482517483e-07, - "loss": 0.4005, - "step": 46020 - }, - { - "epoch": 39.89, - "learning_rate": 8.175524475524476e-07, - "loss": 0.3461, - "step": 46030 - }, - { - "epoch": 39.9, - "learning_rate": 8.168531468531468e-07, - "loss": 0.3826, - "step": 46040 - }, - { - "epoch": 39.9, - "learning_rate": 8.16153846153846e-07, - "loss": 0.3303, - "step": 46050 - }, - { - "epoch": 39.91, - "learning_rate": 8.154545454545454e-07, - "loss": 0.3725, - "step": 46060 - }, - { - "epoch": 39.92, - "learning_rate": 8.147552447552447e-07, - "loss": 0.3333, - "step": 46070 - }, - { - "epoch": 39.93, - "learning_rate": 8.14055944055944e-07, - "loss": 0.3256, - "step": 46080 - }, - { - "epoch": 39.94, - "learning_rate": 8.133566433566433e-07, - "loss": 0.3596, - "step": 46090 - }, - { - "epoch": 39.95, - "learning_rate": 8.126573426573427e-07, - "loss": 0.3749, - "step": 46100 - }, - { - "epoch": 39.96, - "learning_rate": 8.11958041958042e-07, - "loss": 0.3801, - "step": 46110 - }, - { - "epoch": 39.96, - "learning_rate": 8.112587412587413e-07, - "loss": 0.3549, - "step": 46120 - }, - { - "epoch": 39.97, - "learning_rate": 8.105594405594404e-07, - "loss": 0.2963, - "step": 46130 - }, - { - "epoch": 39.98, - "learning_rate": 8.098601398601398e-07, - "loss": 0.3943, - "step": 46140 - }, - { - "epoch": 39.99, - "learning_rate": 8.091608391608391e-07, - "loss": 0.4128, - "step": 46150 - }, - { - "epoch": 40.0, - "learning_rate": 8.084615384615384e-07, - "loss": 0.3801, - "step": 46160 - }, - { - "epoch": 40.0, - "eval_loss": 0.555422306060791, - "eval_runtime": 135.1325, - "eval_samples_per_second": 3.937, - "eval_steps_per_second": 1.968, - "eval_wer": 0.24265603908208525, - "step": 46160 - }, - { - "epoch": 40.01, - "learning_rate": 8.077622377622377e-07, - "loss": 0.3376, - "step": 46170 - }, - { - "epoch": 40.02, - "learning_rate": 8.070629370629371e-07, - "loss": 0.3705, - "step": 46180 - }, - { - "epoch": 40.03, - "learning_rate": 8.063636363636364e-07, - "loss": 0.3501, - "step": 46190 - }, - { - "epoch": 40.03, - "learning_rate": 8.056643356643356e-07, - "loss": 0.3822, - "step": 46200 - }, - { - "epoch": 40.04, - "learning_rate": 8.049650349650349e-07, - "loss": 0.4096, - "step": 46210 - }, - { - "epoch": 40.05, - "learning_rate": 8.042657342657342e-07, - "loss": 0.3671, - "step": 46220 - }, - { - "epoch": 40.06, - "learning_rate": 8.035664335664335e-07, - "loss": 0.3587, - "step": 46230 - }, - { - "epoch": 40.07, - "learning_rate": 8.028671328671328e-07, - "loss": 0.3556, - "step": 46240 - }, - { - "epoch": 40.08, - "learning_rate": 8.021678321678321e-07, - "loss": 0.3804, - "step": 46250 - }, - { - "epoch": 40.09, - "learning_rate": 8.014685314685315e-07, - "loss": 0.3352, - "step": 46260 - }, - { - "epoch": 40.1, - "learning_rate": 8.007692307692308e-07, - "loss": 0.3717, - "step": 46270 - }, - { - "epoch": 40.1, - "learning_rate": 8.0006993006993e-07, - "loss": 0.3979, - "step": 46280 - }, - { - "epoch": 40.11, - "learning_rate": 7.993706293706294e-07, - "loss": 0.339, - "step": 46290 - }, - { - "epoch": 40.12, - "learning_rate": 7.986713286713286e-07, - "loss": 0.3293, - "step": 46300 - }, - { - "epoch": 40.13, - "learning_rate": 7.979720279720279e-07, - "loss": 0.434, - "step": 46310 - }, - { - "epoch": 40.14, - "learning_rate": 7.972727272727272e-07, - "loss": 0.3497, - "step": 46320 - }, - { - "epoch": 40.15, - "learning_rate": 7.965734265734266e-07, - "loss": 0.3962, - "step": 46330 - }, - { - "epoch": 40.16, - "learning_rate": 7.958741258741259e-07, - "loss": 0.3041, - "step": 46340 - }, - { - "epoch": 40.16, - "learning_rate": 7.951748251748251e-07, - "loss": 0.3659, - "step": 46350 - }, - { - "epoch": 40.17, - "learning_rate": 7.944755244755244e-07, - "loss": 0.3684, - "step": 46360 - }, - { - "epoch": 40.18, - "learning_rate": 7.937762237762238e-07, - "loss": 0.3591, - "step": 46370 - }, - { - "epoch": 40.19, - "learning_rate": 7.930769230769231e-07, - "loss": 0.3384, - "step": 46380 - }, - { - "epoch": 40.2, - "learning_rate": 7.923776223776223e-07, - "loss": 0.3565, - "step": 46390 - }, - { - "epoch": 40.21, - "learning_rate": 7.916783216783216e-07, - "loss": 0.3494, - "step": 46400 - }, - { - "epoch": 40.22, - "learning_rate": 7.90979020979021e-07, - "loss": 0.3633, - "step": 46410 - }, - { - "epoch": 40.23, - "learning_rate": 7.902797202797202e-07, - "loss": 0.3559, - "step": 46420 - }, - { - "epoch": 40.23, - "learning_rate": 7.895804195804195e-07, - "loss": 0.3643, - "step": 46430 - }, - { - "epoch": 40.24, - "learning_rate": 7.888811188811188e-07, - "loss": 0.3674, - "step": 46440 - }, - { - "epoch": 40.25, - "learning_rate": 7.881818181818182e-07, - "loss": 0.3457, - "step": 46450 - }, - { - "epoch": 40.26, - "learning_rate": 7.874825174825175e-07, - "loss": 0.428, - "step": 46460 - }, - { - "epoch": 40.27, - "learning_rate": 7.867832167832168e-07, - "loss": 0.3056, - "step": 46470 - }, - { - "epoch": 40.28, - "learning_rate": 7.86083916083916e-07, - "loss": 0.3643, - "step": 46480 - }, - { - "epoch": 40.29, - "learning_rate": 7.853846153846153e-07, - "loss": 0.3634, - "step": 46490 - }, - { - "epoch": 40.29, - "learning_rate": 7.846853146853146e-07, - "loss": 0.3273, - "step": 46500 - }, - { - "epoch": 40.3, - "learning_rate": 7.839860139860139e-07, - "loss": 0.3266, - "step": 46510 - }, - { - "epoch": 40.31, - "learning_rate": 7.832867132867133e-07, - "loss": 0.386, - "step": 46520 - }, - { - "epoch": 40.32, - "learning_rate": 7.825874125874126e-07, - "loss": 0.3992, - "step": 46530 - }, - { - "epoch": 40.33, - "learning_rate": 7.818881118881119e-07, - "loss": 0.3818, - "step": 46540 - }, - { - "epoch": 40.34, - "learning_rate": 7.811888111888112e-07, - "loss": 0.3936, - "step": 46550 - }, - { - "epoch": 40.35, - "learning_rate": 7.804895104895105e-07, - "loss": 0.3577, - "step": 46560 - }, - { - "epoch": 40.36, - "learning_rate": 7.797902097902097e-07, - "loss": 0.3625, - "step": 46570 - }, - { - "epoch": 40.36, - "learning_rate": 7.79090909090909e-07, - "loss": 0.325, - "step": 46580 - }, - { - "epoch": 40.37, - "learning_rate": 7.783916083916083e-07, - "loss": 0.2867, - "step": 46590 - }, - { - "epoch": 40.38, - "learning_rate": 7.776923076923077e-07, - "loss": 0.3772, - "step": 46600 - }, - { - "epoch": 40.39, - "learning_rate": 7.76993006993007e-07, - "loss": 0.4338, - "step": 46610 - }, - { - "epoch": 40.4, - "learning_rate": 7.762937062937063e-07, - "loss": 0.2842, - "step": 46620 - }, - { - "epoch": 40.41, - "learning_rate": 7.755944055944055e-07, - "loss": 0.3428, - "step": 46630 - }, - { - "epoch": 40.42, - "learning_rate": 7.748951048951049e-07, - "loss": 0.3017, - "step": 46640 - }, - { - "epoch": 40.42, - "learning_rate": 7.741958041958042e-07, - "loss": 0.377, - "step": 46650 - }, - { - "epoch": 40.43, - "learning_rate": 7.734965034965034e-07, - "loss": 0.3507, - "step": 46660 - }, - { - "epoch": 40.44, - "learning_rate": 7.727972027972027e-07, - "loss": 0.4011, - "step": 46670 - }, - { - "epoch": 40.45, - "learning_rate": 7.720979020979021e-07, - "loss": 0.3269, - "step": 46680 - }, - { - "epoch": 40.46, - "learning_rate": 7.713986013986014e-07, - "loss": 0.3637, - "step": 46690 - }, - { - "epoch": 40.47, - "learning_rate": 7.706993006993006e-07, - "loss": 0.3921, - "step": 46700 - }, - { - "epoch": 40.48, - "learning_rate": 7.699999999999999e-07, - "loss": 0.3854, - "step": 46710 - }, - { - "epoch": 40.49, - "learning_rate": 7.693006993006993e-07, - "loss": 0.3721, - "step": 46720 - }, - { - "epoch": 40.49, - "learning_rate": 7.686013986013986e-07, - "loss": 0.3072, - "step": 46730 - }, - { - "epoch": 40.5, - "learning_rate": 7.679020979020979e-07, - "loss": 0.3823, - "step": 46740 - }, - { - "epoch": 40.51, - "learning_rate": 7.672027972027971e-07, - "loss": 0.428, - "step": 46750 - }, - { - "epoch": 40.52, - "learning_rate": 7.665034965034965e-07, - "loss": 0.391, - "step": 46760 - }, - { - "epoch": 40.53, - "learning_rate": 7.658041958041958e-07, - "loss": 0.388, - "step": 46770 - }, - { - "epoch": 40.54, - "learning_rate": 7.65104895104895e-07, - "loss": 0.3316, - "step": 46780 - }, - { - "epoch": 40.55, - "learning_rate": 7.644055944055944e-07, - "loss": 0.3006, - "step": 46790 - }, - { - "epoch": 40.55, - "learning_rate": 7.637062937062937e-07, - "loss": 0.3454, - "step": 46800 - }, - { - "epoch": 40.56, - "learning_rate": 7.63006993006993e-07, - "loss": 0.3911, - "step": 46810 - }, - { - "epoch": 40.57, - "learning_rate": 7.623076923076923e-07, - "loss": 0.4216, - "step": 46820 - }, - { - "epoch": 40.58, - "learning_rate": 7.616083916083916e-07, - "loss": 0.3473, - "step": 46830 - }, - { - "epoch": 40.59, - "learning_rate": 7.609090909090909e-07, - "loss": 0.318, - "step": 46840 - }, - { - "epoch": 40.6, - "learning_rate": 7.602097902097901e-07, - "loss": 0.3566, - "step": 46850 - }, - { - "epoch": 40.61, - "learning_rate": 7.595104895104894e-07, - "loss": 0.4275, - "step": 46860 - }, - { - "epoch": 40.61, - "learning_rate": 7.588111888111888e-07, - "loss": 0.3429, - "step": 46870 - }, - { - "epoch": 40.62, - "learning_rate": 7.581118881118881e-07, - "loss": 0.3497, - "step": 46880 - }, - { - "epoch": 40.63, - "learning_rate": 7.574125874125874e-07, - "loss": 0.3578, - "step": 46890 - }, - { - "epoch": 40.64, - "learning_rate": 7.567132867132867e-07, - "loss": 0.3595, - "step": 46900 - }, - { - "epoch": 40.65, - "learning_rate": 7.560139860139861e-07, - "loss": 0.3588, - "step": 46910 - }, - { - "epoch": 40.66, - "learning_rate": 7.553146853146852e-07, - "loss": 0.3881, - "step": 46920 - }, - { - "epoch": 40.67, - "learning_rate": 7.546153846153845e-07, - "loss": 0.3375, - "step": 46930 - }, - { - "epoch": 40.68, - "learning_rate": 7.539160839160838e-07, - "loss": 0.304, - "step": 46940 - }, - { - "epoch": 40.68, - "learning_rate": 7.532167832167832e-07, - "loss": 0.3907, - "step": 46950 - }, - { - "epoch": 40.69, - "learning_rate": 7.525174825174825e-07, - "loss": 0.3802, - "step": 46960 - }, - { - "epoch": 40.7, - "learning_rate": 7.518181818181818e-07, - "loss": 0.3624, - "step": 46970 - }, - { - "epoch": 40.71, - "learning_rate": 7.511188811188811e-07, - "loss": 0.3823, - "step": 46980 - }, - { - "epoch": 40.72, - "learning_rate": 7.504195804195804e-07, - "loss": 0.3714, - "step": 46990 - }, - { - "epoch": 40.73, - "learning_rate": 7.497202797202797e-07, - "loss": 0.3438, - "step": 47000 - }, - { - "epoch": 40.74, - "learning_rate": 7.490209790209789e-07, - "loss": 0.3373, - "step": 47010 - }, - { - "epoch": 40.74, - "learning_rate": 7.483216783216783e-07, - "loss": 0.3587, - "step": 47020 - }, - { - "epoch": 40.75, - "learning_rate": 7.476223776223776e-07, - "loss": 0.3786, - "step": 47030 - }, - { - "epoch": 40.76, - "learning_rate": 7.469230769230769e-07, - "loss": 0.3028, - "step": 47040 - }, - { - "epoch": 40.77, - "learning_rate": 7.462237762237762e-07, - "loss": 0.3495, - "step": 47050 - }, - { - "epoch": 40.78, - "learning_rate": 7.455244755244756e-07, - "loss": 0.3871, - "step": 47060 - }, - { - "epoch": 40.79, - "learning_rate": 7.448251748251748e-07, - "loss": 0.3675, - "step": 47070 - }, - { - "epoch": 40.8, - "learning_rate": 7.441258741258741e-07, - "loss": 0.3547, - "step": 47080 - }, - { - "epoch": 40.81, - "learning_rate": 7.434265734265734e-07, - "loss": 0.3329, - "step": 47090 - }, - { - "epoch": 40.81, - "learning_rate": 7.427272727272727e-07, - "loss": 0.3788, - "step": 47100 - }, - { - "epoch": 40.82, - "learning_rate": 7.42027972027972e-07, - "loss": 0.3157, - "step": 47110 - }, - { - "epoch": 40.83, - "learning_rate": 7.413286713286713e-07, - "loss": 0.3474, - "step": 47120 - }, - { - "epoch": 40.84, - "learning_rate": 7.406293706293705e-07, - "loss": 0.3536, - "step": 47130 - }, - { - "epoch": 40.85, - "learning_rate": 7.399300699300699e-07, - "loss": 0.3388, - "step": 47140 - }, - { - "epoch": 40.86, - "learning_rate": 7.392307692307692e-07, - "loss": 0.3879, - "step": 47150 - }, - { - "epoch": 40.87, - "learning_rate": 7.385314685314685e-07, - "loss": 0.4051, - "step": 47160 - }, - { - "epoch": 40.87, - "learning_rate": 7.378321678321678e-07, - "loss": 0.3227, - "step": 47170 - }, - { - "epoch": 40.88, - "learning_rate": 7.371328671328672e-07, - "loss": 0.3035, - "step": 47180 - }, - { - "epoch": 40.89, - "learning_rate": 7.364335664335664e-07, - "loss": 0.3333, - "step": 47190 - }, - { - "epoch": 40.9, - "learning_rate": 7.357342657342656e-07, - "loss": 0.3611, - "step": 47200 - }, - { - "epoch": 40.91, - "learning_rate": 7.350349650349649e-07, - "loss": 0.4021, - "step": 47210 - }, - { - "epoch": 40.92, - "learning_rate": 7.343356643356643e-07, - "loss": 0.3797, - "step": 47220 - }, - { - "epoch": 40.93, - "learning_rate": 7.336363636363636e-07, - "loss": 0.3672, - "step": 47230 - }, - { - "epoch": 40.94, - "learning_rate": 7.329370629370629e-07, - "loss": 0.3057, - "step": 47240 - }, - { - "epoch": 40.94, - "learning_rate": 7.322377622377623e-07, - "loss": 0.3187, - "step": 47250 - }, - { - "epoch": 40.95, - "learning_rate": 7.315384615384616e-07, - "loss": 0.3606, - "step": 47260 - }, - { - "epoch": 40.96, - "learning_rate": 7.308391608391608e-07, - "loss": 0.3516, - "step": 47270 - }, - { - "epoch": 40.97, - "learning_rate": 7.3013986013986e-07, - "loss": 0.3528, - "step": 47280 - }, - { - "epoch": 40.98, - "learning_rate": 7.294405594405594e-07, - "loss": 0.397, - "step": 47290 - }, - { - "epoch": 40.99, - "learning_rate": 7.287412587412587e-07, - "loss": 0.3507, - "step": 47300 - }, - { - "epoch": 41.0, - "learning_rate": 7.28041958041958e-07, - "loss": 0.3513, - "step": 47310 - }, - { - "epoch": 41.0, - "eval_loss": 0.559901773929596, - "eval_runtime": 136.925, - "eval_samples_per_second": 3.885, - "eval_steps_per_second": 1.943, - "eval_wer": 0.24201324162756316, - "step": 47314 - }, - { - "epoch": 41.01, - "learning_rate": 7.273426573426573e-07, - "loss": 0.3905, - "step": 47320 - }, - { - "epoch": 41.01, - "learning_rate": 7.266433566433567e-07, - "loss": 0.3763, - "step": 47330 - }, - { - "epoch": 41.02, - "learning_rate": 7.25944055944056e-07, - "loss": 0.3119, - "step": 47340 - }, - { - "epoch": 41.03, - "learning_rate": 7.252447552447552e-07, - "loss": 0.3404, - "step": 47350 - }, - { - "epoch": 41.04, - "learning_rate": 7.245454545454544e-07, - "loss": 0.3944, - "step": 47360 - }, - { - "epoch": 41.05, - "learning_rate": 7.238461538461538e-07, - "loss": 0.4, - "step": 47370 - }, - { - "epoch": 41.06, - "learning_rate": 7.231468531468531e-07, - "loss": 0.3483, - "step": 47380 - }, - { - "epoch": 41.07, - "learning_rate": 7.224475524475524e-07, - "loss": 0.345, - "step": 47390 - }, - { - "epoch": 41.07, - "learning_rate": 7.217482517482517e-07, - "loss": 0.3332, - "step": 47400 - }, - { - "epoch": 41.08, - "learning_rate": 7.210489510489511e-07, - "loss": 0.3213, - "step": 47410 - }, - { - "epoch": 41.09, - "learning_rate": 7.203496503496503e-07, - "loss": 0.3375, - "step": 47420 - }, - { - "epoch": 41.1, - "learning_rate": 7.196503496503496e-07, - "loss": 0.3356, - "step": 47430 - }, - { - "epoch": 41.11, - "learning_rate": 7.189510489510489e-07, - "loss": 0.3306, - "step": 47440 - }, - { - "epoch": 41.12, - "learning_rate": 7.182517482517482e-07, - "loss": 0.4358, - "step": 47450 - }, - { - "epoch": 41.13, - "learning_rate": 7.175524475524475e-07, - "loss": 0.4413, - "step": 47460 - }, - { - "epoch": 41.14, - "learning_rate": 7.168531468531468e-07, - "loss": 0.3332, - "step": 47470 - }, - { - "epoch": 41.14, - "learning_rate": 7.161538461538461e-07, - "loss": 0.369, - "step": 47480 - }, - { - "epoch": 41.15, - "learning_rate": 7.154545454545454e-07, - "loss": 0.3748, - "step": 47490 - }, - { - "epoch": 41.16, - "learning_rate": 7.147552447552447e-07, - "loss": 0.3464, - "step": 47500 - }, - { - "epoch": 41.17, - "learning_rate": 7.14055944055944e-07, - "loss": 0.3844, - "step": 47510 - }, - { - "epoch": 41.18, - "learning_rate": 7.133566433566434e-07, - "loss": 0.3767, - "step": 47520 - }, - { - "epoch": 41.19, - "learning_rate": 7.126573426573427e-07, - "loss": 0.3676, - "step": 47530 - }, - { - "epoch": 41.2, - "learning_rate": 7.119580419580419e-07, - "loss": 0.3877, - "step": 47540 - }, - { - "epoch": 41.2, - "learning_rate": 7.112587412587412e-07, - "loss": 0.3902, - "step": 47550 - }, - { - "epoch": 41.21, - "learning_rate": 7.105594405594406e-07, - "loss": 0.3718, - "step": 47560 - }, - { - "epoch": 41.22, - "learning_rate": 7.098601398601398e-07, - "loss": 0.3501, - "step": 47570 - }, - { - "epoch": 41.23, - "learning_rate": 7.091608391608391e-07, - "loss": 0.3736, - "step": 47580 - }, - { - "epoch": 41.24, - "learning_rate": 7.084615384615384e-07, - "loss": 0.3599, - "step": 47590 - }, - { - "epoch": 41.25, - "learning_rate": 7.077622377622378e-07, - "loss": 0.3664, - "step": 47600 - }, - { - "epoch": 41.26, - "learning_rate": 7.070629370629371e-07, - "loss": 0.3893, - "step": 47610 - }, - { - "epoch": 41.27, - "learning_rate": 7.063636363636364e-07, - "loss": 0.3887, - "step": 47620 - }, - { - "epoch": 41.27, - "learning_rate": 7.056643356643355e-07, - "loss": 0.3254, - "step": 47630 - }, - { - "epoch": 41.28, - "learning_rate": 7.049650349650349e-07, - "loss": 0.3702, - "step": 47640 - }, - { - "epoch": 41.29, - "learning_rate": 7.042657342657342e-07, - "loss": 0.3874, - "step": 47650 - }, - { - "epoch": 41.3, - "learning_rate": 7.035664335664335e-07, - "loss": 0.3469, - "step": 47660 - }, - { - "epoch": 41.31, - "learning_rate": 7.028671328671328e-07, - "loss": 0.3587, - "step": 47670 - }, - { - "epoch": 41.32, - "learning_rate": 7.021678321678322e-07, - "loss": 0.3572, - "step": 47680 - }, - { - "epoch": 41.33, - "learning_rate": 7.014685314685315e-07, - "loss": 0.3382, - "step": 47690 - }, - { - "epoch": 41.33, - "learning_rate": 7.007692307692308e-07, - "loss": 0.3692, - "step": 47700 - }, - { - "epoch": 41.34, - "learning_rate": 7.0006993006993e-07, - "loss": 0.3552, - "step": 47710 - }, - { - "epoch": 41.35, - "learning_rate": 6.993706293706293e-07, - "loss": 0.3536, - "step": 47720 - }, - { - "epoch": 41.36, - "learning_rate": 6.986713286713286e-07, - "loss": 0.3274, - "step": 47730 - }, - { - "epoch": 41.37, - "learning_rate": 6.979720279720279e-07, - "loss": 0.368, - "step": 47740 - }, - { - "epoch": 41.38, - "learning_rate": 6.972727272727273e-07, - "loss": 0.4008, - "step": 47750 - }, - { - "epoch": 41.39, - "learning_rate": 6.965734265734266e-07, - "loss": 0.3336, - "step": 47760 - }, - { - "epoch": 41.39, - "learning_rate": 6.958741258741259e-07, - "loss": 0.3342, - "step": 47770 - }, - { - "epoch": 41.4, - "learning_rate": 6.951748251748251e-07, - "loss": 0.3587, - "step": 47780 - }, - { - "epoch": 41.41, - "learning_rate": 6.944755244755245e-07, - "loss": 0.371, - "step": 47790 - }, - { - "epoch": 41.42, - "learning_rate": 6.937762237762237e-07, - "loss": 0.3359, - "step": 47800 - }, - { - "epoch": 41.43, - "learning_rate": 6.93076923076923e-07, - "loss": 0.3806, - "step": 47810 - }, - { - "epoch": 41.44, - "learning_rate": 6.923776223776223e-07, - "loss": 0.369, - "step": 47820 - }, - { - "epoch": 41.45, - "learning_rate": 6.916783216783217e-07, - "loss": 0.3462, - "step": 47830 - }, - { - "epoch": 41.46, - "learning_rate": 6.90979020979021e-07, - "loss": 0.2829, - "step": 47840 - }, - { - "epoch": 41.46, - "learning_rate": 6.902797202797202e-07, - "loss": 0.3493, - "step": 47850 - }, - { - "epoch": 41.47, - "learning_rate": 6.895804195804195e-07, - "loss": 0.3654, - "step": 47860 - }, - { - "epoch": 41.48, - "learning_rate": 6.888811188811189e-07, - "loss": 0.3211, - "step": 47870 - }, - { - "epoch": 41.49, - "learning_rate": 6.881818181818182e-07, - "loss": 0.3532, - "step": 47880 - }, - { - "epoch": 41.5, - "learning_rate": 6.874825174825174e-07, - "loss": 0.3522, - "step": 47890 - }, - { - "epoch": 41.51, - "learning_rate": 6.867832167832167e-07, - "loss": 0.3524, - "step": 47900 - }, - { - "epoch": 41.52, - "learning_rate": 6.860839160839161e-07, - "loss": 0.3416, - "step": 47910 - }, - { - "epoch": 41.52, - "learning_rate": 6.853846153846153e-07, - "loss": 0.3726, - "step": 47920 - }, - { - "epoch": 41.53, - "learning_rate": 6.846853146853146e-07, - "loss": 0.3733, - "step": 47930 - }, - { - "epoch": 41.54, - "learning_rate": 6.839860139860139e-07, - "loss": 0.3302, - "step": 47940 - }, - { - "epoch": 41.55, - "learning_rate": 6.832867132867133e-07, - "loss": 0.368, - "step": 47950 - }, - { - "epoch": 41.56, - "learning_rate": 6.825874125874126e-07, - "loss": 0.3841, - "step": 47960 - }, - { - "epoch": 41.57, - "learning_rate": 6.818881118881119e-07, - "loss": 0.3956, - "step": 47970 - }, - { - "epoch": 41.58, - "learning_rate": 6.811888111888111e-07, - "loss": 0.3752, - "step": 47980 - }, - { - "epoch": 41.59, - "learning_rate": 6.804895104895104e-07, - "loss": 0.3636, - "step": 47990 - }, - { - "epoch": 41.59, - "learning_rate": 6.797902097902097e-07, - "loss": 0.3978, - "step": 48000 - }, - { - "epoch": 41.6, - "learning_rate": 6.79090909090909e-07, - "loss": 0.368, - "step": 48010 - }, - { - "epoch": 41.61, - "learning_rate": 6.783916083916084e-07, - "loss": 0.4165, - "step": 48020 - }, - { - "epoch": 41.62, - "learning_rate": 6.776923076923077e-07, - "loss": 0.3761, - "step": 48030 - }, - { - "epoch": 41.63, - "learning_rate": 6.76993006993007e-07, - "loss": 0.3411, - "step": 48040 - }, - { - "epoch": 41.64, - "learning_rate": 6.762937062937063e-07, - "loss": 0.3551, - "step": 48050 - }, - { - "epoch": 41.65, - "learning_rate": 6.755944055944057e-07, - "loss": 0.4011, - "step": 48060 - }, - { - "epoch": 41.65, - "learning_rate": 6.748951048951048e-07, - "loss": 0.3244, - "step": 48070 - }, - { - "epoch": 41.66, - "learning_rate": 6.741958041958041e-07, - "loss": 0.3954, - "step": 48080 - }, - { - "epoch": 41.67, - "learning_rate": 6.734965034965034e-07, - "loss": 0.3258, - "step": 48090 - }, - { - "epoch": 41.68, - "learning_rate": 6.727972027972028e-07, - "loss": 0.3887, - "step": 48100 - }, - { - "epoch": 41.69, - "learning_rate": 6.720979020979021e-07, - "loss": 0.3747, - "step": 48110 - }, - { - "epoch": 41.7, - "learning_rate": 6.713986013986014e-07, - "loss": 0.4292, - "step": 48120 - }, - { - "epoch": 41.71, - "learning_rate": 6.706993006993007e-07, - "loss": 0.3614, - "step": 48130 - }, - { - "epoch": 41.72, - "learning_rate": 6.7e-07, - "loss": 0.3716, - "step": 48140 - }, - { - "epoch": 41.72, - "learning_rate": 6.693006993006993e-07, - "loss": 0.3525, - "step": 48150 - }, - { - "epoch": 41.73, - "learning_rate": 6.686013986013985e-07, - "loss": 0.379, - "step": 48160 - }, - { - "epoch": 41.74, - "learning_rate": 6.679020979020978e-07, - "loss": 0.3761, - "step": 48170 - }, - { - "epoch": 41.75, - "learning_rate": 6.672027972027972e-07, - "loss": 0.4308, - "step": 48180 - }, - { - "epoch": 41.76, - "learning_rate": 6.665034965034965e-07, - "loss": 0.3468, - "step": 48190 - }, - { - "epoch": 41.77, - "learning_rate": 6.658041958041958e-07, - "loss": 0.3229, - "step": 48200 - }, - { - "epoch": 41.78, - "learning_rate": 6.65104895104895e-07, - "loss": 0.3045, - "step": 48210 - }, - { - "epoch": 41.78, - "learning_rate": 6.644055944055944e-07, - "loss": 0.3951, - "step": 48220 - }, - { - "epoch": 41.79, - "learning_rate": 6.637062937062937e-07, - "loss": 0.352, - "step": 48230 - }, - { - "epoch": 41.8, - "learning_rate": 6.63006993006993e-07, - "loss": 0.2722, - "step": 48240 - }, - { - "epoch": 41.81, - "learning_rate": 6.623076923076923e-07, - "loss": 0.3191, - "step": 48250 - }, - { - "epoch": 41.82, - "learning_rate": 6.616083916083916e-07, - "loss": 0.3697, - "step": 48260 - }, - { - "epoch": 41.83, - "learning_rate": 6.609090909090909e-07, - "loss": 0.3631, - "step": 48270 - }, - { - "epoch": 41.84, - "learning_rate": 6.602097902097901e-07, - "loss": 0.3518, - "step": 48280 - }, - { - "epoch": 41.85, - "learning_rate": 6.595104895104895e-07, - "loss": 0.2858, - "step": 48290 - }, - { - "epoch": 41.85, - "learning_rate": 6.588111888111888e-07, - "loss": 0.3709, - "step": 48300 - }, - { - "epoch": 41.86, - "learning_rate": 6.581118881118881e-07, - "loss": 0.3929, - "step": 48310 - }, - { - "epoch": 41.87, - "learning_rate": 6.574125874125874e-07, - "loss": 0.3, - "step": 48320 - }, - { - "epoch": 41.88, - "learning_rate": 6.567132867132867e-07, - "loss": 0.3737, - "step": 48330 - }, - { - "epoch": 41.89, - "learning_rate": 6.56013986013986e-07, - "loss": 0.3676, - "step": 48340 - }, - { - "epoch": 41.9, - "learning_rate": 6.553146853146852e-07, - "loss": 0.373, - "step": 48350 - }, - { - "epoch": 41.91, - "learning_rate": 6.546153846153845e-07, - "loss": 0.3846, - "step": 48360 - }, - { - "epoch": 41.91, - "learning_rate": 6.539160839160839e-07, - "loss": 0.3561, - "step": 48370 - }, - { - "epoch": 41.92, - "learning_rate": 6.532167832167832e-07, - "loss": 0.3453, - "step": 48380 - }, - { - "epoch": 41.93, - "learning_rate": 6.525174825174825e-07, - "loss": 0.3311, - "step": 48390 - }, - { - "epoch": 41.94, - "learning_rate": 6.518181818181818e-07, - "loss": 0.3983, - "step": 48400 - }, - { - "epoch": 41.95, - "learning_rate": 6.511188811188812e-07, - "loss": 0.3875, - "step": 48410 - }, - { - "epoch": 41.96, - "learning_rate": 6.504195804195803e-07, - "loss": 0.3334, - "step": 48420 - }, - { - "epoch": 41.97, - "learning_rate": 6.497202797202796e-07, - "loss": 0.4028, - "step": 48430 - }, - { - "epoch": 41.98, - "learning_rate": 6.490209790209789e-07, - "loss": 0.3421, - "step": 48440 - }, - { - "epoch": 41.98, - "learning_rate": 6.483216783216783e-07, - "loss": 0.3155, - "step": 48450 - }, - { - "epoch": 41.99, - "learning_rate": 6.476223776223776e-07, - "loss": 0.3739, - "step": 48460 - }, - { - "epoch": 42.0, - "eval_loss": 0.5668932199478149, - "eval_runtime": 136.0754, - "eval_samples_per_second": 3.91, - "eval_steps_per_second": 1.955, - "eval_wer": 0.24175612264575433, - "step": 48468 - }, - { - "epoch": 42.0, - "learning_rate": 6.469230769230769e-07, - "loss": 0.3767, - "step": 48470 - }, - { - "epoch": 42.01, - "learning_rate": 6.462237762237763e-07, - "loss": 0.389, - "step": 48480 - }, - { - "epoch": 42.02, - "learning_rate": 6.455244755244756e-07, - "loss": 0.3434, - "step": 48490 - }, - { - "epoch": 42.03, - "learning_rate": 6.448251748251748e-07, - "loss": 0.3547, - "step": 48500 - }, - { - "epoch": 42.04, - "learning_rate": 6.44125874125874e-07, - "loss": 0.3653, - "step": 48510 - }, - { - "epoch": 42.05, - "learning_rate": 6.434265734265734e-07, - "loss": 0.357, - "step": 48520 - }, - { - "epoch": 42.05, - "learning_rate": 6.427272727272727e-07, - "loss": 0.3694, - "step": 48530 - }, - { - "epoch": 42.06, - "learning_rate": 6.42027972027972e-07, - "loss": 0.3616, - "step": 48540 - }, - { - "epoch": 42.07, - "learning_rate": 6.413286713286713e-07, - "loss": 0.3419, - "step": 48550 - }, - { - "epoch": 42.08, - "learning_rate": 6.406293706293707e-07, - "loss": 0.385, - "step": 48560 - }, - { - "epoch": 42.09, - "learning_rate": 6.399300699300699e-07, - "loss": 0.3177, - "step": 48570 - }, - { - "epoch": 42.1, - "learning_rate": 6.392307692307692e-07, - "loss": 0.3408, - "step": 48580 - }, - { - "epoch": 42.11, - "learning_rate": 6.385314685314685e-07, - "loss": 0.3393, - "step": 48590 - }, - { - "epoch": 42.11, - "learning_rate": 6.378321678321678e-07, - "loss": 0.3989, - "step": 48600 - }, - { - "epoch": 42.12, - "learning_rate": 6.371328671328671e-07, - "loss": 0.3204, - "step": 48610 - }, - { - "epoch": 42.13, - "learning_rate": 6.364335664335664e-07, - "loss": 0.3511, - "step": 48620 - }, - { - "epoch": 42.14, - "learning_rate": 6.357342657342657e-07, - "loss": 0.3581, - "step": 48630 - }, - { - "epoch": 42.15, - "learning_rate": 6.35034965034965e-07, - "loss": 0.3515, - "step": 48640 - }, - { - "epoch": 42.16, - "learning_rate": 6.343356643356643e-07, - "loss": 0.3076, - "step": 48650 - }, - { - "epoch": 42.17, - "learning_rate": 6.336363636363636e-07, - "loss": 0.3228, - "step": 48660 - }, - { - "epoch": 42.17, - "learning_rate": 6.329370629370629e-07, - "loss": 0.3846, - "step": 48670 - }, - { - "epoch": 42.18, - "learning_rate": 6.322377622377623e-07, - "loss": 0.3596, - "step": 48680 - }, - { - "epoch": 42.19, - "learning_rate": 6.315384615384615e-07, - "loss": 0.2774, - "step": 48690 - }, - { - "epoch": 42.2, - "learning_rate": 6.308391608391608e-07, - "loss": 0.299, - "step": 48700 - }, - { - "epoch": 42.21, - "learning_rate": 6.3013986013986e-07, - "loss": 0.3831, - "step": 48710 - }, - { - "epoch": 42.22, - "learning_rate": 6.294405594405594e-07, - "loss": 0.3012, - "step": 48720 - }, - { - "epoch": 42.23, - "learning_rate": 6.287412587412587e-07, - "loss": 0.4169, - "step": 48730 - }, - { - "epoch": 42.24, - "learning_rate": 6.28041958041958e-07, - "loss": 0.3375, - "step": 48740 - }, - { - "epoch": 42.24, - "learning_rate": 6.273426573426574e-07, - "loss": 0.3376, - "step": 48750 - }, - { - "epoch": 42.25, - "learning_rate": 6.266433566433567e-07, - "loss": 0.3196, - "step": 48760 - }, - { - "epoch": 42.26, - "learning_rate": 6.25944055944056e-07, - "loss": 0.353, - "step": 48770 - }, - { - "epoch": 42.27, - "learning_rate": 6.252447552447551e-07, - "loss": 0.359, - "step": 48780 - }, - { - "epoch": 42.28, - "learning_rate": 6.245454545454545e-07, - "loss": 0.3557, - "step": 48790 - }, - { - "epoch": 42.29, - "learning_rate": 6.238461538461538e-07, - "loss": 0.3828, - "step": 48800 - }, - { - "epoch": 42.3, - "learning_rate": 6.231468531468531e-07, - "loss": 0.4027, - "step": 48810 - }, - { - "epoch": 42.3, - "learning_rate": 6.224475524475524e-07, - "loss": 0.3855, - "step": 48820 - }, - { - "epoch": 42.31, - "learning_rate": 6.217482517482518e-07, - "loss": 0.3452, - "step": 48830 - }, - { - "epoch": 42.32, - "learning_rate": 6.210489510489511e-07, - "loss": 0.4077, - "step": 48840 - }, - { - "epoch": 42.33, - "learning_rate": 6.203496503496504e-07, - "loss": 0.3513, - "step": 48850 - }, - { - "epoch": 42.34, - "learning_rate": 6.196503496503495e-07, - "loss": 0.4098, - "step": 48860 - }, - { - "epoch": 42.35, - "learning_rate": 6.189510489510489e-07, - "loss": 0.3481, - "step": 48870 - }, - { - "epoch": 42.36, - "learning_rate": 6.182517482517482e-07, - "loss": 0.3485, - "step": 48880 - }, - { - "epoch": 42.37, - "learning_rate": 6.175524475524475e-07, - "loss": 0.322, - "step": 48890 - }, - { - "epoch": 42.37, - "learning_rate": 6.168531468531468e-07, - "loss": 0.3485, - "step": 48900 - }, - { - "epoch": 42.38, - "learning_rate": 6.161538461538462e-07, - "loss": 0.3846, - "step": 48910 - }, - { - "epoch": 42.39, - "learning_rate": 6.154545454545455e-07, - "loss": 0.3714, - "step": 48920 - }, - { - "epoch": 42.4, - "learning_rate": 6.147552447552447e-07, - "loss": 0.3733, - "step": 48930 - }, - { - "epoch": 42.41, - "learning_rate": 6.14055944055944e-07, - "loss": 0.3456, - "step": 48940 - }, - { - "epoch": 42.42, - "learning_rate": 6.133566433566433e-07, - "loss": 0.3564, - "step": 48950 - }, - { - "epoch": 42.43, - "learning_rate": 6.126573426573426e-07, - "loss": 0.3668, - "step": 48960 - }, - { - "epoch": 42.43, - "learning_rate": 6.119580419580419e-07, - "loss": 0.3504, - "step": 48970 - }, - { - "epoch": 42.44, - "learning_rate": 6.112587412587413e-07, - "loss": 0.3736, - "step": 48980 - }, - { - "epoch": 42.45, - "learning_rate": 6.105594405594406e-07, - "loss": 0.4041, - "step": 48990 - }, - { - "epoch": 42.46, - "learning_rate": 6.098601398601398e-07, - "loss": 0.4201, - "step": 49000 - }, - { - "epoch": 42.47, - "learning_rate": 6.091608391608391e-07, - "loss": 0.3436, - "step": 49010 - }, - { - "epoch": 42.48, - "learning_rate": 6.084615384615385e-07, - "loss": 0.3663, - "step": 49020 - }, - { - "epoch": 42.49, - "learning_rate": 6.077622377622378e-07, - "loss": 0.3723, - "step": 49030 - }, - { - "epoch": 42.5, - "learning_rate": 6.07062937062937e-07, - "loss": 0.3465, - "step": 49040 - }, - { - "epoch": 42.5, - "learning_rate": 6.063636363636363e-07, - "loss": 0.3464, - "step": 49050 - }, - { - "epoch": 42.51, - "learning_rate": 6.056643356643357e-07, - "loss": 0.3682, - "step": 49060 - }, - { - "epoch": 42.52, - "learning_rate": 6.049650349650349e-07, - "loss": 0.3549, - "step": 49070 - }, - { - "epoch": 42.53, - "learning_rate": 6.042657342657342e-07, - "loss": 0.397, - "step": 49080 - }, - { - "epoch": 42.54, - "learning_rate": 6.035664335664335e-07, - "loss": 0.3514, - "step": 49090 - }, - { - "epoch": 42.55, - "learning_rate": 6.028671328671329e-07, - "loss": 0.3532, - "step": 49100 - }, - { - "epoch": 42.56, - "learning_rate": 6.021678321678322e-07, - "loss": 0.3897, - "step": 49110 - }, - { - "epoch": 42.56, - "learning_rate": 6.014685314685315e-07, - "loss": 0.3663, - "step": 49120 - }, - { - "epoch": 42.57, - "learning_rate": 6.007692307692307e-07, - "loss": 0.3393, - "step": 49130 - }, - { - "epoch": 42.58, - "learning_rate": 6.0006993006993e-07, - "loss": 0.3473, - "step": 49140 - }, - { - "epoch": 42.59, - "learning_rate": 5.993706293706293e-07, - "loss": 0.3699, - "step": 49150 - }, - { - "epoch": 42.6, - "learning_rate": 5.986713286713286e-07, - "loss": 0.4025, - "step": 49160 - }, - { - "epoch": 42.61, - "learning_rate": 5.979720279720279e-07, - "loss": 0.3543, - "step": 49170 - }, - { - "epoch": 42.62, - "learning_rate": 5.972727272727273e-07, - "loss": 0.3318, - "step": 49180 - }, - { - "epoch": 42.63, - "learning_rate": 5.965734265734266e-07, - "loss": 0.3419, - "step": 49190 - }, - { - "epoch": 42.63, - "learning_rate": 5.958741258741259e-07, - "loss": 0.3452, - "step": 49200 - }, - { - "epoch": 42.64, - "learning_rate": 5.951748251748253e-07, - "loss": 0.385, - "step": 49210 - }, - { - "epoch": 42.65, - "learning_rate": 5.944755244755244e-07, - "loss": 0.4066, - "step": 49220 - }, - { - "epoch": 42.66, - "learning_rate": 5.937762237762237e-07, - "loss": 0.3566, - "step": 49230 - }, - { - "epoch": 42.67, - "learning_rate": 5.93076923076923e-07, - "loss": 0.3442, - "step": 49240 - }, - { - "epoch": 42.68, - "learning_rate": 5.923776223776224e-07, - "loss": 0.3464, - "step": 49250 - }, - { - "epoch": 42.69, - "learning_rate": 5.916783216783217e-07, - "loss": 0.3406, - "step": 49260 - }, - { - "epoch": 42.69, - "learning_rate": 5.90979020979021e-07, - "loss": 0.3679, - "step": 49270 - }, - { - "epoch": 42.7, - "learning_rate": 5.902797202797202e-07, - "loss": 0.3481, - "step": 49280 - }, - { - "epoch": 42.71, - "learning_rate": 5.895804195804196e-07, - "loss": 0.3361, - "step": 49290 - }, - { - "epoch": 42.72, - "learning_rate": 5.888811188811188e-07, - "loss": 0.3668, - "step": 49300 - }, - { - "epoch": 42.73, - "learning_rate": 5.881818181818181e-07, - "loss": 0.3632, - "step": 49310 - }, - { - "epoch": 42.74, - "learning_rate": 5.874825174825174e-07, - "loss": 0.391, - "step": 49320 - }, - { - "epoch": 42.75, - "learning_rate": 5.867832167832168e-07, - "loss": 0.3493, - "step": 49330 - }, - { - "epoch": 42.76, - "learning_rate": 5.860839160839161e-07, - "loss": 0.3616, - "step": 49340 - }, - { - "epoch": 42.76, - "learning_rate": 5.853846153846154e-07, - "loss": 0.4051, - "step": 49350 - }, - { - "epoch": 42.77, - "learning_rate": 5.846853146853146e-07, - "loss": 0.3538, - "step": 49360 - }, - { - "epoch": 42.78, - "learning_rate": 5.83986013986014e-07, - "loss": 0.4155, - "step": 49370 - }, - { - "epoch": 42.79, - "learning_rate": 5.832867132867133e-07, - "loss": 0.3261, - "step": 49380 - }, - { - "epoch": 42.8, - "learning_rate": 5.825874125874125e-07, - "loss": 0.3531, - "step": 49390 - }, - { - "epoch": 42.81, - "learning_rate": 5.818881118881118e-07, - "loss": 0.3218, - "step": 49400 - }, - { - "epoch": 42.82, - "learning_rate": 5.811888111888112e-07, - "loss": 0.3846, - "step": 49410 - }, - { - "epoch": 42.82, - "learning_rate": 5.804895104895105e-07, - "loss": 0.3391, - "step": 49420 - }, - { - "epoch": 42.83, - "learning_rate": 5.797902097902097e-07, - "loss": 0.345, - "step": 49430 - }, - { - "epoch": 42.84, - "learning_rate": 5.79090909090909e-07, - "loss": 0.3244, - "step": 49440 - }, - { - "epoch": 42.85, - "learning_rate": 5.783916083916084e-07, - "loss": 0.386, - "step": 49450 - }, - { - "epoch": 42.86, - "learning_rate": 5.776923076923077e-07, - "loss": 0.4148, - "step": 49460 - }, - { - "epoch": 42.87, - "learning_rate": 5.76993006993007e-07, - "loss": 0.3254, - "step": 49470 - }, - { - "epoch": 42.88, - "learning_rate": 5.762937062937062e-07, - "loss": 0.3659, - "step": 49480 - }, - { - "epoch": 42.89, - "learning_rate": 5.755944055944056e-07, - "loss": 0.3793, - "step": 49490 - }, - { - "epoch": 42.89, - "learning_rate": 5.748951048951048e-07, - "loss": 0.3521, - "step": 49500 - }, - { - "epoch": 42.9, - "learning_rate": 5.741958041958041e-07, - "loss": 0.3591, - "step": 49510 - }, - { - "epoch": 42.91, - "learning_rate": 5.734965034965035e-07, - "loss": 0.3978, - "step": 49520 - }, - { - "epoch": 42.92, - "learning_rate": 5.727972027972028e-07, - "loss": 0.3468, - "step": 49530 - }, - { - "epoch": 42.93, - "learning_rate": 5.720979020979021e-07, - "loss": 0.381, - "step": 49540 - }, - { - "epoch": 42.94, - "learning_rate": 5.713986013986014e-07, - "loss": 0.3439, - "step": 49550 - }, - { - "epoch": 42.95, - "learning_rate": 5.706993006993008e-07, - "loss": 0.3546, - "step": 49560 - }, - { - "epoch": 42.95, - "learning_rate": 5.699999999999999e-07, - "loss": 0.3392, - "step": 49570 - }, - { - "epoch": 42.96, - "learning_rate": 5.693006993006992e-07, - "loss": 0.3253, - "step": 49580 - }, - { - "epoch": 42.97, - "learning_rate": 5.686013986013985e-07, - "loss": 0.3876, - "step": 49590 - }, - { - "epoch": 42.98, - "learning_rate": 5.679020979020979e-07, - "loss": 0.3507, - "step": 49600 - }, - { - "epoch": 42.99, - "learning_rate": 5.672027972027972e-07, - "loss": 0.3843, - "step": 49610 - }, - { - "epoch": 43.0, - "learning_rate": 5.665034965034965e-07, - "loss": 0.3702, - "step": 49620 - }, - { - "epoch": 43.0, - "eval_loss": 0.5646147727966309, - "eval_runtime": 138.0762, - "eval_samples_per_second": 3.853, - "eval_steps_per_second": 1.926, - "eval_wer": 0.24413447322748602, - "step": 49622 - }, - { - "epoch": 43.01, - "learning_rate": 5.658041958041958e-07, - "loss": 0.4483, - "step": 49630 - }, - { - "epoch": 43.02, - "learning_rate": 5.651048951048952e-07, - "loss": 0.3129, - "step": 49640 - }, - { - "epoch": 43.02, - "learning_rate": 5.644055944055944e-07, - "loss": 0.3615, - "step": 49650 - }, - { - "epoch": 43.03, - "learning_rate": 5.637062937062936e-07, - "loss": 0.4337, - "step": 49660 - }, - { - "epoch": 43.04, - "learning_rate": 5.630069930069929e-07, - "loss": 0.3558, - "step": 49670 - }, - { - "epoch": 43.05, - "learning_rate": 5.623076923076923e-07, - "loss": 0.3202, - "step": 49680 - }, - { - "epoch": 43.06, - "learning_rate": 5.616083916083916e-07, - "loss": 0.3395, - "step": 49690 - }, - { - "epoch": 43.07, - "learning_rate": 5.609090909090909e-07, - "loss": 0.3591, - "step": 49700 - }, - { - "epoch": 43.08, - "learning_rate": 5.602097902097903e-07, - "loss": 0.4359, - "step": 49710 - }, - { - "epoch": 43.08, - "learning_rate": 5.595104895104895e-07, - "loss": 0.3346, - "step": 49720 - }, - { - "epoch": 43.09, - "learning_rate": 5.588111888111888e-07, - "loss": 0.3803, - "step": 49730 - }, - { - "epoch": 43.1, - "learning_rate": 5.581118881118881e-07, - "loss": 0.3718, - "step": 49740 - }, - { - "epoch": 43.11, - "learning_rate": 5.574125874125874e-07, - "loss": 0.335, - "step": 49750 - }, - { - "epoch": 43.12, - "learning_rate": 5.567132867132867e-07, - "loss": 0.3856, - "step": 49760 - }, - { - "epoch": 43.13, - "learning_rate": 5.56083916083916e-07, - "loss": 0.3488, - "step": 49770 - }, - { - "epoch": 43.14, - "learning_rate": 5.553846153846153e-07, - "loss": 0.3367, - "step": 49780 - }, - { - "epoch": 43.15, - "learning_rate": 5.546853146853146e-07, - "loss": 0.3346, - "step": 49790 - }, - { - "epoch": 43.15, - "learning_rate": 5.53986013986014e-07, - "loss": 0.3368, - "step": 49800 - }, - { - "epoch": 43.16, - "learning_rate": 5.532867132867133e-07, - "loss": 0.3931, - "step": 49810 - }, - { - "epoch": 43.17, - "learning_rate": 5.525874125874126e-07, - "loss": 0.3877, - "step": 49820 - }, - { - "epoch": 43.18, - "learning_rate": 5.51888111888112e-07, - "loss": 0.3382, - "step": 49830 - }, - { - "epoch": 43.19, - "learning_rate": 5.511888111888111e-07, - "loss": 0.3488, - "step": 49840 - }, - { - "epoch": 43.2, - "learning_rate": 5.504895104895104e-07, - "loss": 0.3033, - "step": 49850 - }, - { - "epoch": 43.21, - "learning_rate": 5.497902097902097e-07, - "loss": 0.3465, - "step": 49860 - }, - { - "epoch": 43.21, - "learning_rate": 5.490909090909091e-07, - "loss": 0.3864, - "step": 49870 - }, - { - "epoch": 43.22, - "learning_rate": 5.483916083916084e-07, - "loss": 0.3856, - "step": 49880 - }, - { - "epoch": 43.23, - "learning_rate": 5.476923076923077e-07, - "loss": 0.3992, - "step": 49890 - }, - { - "epoch": 43.24, - "learning_rate": 5.46993006993007e-07, - "loss": 0.351, - "step": 49900 - }, - { - "epoch": 43.25, - "learning_rate": 5.462937062937063e-07, - "loss": 0.3492, - "step": 49910 - }, - { - "epoch": 43.26, - "learning_rate": 5.455944055944056e-07, - "loss": 0.3662, - "step": 49920 - }, - { - "epoch": 43.27, - "learning_rate": 5.448951048951048e-07, - "loss": 0.3553, - "step": 49930 - }, - { - "epoch": 43.28, - "learning_rate": 5.441958041958041e-07, - "loss": 0.403, - "step": 49940 - }, - { - "epoch": 43.28, - "learning_rate": 5.434965034965035e-07, - "loss": 0.3562, - "step": 49950 - }, - { - "epoch": 43.29, - "learning_rate": 5.427972027972028e-07, - "loss": 0.3855, - "step": 49960 - }, - { - "epoch": 43.3, - "learning_rate": 5.420979020979021e-07, - "loss": 0.3589, - "step": 49970 - }, - { - "epoch": 43.31, - "learning_rate": 5.413986013986013e-07, - "loss": 0.3787, - "step": 49980 - }, - { - "epoch": 43.32, - "learning_rate": 5.406993006993007e-07, - "loss": 0.3631, - "step": 49990 - }, - { - "epoch": 43.33, - "learning_rate": 5.4e-07, - "loss": 0.3099, - "step": 50000 - }, - { - "epoch": 43.34, - "learning_rate": 5.393006993006993e-07, - "loss": 0.349, - "step": 50010 - }, - { - "epoch": 43.34, - "learning_rate": 5.386013986013985e-07, - "loss": 0.4186, - "step": 50020 - }, - { - "epoch": 43.35, - "learning_rate": 5.379020979020979e-07, - "loss": 0.349, - "step": 50030 - }, - { - "epoch": 43.36, - "learning_rate": 5.372027972027972e-07, - "loss": 0.377, - "step": 50040 - }, - { - "epoch": 43.37, - "learning_rate": 5.365034965034964e-07, - "loss": 0.3425, - "step": 50050 - }, - { - "epoch": 43.38, - "learning_rate": 5.358041958041957e-07, - "loss": 0.3438, - "step": 50060 - }, - { - "epoch": 43.39, - "learning_rate": 5.351048951048951e-07, - "loss": 0.385, - "step": 50070 - }, - { - "epoch": 43.4, - "learning_rate": 5.344055944055944e-07, - "loss": 0.3116, - "step": 50080 - }, - { - "epoch": 43.41, - "learning_rate": 5.337062937062937e-07, - "loss": 0.3366, - "step": 50090 - }, - { - "epoch": 43.41, - "learning_rate": 5.330069930069931e-07, - "loss": 0.347, - "step": 50100 - }, - { - "epoch": 43.42, - "learning_rate": 5.323076923076923e-07, - "loss": 0.359, - "step": 50110 - }, - { - "epoch": 43.43, - "learning_rate": 5.316083916083915e-07, - "loss": 0.3482, - "step": 50120 - }, - { - "epoch": 43.44, - "learning_rate": 5.309090909090908e-07, - "loss": 0.4245, - "step": 50130 - }, - { - "epoch": 43.45, - "learning_rate": 5.302097902097902e-07, - "loss": 0.4013, - "step": 50140 - }, - { - "epoch": 43.46, - "learning_rate": 5.295104895104895e-07, - "loss": 0.3183, - "step": 50150 - }, - { - "epoch": 43.47, - "learning_rate": 5.288111888111888e-07, - "loss": 0.3847, - "step": 50160 - }, - { - "epoch": 43.47, - "learning_rate": 5.281118881118881e-07, - "loss": 0.3408, - "step": 50170 - }, - { - "epoch": 43.48, - "learning_rate": 5.274125874125875e-07, - "loss": 0.3204, - "step": 50180 - }, - { - "epoch": 43.49, - "learning_rate": 5.267132867132868e-07, - "loss": 0.3748, - "step": 50190 - }, - { - "epoch": 43.5, - "learning_rate": 5.260139860139859e-07, - "loss": 0.3272, - "step": 50200 - }, - { - "epoch": 43.51, - "learning_rate": 5.253146853146852e-07, - "loss": 0.3443, - "step": 50210 - }, - { - "epoch": 43.52, - "learning_rate": 5.246153846153846e-07, - "loss": 0.334, - "step": 50220 - }, - { - "epoch": 43.53, - "learning_rate": 5.239160839160839e-07, - "loss": 0.3717, - "step": 50230 - }, - { - "epoch": 43.54, - "learning_rate": 5.232167832167832e-07, - "loss": 0.3835, - "step": 50240 - }, - { - "epoch": 43.54, - "learning_rate": 5.225174825174825e-07, - "loss": 0.3446, - "step": 50250 - }, - { - "epoch": 43.55, - "learning_rate": 5.218181818181819e-07, - "loss": 0.3764, - "step": 50260 - }, - { - "epoch": 43.56, - "learning_rate": 5.211188811188811e-07, - "loss": 0.3715, - "step": 50270 - }, - { - "epoch": 43.57, - "learning_rate": 5.204195804195804e-07, - "loss": 0.3868, - "step": 50280 - }, - { - "epoch": 43.58, - "learning_rate": 5.197202797202796e-07, - "loss": 0.3194, - "step": 50290 - }, - { - "epoch": 43.59, - "learning_rate": 5.19020979020979e-07, - "loss": 0.3496, - "step": 50300 - }, - { - "epoch": 43.6, - "learning_rate": 5.183216783216783e-07, - "loss": 0.3352, - "step": 50310 - }, - { - "epoch": 43.6, - "learning_rate": 5.176223776223776e-07, - "loss": 0.3579, - "step": 50320 - }, - { - "epoch": 43.61, - "learning_rate": 5.16923076923077e-07, - "loss": 0.3405, - "step": 50330 - }, - { - "epoch": 43.62, - "learning_rate": 5.162237762237762e-07, - "loss": 0.3587, - "step": 50340 - }, - { - "epoch": 43.63, - "learning_rate": 5.155244755244755e-07, - "loss": 0.3614, - "step": 50350 - }, - { - "epoch": 43.64, - "learning_rate": 5.148251748251748e-07, - "loss": 0.3478, - "step": 50360 - }, - { - "epoch": 43.65, - "learning_rate": 5.141258741258741e-07, - "loss": 0.3754, - "step": 50370 - }, - { - "epoch": 43.66, - "learning_rate": 5.134265734265734e-07, - "loss": 0.3146, - "step": 50380 - }, - { - "epoch": 43.67, - "learning_rate": 5.127272727272727e-07, - "loss": 0.3599, - "step": 50390 - }, - { - "epoch": 43.67, - "learning_rate": 5.12027972027972e-07, - "loss": 0.3302, - "step": 50400 - }, - { - "epoch": 43.68, - "learning_rate": 5.113286713286713e-07, - "loss": 0.3394, - "step": 50410 - }, - { - "epoch": 43.69, - "learning_rate": 5.106293706293706e-07, - "loss": 0.3385, - "step": 50420 - }, - { - "epoch": 43.7, - "learning_rate": 5.099300699300699e-07, - "loss": 0.3213, - "step": 50430 - }, - { - "epoch": 43.71, - "learning_rate": 5.092307692307692e-07, - "loss": 0.3575, - "step": 50440 - }, - { - "epoch": 43.72, - "learning_rate": 5.085314685314686e-07, - "loss": 0.3492, - "step": 50450 - }, - { - "epoch": 43.73, - "learning_rate": 5.078321678321678e-07, - "loss": 0.3904, - "step": 50460 - }, - { - "epoch": 43.73, - "learning_rate": 5.071328671328671e-07, - "loss": 0.388, - "step": 50470 - }, - { - "epoch": 43.74, - "learning_rate": 5.064335664335663e-07, - "loss": 0.4397, - "step": 50480 - }, - { - "epoch": 43.75, - "learning_rate": 5.057342657342657e-07, - "loss": 0.3186, - "step": 50490 - }, - { - "epoch": 43.76, - "learning_rate": 5.05034965034965e-07, - "loss": 0.3315, - "step": 50500 - }, - { - "epoch": 43.77, - "learning_rate": 5.043356643356643e-07, - "loss": 0.3556, - "step": 50510 - }, - { - "epoch": 43.78, - "learning_rate": 5.036363636363636e-07, - "loss": 0.4012, - "step": 50520 - }, - { - "epoch": 43.79, - "learning_rate": 5.02937062937063e-07, - "loss": 0.3227, - "step": 50530 - }, - { - "epoch": 43.8, - "learning_rate": 5.022377622377623e-07, - "loss": 0.3532, - "step": 50540 - }, - { - "epoch": 43.8, - "learning_rate": 5.015384615384614e-07, - "loss": 0.3468, - "step": 50550 - }, - { - "epoch": 43.81, - "learning_rate": 5.008391608391607e-07, - "loss": 0.3401, - "step": 50560 - }, - { - "epoch": 43.82, - "learning_rate": 5.001398601398601e-07, - "loss": 0.3841, - "step": 50570 - }, - { - "epoch": 43.83, - "learning_rate": 4.995104895104895e-07, - "loss": 0.3204, - "step": 50580 - }, - { - "epoch": 43.84, - "learning_rate": 4.988111888111888e-07, - "loss": 0.3945, - "step": 50590 - }, - { - "epoch": 43.85, - "learning_rate": 4.98111888111888e-07, - "loss": 0.3158, - "step": 50600 - }, - { - "epoch": 43.86, - "learning_rate": 4.974125874125874e-07, - "loss": 0.3709, - "step": 50610 - }, - { - "epoch": 43.86, - "learning_rate": 4.967132867132867e-07, - "loss": 0.3594, - "step": 50620 - }, - { - "epoch": 43.87, - "learning_rate": 4.96013986013986e-07, - "loss": 0.2674, - "step": 50630 - }, - { - "epoch": 43.88, - "learning_rate": 4.953146853146853e-07, - "loss": 0.3399, - "step": 50640 - }, - { - "epoch": 43.89, - "learning_rate": 4.946153846153846e-07, - "loss": 0.3651, - "step": 50650 - }, - { - "epoch": 43.9, - "learning_rate": 4.939160839160839e-07, - "loss": 0.3881, - "step": 50660 - }, - { - "epoch": 43.91, - "learning_rate": 4.932167832167831e-07, - "loss": 0.3616, - "step": 50670 - }, - { - "epoch": 43.92, - "learning_rate": 4.925174825174824e-07, - "loss": 0.3515, - "step": 50680 - }, - { - "epoch": 43.93, - "learning_rate": 4.918181818181818e-07, - "loss": 0.383, - "step": 50690 - }, - { - "epoch": 43.93, - "learning_rate": 4.911188811188811e-07, - "loss": 0.3215, - "step": 50700 - }, - { - "epoch": 43.94, - "learning_rate": 4.904195804195804e-07, - "loss": 0.3708, - "step": 50710 - }, - { - "epoch": 43.95, - "learning_rate": 4.897202797202797e-07, - "loss": 0.4286, - "step": 50720 - }, - { - "epoch": 43.96, - "learning_rate": 4.89020979020979e-07, - "loss": 0.4208, - "step": 50730 - }, - { - "epoch": 43.97, - "learning_rate": 4.883216783216784e-07, - "loss": 0.3737, - "step": 50740 - }, - { - "epoch": 43.98, - "learning_rate": 4.876223776223776e-07, - "loss": 0.299, - "step": 50750 - }, - { - "epoch": 43.99, - "learning_rate": 4.869230769230769e-07, - "loss": 0.4187, - "step": 50760 - }, - { - "epoch": 43.99, - "learning_rate": 4.862237762237762e-07, - "loss": 0.3444, - "step": 50770 - }, - { - "epoch": 44.0, - "eval_loss": 0.565770149230957, - "eval_runtime": 137.6557, - "eval_samples_per_second": 3.865, - "eval_steps_per_second": 1.932, - "eval_wer": 0.24130616442758887, - "step": 50776 - }, - { - "epoch": 44.0, - "learning_rate": 4.855244755244755e-07, - "loss": 0.325, - "step": 50780 - }, - { - "epoch": 44.01, - "learning_rate": 4.848251748251748e-07, - "loss": 0.3413, - "step": 50790 - }, - { - "epoch": 44.02, - "learning_rate": 4.841258741258741e-07, - "loss": 0.3148, - "step": 50800 - }, - { - "epoch": 44.03, - "learning_rate": 4.834265734265734e-07, - "loss": 0.4056, - "step": 50810 - }, - { - "epoch": 44.04, - "learning_rate": 4.827272727272727e-07, - "loss": 0.3773, - "step": 50820 - }, - { - "epoch": 44.05, - "learning_rate": 4.82027972027972e-07, - "loss": 0.3485, - "step": 50830 - }, - { - "epoch": 44.06, - "learning_rate": 4.813286713286713e-07, - "loss": 0.3589, - "step": 50840 - }, - { - "epoch": 44.06, - "learning_rate": 4.806293706293706e-07, - "loss": 0.3755, - "step": 50850 - }, - { - "epoch": 44.07, - "learning_rate": 4.799300699300699e-07, - "loss": 0.3676, - "step": 50860 - }, - { - "epoch": 44.08, - "learning_rate": 4.792307692307692e-07, - "loss": 0.3682, - "step": 50870 - }, - { - "epoch": 44.09, - "learning_rate": 4.785314685314686e-07, - "loss": 0.3834, - "step": 50880 - }, - { - "epoch": 44.1, - "learning_rate": 4.778321678321677e-07, - "loss": 0.4024, - "step": 50890 - }, - { - "epoch": 44.11, - "learning_rate": 4.771328671328671e-07, - "loss": 0.3543, - "step": 50900 - }, - { - "epoch": 44.12, - "learning_rate": 4.764335664335664e-07, - "loss": 0.3748, - "step": 50910 - }, - { - "epoch": 44.12, - "learning_rate": 4.757342657342657e-07, - "loss": 0.3427, - "step": 50920 - }, - { - "epoch": 44.13, - "learning_rate": 4.7503496503496504e-07, - "loss": 0.3596, - "step": 50930 - }, - { - "epoch": 44.14, - "learning_rate": 4.7433566433566427e-07, - "loss": 0.3468, - "step": 50940 - }, - { - "epoch": 44.15, - "learning_rate": 4.736363636363636e-07, - "loss": 0.3084, - "step": 50950 - }, - { - "epoch": 44.16, - "learning_rate": 4.7293706293706295e-07, - "loss": 0.3412, - "step": 50960 - }, - { - "epoch": 44.17, - "learning_rate": 4.7223776223776223e-07, - "loss": 0.3512, - "step": 50970 - }, - { - "epoch": 44.18, - "learning_rate": 4.715384615384615e-07, - "loss": 0.3601, - "step": 50980 - }, - { - "epoch": 44.19, - "learning_rate": 4.708391608391608e-07, - "loss": 0.4109, - "step": 50990 - }, - { - "epoch": 44.19, - "learning_rate": 4.7013986013986014e-07, - "loss": 0.3168, - "step": 51000 - }, - { - "epoch": 44.2, - "learning_rate": 4.6944055944055943e-07, - "loss": 0.3551, - "step": 51010 - }, - { - "epoch": 44.21, - "learning_rate": 4.687412587412587e-07, - "loss": 0.3557, - "step": 51020 - }, - { - "epoch": 44.22, - "learning_rate": 4.68041958041958e-07, - "loss": 0.3283, - "step": 51030 - }, - { - "epoch": 44.23, - "learning_rate": 4.6734265734265734e-07, - "loss": 0.3595, - "step": 51040 - }, - { - "epoch": 44.24, - "learning_rate": 4.666433566433566e-07, - "loss": 0.3826, - "step": 51050 - }, - { - "epoch": 44.25, - "learning_rate": 4.6594405594405596e-07, - "loss": 0.3451, - "step": 51060 - }, - { - "epoch": 44.25, - "learning_rate": 4.652447552447552e-07, - "loss": 0.3752, - "step": 51070 - }, - { - "epoch": 44.26, - "learning_rate": 4.6454545454545453e-07, - "loss": 0.3869, - "step": 51080 - }, - { - "epoch": 44.27, - "learning_rate": 4.638461538461538e-07, - "loss": 0.3548, - "step": 51090 - }, - { - "epoch": 44.28, - "learning_rate": 4.6314685314685315e-07, - "loss": 0.3236, - "step": 51100 - }, - { - "epoch": 44.29, - "learning_rate": 4.624475524475524e-07, - "loss": 0.3261, - "step": 51110 - }, - { - "epoch": 44.3, - "learning_rate": 4.617482517482517e-07, - "loss": 0.342, - "step": 51120 - }, - { - "epoch": 44.31, - "learning_rate": 4.61048951048951e-07, - "loss": 0.3196, - "step": 51130 - }, - { - "epoch": 44.32, - "learning_rate": 4.6034965034965035e-07, - "loss": 0.319, - "step": 51140 - }, - { - "epoch": 44.32, - "learning_rate": 4.5965034965034963e-07, - "loss": 0.3924, - "step": 51150 - }, - { - "epoch": 44.33, - "learning_rate": 4.589510489510489e-07, - "loss": 0.3715, - "step": 51160 - }, - { - "epoch": 44.34, - "learning_rate": 4.582517482517482e-07, - "loss": 0.3719, - "step": 51170 - }, - { - "epoch": 44.35, - "learning_rate": 4.5755244755244754e-07, - "loss": 0.3456, - "step": 51180 - }, - { - "epoch": 44.36, - "learning_rate": 4.568531468531469e-07, - "loss": 0.3956, - "step": 51190 - }, - { - "epoch": 44.37, - "learning_rate": 4.561538461538461e-07, - "loss": 0.3757, - "step": 51200 - }, - { - "epoch": 44.38, - "learning_rate": 4.5545454545454545e-07, - "loss": 0.3573, - "step": 51210 - }, - { - "epoch": 44.38, - "learning_rate": 4.5475524475524473e-07, - "loss": 0.362, - "step": 51220 - }, - { - "epoch": 44.39, - "learning_rate": 4.5405594405594407e-07, - "loss": 0.4066, - "step": 51230 - }, - { - "epoch": 44.4, - "learning_rate": 4.533566433566433e-07, - "loss": 0.386, - "step": 51240 - }, - { - "epoch": 44.41, - "learning_rate": 4.5265734265734264e-07, - "loss": 0.3183, - "step": 51250 - }, - { - "epoch": 44.42, - "learning_rate": 4.5195804195804193e-07, - "loss": 0.3254, - "step": 51260 - }, - { - "epoch": 44.43, - "learning_rate": 4.5125874125874127e-07, - "loss": 0.3963, - "step": 51270 - }, - { - "epoch": 44.44, - "learning_rate": 4.5055944055944055e-07, - "loss": 0.2913, - "step": 51280 - }, - { - "epoch": 44.45, - "learning_rate": 4.4986013986013984e-07, - "loss": 0.3316, - "step": 51290 - }, - { - "epoch": 44.45, - "learning_rate": 4.491608391608391e-07, - "loss": 0.3397, - "step": 51300 - }, - { - "epoch": 44.46, - "learning_rate": 4.4846153846153846e-07, - "loss": 0.3333, - "step": 51310 - }, - { - "epoch": 44.47, - "learning_rate": 4.4776223776223775e-07, - "loss": 0.4175, - "step": 51320 - }, - { - "epoch": 44.48, - "learning_rate": 4.4706293706293703e-07, - "loss": 0.3613, - "step": 51330 - }, - { - "epoch": 44.49, - "learning_rate": 4.463636363636363e-07, - "loss": 0.3953, - "step": 51340 - }, - { - "epoch": 44.5, - "learning_rate": 4.4566433566433565e-07, - "loss": 0.3269, - "step": 51350 - }, - { - "epoch": 44.51, - "learning_rate": 4.4496503496503494e-07, - "loss": 0.3545, - "step": 51360 - }, - { - "epoch": 44.51, - "learning_rate": 4.442657342657343e-07, - "loss": 0.4028, - "step": 51370 - }, - { - "epoch": 44.52, - "learning_rate": 4.435664335664335e-07, - "loss": 0.4086, - "step": 51380 - }, - { - "epoch": 44.53, - "learning_rate": 4.4286713286713285e-07, - "loss": 0.3323, - "step": 51390 - }, - { - "epoch": 44.54, - "learning_rate": 4.4216783216783213e-07, - "loss": 0.3906, - "step": 51400 - }, - { - "epoch": 44.55, - "learning_rate": 4.4146853146853147e-07, - "loss": 0.3551, - "step": 51410 - }, - { - "epoch": 44.56, - "learning_rate": 4.407692307692307e-07, - "loss": 0.3603, - "step": 51420 - }, - { - "epoch": 44.57, - "learning_rate": 4.4006993006993004e-07, - "loss": 0.2797, - "step": 51430 - }, - { - "epoch": 44.58, - "learning_rate": 4.393706293706294e-07, - "loss": 0.3186, - "step": 51440 - }, - { - "epoch": 44.58, - "learning_rate": 4.3867132867132866e-07, - "loss": 0.3282, - "step": 51450 - }, - { - "epoch": 44.59, - "learning_rate": 4.37972027972028e-07, - "loss": 0.3359, - "step": 51460 - }, - { - "epoch": 44.6, - "learning_rate": 4.3727272727272723e-07, - "loss": 0.3761, - "step": 51470 - }, - { - "epoch": 44.61, - "learning_rate": 4.3657342657342657e-07, - "loss": 0.3203, - "step": 51480 - }, - { - "epoch": 44.62, - "learning_rate": 4.3587412587412586e-07, - "loss": 0.366, - "step": 51490 - }, - { - "epoch": 44.63, - "learning_rate": 4.351748251748252e-07, - "loss": 0.28, - "step": 51500 - }, - { - "epoch": 44.64, - "learning_rate": 4.3447552447552443e-07, - "loss": 0.3208, - "step": 51510 - }, - { - "epoch": 44.64, - "learning_rate": 4.3377622377622377e-07, - "loss": 0.3376, - "step": 51520 - }, - { - "epoch": 44.65, - "learning_rate": 4.3307692307692305e-07, - "loss": 0.3777, - "step": 51530 - }, - { - "epoch": 44.66, - "learning_rate": 4.323776223776224e-07, - "loss": 0.3316, - "step": 51540 - }, - { - "epoch": 44.67, - "learning_rate": 4.316783216783216e-07, - "loss": 0.3205, - "step": 51550 - }, - { - "epoch": 44.68, - "learning_rate": 4.3097902097902096e-07, - "loss": 0.3252, - "step": 51560 - }, - { - "epoch": 44.69, - "learning_rate": 4.3027972027972025e-07, - "loss": 0.3657, - "step": 51570 - }, - { - "epoch": 44.7, - "learning_rate": 4.295804195804196e-07, - "loss": 0.361, - "step": 51580 - }, - { - "epoch": 44.71, - "learning_rate": 4.2888111888111887e-07, - "loss": 0.4195, - "step": 51590 - }, - { - "epoch": 44.71, - "learning_rate": 4.2818181818181815e-07, - "loss": 0.306, - "step": 51600 - }, - { - "epoch": 44.72, - "learning_rate": 4.2748251748251744e-07, - "loss": 0.3697, - "step": 51610 - }, - { - "epoch": 44.73, - "learning_rate": 4.267832167832168e-07, - "loss": 0.3762, - "step": 51620 - }, - { - "epoch": 44.74, - "learning_rate": 4.2608391608391606e-07, - "loss": 0.4058, - "step": 51630 - }, - { - "epoch": 44.75, - "learning_rate": 4.2538461538461535e-07, - "loss": 0.3401, - "step": 51640 - }, - { - "epoch": 44.76, - "learning_rate": 4.2468531468531463e-07, - "loss": 0.3201, - "step": 51650 - }, - { - "epoch": 44.77, - "learning_rate": 4.2398601398601397e-07, - "loss": 0.3638, - "step": 51660 - }, - { - "epoch": 44.77, - "learning_rate": 4.2328671328671326e-07, - "loss": 0.3522, - "step": 51670 - }, - { - "epoch": 44.78, - "learning_rate": 4.225874125874126e-07, - "loss": 0.361, - "step": 51680 - }, - { - "epoch": 44.79, - "learning_rate": 4.218881118881119e-07, - "loss": 0.3551, - "step": 51690 - }, - { - "epoch": 44.8, - "learning_rate": 4.2118881118881116e-07, - "loss": 0.3629, - "step": 51700 - }, - { - "epoch": 44.81, - "learning_rate": 4.204895104895105e-07, - "loss": 0.3809, - "step": 51710 - }, - { - "epoch": 44.82, - "learning_rate": 4.197902097902098e-07, - "loss": 0.4204, - "step": 51720 - }, - { - "epoch": 44.83, - "learning_rate": 4.1909090909090907e-07, - "loss": 0.3504, - "step": 51730 - }, - { - "epoch": 44.83, - "learning_rate": 4.1839160839160836e-07, - "loss": 0.321, - "step": 51740 - }, - { - "epoch": 44.84, - "learning_rate": 4.176923076923077e-07, - "loss": 0.3443, - "step": 51750 - }, - { - "epoch": 44.85, - "learning_rate": 4.16993006993007e-07, - "loss": 0.3294, - "step": 51760 - }, - { - "epoch": 44.86, - "learning_rate": 4.1629370629370627e-07, - "loss": 0.3754, - "step": 51770 - }, - { - "epoch": 44.87, - "learning_rate": 4.1559440559440555e-07, - "loss": 0.359, - "step": 51780 - }, - { - "epoch": 44.88, - "learning_rate": 4.148951048951049e-07, - "loss": 0.3334, - "step": 51790 - }, - { - "epoch": 44.89, - "learning_rate": 4.141958041958042e-07, - "loss": 0.3306, - "step": 51800 - }, - { - "epoch": 44.9, - "learning_rate": 4.134965034965035e-07, - "loss": 0.3905, - "step": 51810 - }, - { - "epoch": 44.9, - "learning_rate": 4.1279720279720275e-07, - "loss": 0.3473, - "step": 51820 - }, - { - "epoch": 44.91, - "learning_rate": 4.120979020979021e-07, - "loss": 0.3089, - "step": 51830 - }, - { - "epoch": 44.92, - "learning_rate": 4.1139860139860137e-07, - "loss": 0.3684, - "step": 51840 - }, - { - "epoch": 44.93, - "learning_rate": 4.106993006993007e-07, - "loss": 0.343, - "step": 51850 - }, - { - "epoch": 44.94, - "learning_rate": 4.0999999999999994e-07, - "loss": 0.3692, - "step": 51860 - }, - { - "epoch": 44.95, - "learning_rate": 4.093006993006993e-07, - "loss": 0.388, - "step": 51870 - }, - { - "epoch": 44.96, - "learning_rate": 4.0860139860139856e-07, - "loss": 0.3411, - "step": 51880 - }, - { - "epoch": 44.96, - "learning_rate": 4.079020979020979e-07, - "loss": 0.3736, - "step": 51890 - }, - { - "epoch": 44.97, - "learning_rate": 4.072027972027972e-07, - "loss": 0.3311, - "step": 51900 - }, - { - "epoch": 44.98, - "learning_rate": 4.0650349650349647e-07, - "loss": 0.368, - "step": 51910 - }, - { - "epoch": 44.99, - "learning_rate": 4.0580419580419576e-07, - "loss": 0.3885, - "step": 51920 - }, - { - "epoch": 45.0, - "learning_rate": 4.051048951048951e-07, - "loss": 0.3152, - "step": 51930 - }, - { - "epoch": 45.0, - "eval_loss": 0.5559401512145996, - "eval_runtime": 138.3022, - "eval_samples_per_second": 3.847, - "eval_steps_per_second": 1.923, - "eval_wer": 0.24021340875490133, - "step": 51930 - }, - { - "epoch": 45.01, - "learning_rate": 4.0440559440559443e-07, - "loss": 0.3634, - "step": 51940 - }, - { - "epoch": 45.02, - "learning_rate": 4.0370629370629366e-07, - "loss": 0.3808, - "step": 51950 - }, - { - "epoch": 45.03, - "learning_rate": 4.03006993006993e-07, - "loss": 0.2829, - "step": 51960 - }, - { - "epoch": 45.03, - "learning_rate": 4.023076923076923e-07, - "loss": 0.3541, - "step": 51970 - }, - { - "epoch": 45.04, - "learning_rate": 4.016083916083916e-07, - "loss": 0.2983, - "step": 51980 - }, - { - "epoch": 45.05, - "learning_rate": 4.0090909090909086e-07, - "loss": 0.3205, - "step": 51990 - }, - { - "epoch": 45.06, - "learning_rate": 4.002097902097902e-07, - "loss": 0.3651, - "step": 52000 - }, - { - "epoch": 45.07, - "learning_rate": 3.995104895104895e-07, - "loss": 0.3451, - "step": 52010 - }, - { - "epoch": 45.08, - "learning_rate": 3.988111888111888e-07, - "loss": 0.3793, - "step": 52020 - }, - { - "epoch": 45.09, - "learning_rate": 3.981118881118881e-07, - "loss": 0.3988, - "step": 52030 - }, - { - "epoch": 45.1, - "learning_rate": 3.974125874125874e-07, - "loss": 0.3919, - "step": 52040 - }, - { - "epoch": 45.1, - "learning_rate": 3.967132867132867e-07, - "loss": 0.3249, - "step": 52050 - }, - { - "epoch": 45.11, - "learning_rate": 3.96013986013986e-07, - "loss": 0.3432, - "step": 52060 - }, - { - "epoch": 45.12, - "learning_rate": 3.953146853146853e-07, - "loss": 0.3442, - "step": 52070 - }, - { - "epoch": 45.13, - "learning_rate": 3.946153846153846e-07, - "loss": 0.3305, - "step": 52080 - }, - { - "epoch": 45.14, - "learning_rate": 3.9391608391608387e-07, - "loss": 0.3412, - "step": 52090 - }, - { - "epoch": 45.15, - "learning_rate": 3.932167832167832e-07, - "loss": 0.3864, - "step": 52100 - }, - { - "epoch": 45.16, - "learning_rate": 3.925174825174825e-07, - "loss": 0.3563, - "step": 52110 - }, - { - "epoch": 45.16, - "learning_rate": 3.9181818181818183e-07, - "loss": 0.3579, - "step": 52120 - }, - { - "epoch": 45.17, - "learning_rate": 3.9111888111888106e-07, - "loss": 0.416, - "step": 52130 - }, - { - "epoch": 45.18, - "learning_rate": 3.904195804195804e-07, - "loss": 0.3637, - "step": 52140 - }, - { - "epoch": 45.19, - "learning_rate": 3.897202797202797e-07, - "loss": 0.3377, - "step": 52150 - }, - { - "epoch": 45.2, - "learning_rate": 3.89020979020979e-07, - "loss": 0.3395, - "step": 52160 - }, - { - "epoch": 45.21, - "learning_rate": 3.8832167832167826e-07, - "loss": 0.3114, - "step": 52170 - }, - { - "epoch": 45.22, - "learning_rate": 3.876223776223776e-07, - "loss": 0.3728, - "step": 52180 - }, - { - "epoch": 45.23, - "learning_rate": 3.8692307692307693e-07, - "loss": 0.348, - "step": 52190 - }, - { - "epoch": 45.23, - "learning_rate": 3.862237762237762e-07, - "loss": 0.3457, - "step": 52200 - }, - { - "epoch": 45.24, - "learning_rate": 3.8552447552447556e-07, - "loss": 0.3347, - "step": 52210 - }, - { - "epoch": 45.25, - "learning_rate": 3.848251748251748e-07, - "loss": 0.3706, - "step": 52220 - }, - { - "epoch": 45.26, - "learning_rate": 3.841258741258741e-07, - "loss": 0.3942, - "step": 52230 - }, - { - "epoch": 45.27, - "learning_rate": 3.834265734265734e-07, - "loss": 0.3266, - "step": 52240 - }, - { - "epoch": 45.28, - "learning_rate": 3.8272727272727275e-07, - "loss": 0.3274, - "step": 52250 - }, - { - "epoch": 45.29, - "learning_rate": 3.82027972027972e-07, - "loss": 0.2802, - "step": 52260 - }, - { - "epoch": 45.29, - "learning_rate": 3.813286713286713e-07, - "loss": 0.3797, - "step": 52270 - }, - { - "epoch": 45.3, - "learning_rate": 3.806293706293706e-07, - "loss": 0.3517, - "step": 52280 - }, - { - "epoch": 45.31, - "learning_rate": 3.7993006993006994e-07, - "loss": 0.3494, - "step": 52290 - }, - { - "epoch": 45.32, - "learning_rate": 3.792307692307692e-07, - "loss": 0.3575, - "step": 52300 - }, - { - "epoch": 45.33, - "learning_rate": 3.785314685314685e-07, - "loss": 0.3258, - "step": 52310 - }, - { - "epoch": 45.34, - "learning_rate": 3.778321678321678e-07, - "loss": 0.361, - "step": 52320 - }, - { - "epoch": 45.35, - "learning_rate": 3.7713286713286714e-07, - "loss": 0.3957, - "step": 52330 - }, - { - "epoch": 45.36, - "learning_rate": 3.764335664335664e-07, - "loss": 0.3734, - "step": 52340 - }, - { - "epoch": 45.36, - "learning_rate": 3.757342657342657e-07, - "loss": 0.3217, - "step": 52350 - }, - { - "epoch": 45.37, - "learning_rate": 3.75034965034965e-07, - "loss": 0.352, - "step": 52360 - }, - { - "epoch": 45.38, - "learning_rate": 3.7433566433566433e-07, - "loss": 0.3292, - "step": 52370 - }, - { - "epoch": 45.39, - "learning_rate": 3.736363636363636e-07, - "loss": 0.3959, - "step": 52380 - }, - { - "epoch": 45.4, - "learning_rate": 3.729370629370629e-07, - "loss": 0.3335, - "step": 52390 - }, - { - "epoch": 45.41, - "learning_rate": 3.722377622377622e-07, - "loss": 0.3569, - "step": 52400 - }, - { - "epoch": 45.42, - "learning_rate": 3.715384615384615e-07, - "loss": 0.3919, - "step": 52410 - }, - { - "epoch": 45.42, - "learning_rate": 3.7083916083916086e-07, - "loss": 0.3862, - "step": 52420 - }, - { - "epoch": 45.43, - "learning_rate": 3.7013986013986015e-07, - "loss": 0.3332, - "step": 52430 - }, - { - "epoch": 45.44, - "learning_rate": 3.6944055944055943e-07, - "loss": 0.348, - "step": 52440 - }, - { - "epoch": 45.45, - "learning_rate": 3.687412587412587e-07, - "loss": 0.3456, - "step": 52450 - }, - { - "epoch": 45.46, - "learning_rate": 3.6804195804195806e-07, - "loss": 0.3297, - "step": 52460 - }, - { - "epoch": 45.47, - "learning_rate": 3.6734265734265734e-07, - "loss": 0.4109, - "step": 52470 - }, - { - "epoch": 45.48, - "learning_rate": 3.666433566433566e-07, - "loss": 0.3729, - "step": 52480 - }, - { - "epoch": 45.49, - "learning_rate": 3.659440559440559e-07, - "loss": 0.3014, - "step": 52490 - }, - { - "epoch": 45.49, - "learning_rate": 3.6524475524475525e-07, - "loss": 0.4247, - "step": 52500 - }, - { - "epoch": 45.5, - "learning_rate": 3.6454545454545453e-07, - "loss": 0.3382, - "step": 52510 - }, - { - "epoch": 45.51, - "learning_rate": 3.638461538461538e-07, - "loss": 0.3732, - "step": 52520 - }, - { - "epoch": 45.52, - "learning_rate": 3.631468531468531e-07, - "loss": 0.3224, - "step": 52530 - }, - { - "epoch": 45.53, - "learning_rate": 3.6244755244755244e-07, - "loss": 0.3809, - "step": 52540 - }, - { - "epoch": 45.54, - "learning_rate": 3.6174825174825173e-07, - "loss": 0.3758, - "step": 52550 - }, - { - "epoch": 45.55, - "learning_rate": 3.6104895104895107e-07, - "loss": 0.3511, - "step": 52560 - }, - { - "epoch": 45.55, - "learning_rate": 3.603496503496503e-07, - "loss": 0.3247, - "step": 52570 - }, - { - "epoch": 45.56, - "learning_rate": 3.5965034965034964e-07, - "loss": 0.4197, - "step": 52580 - }, - { - "epoch": 45.57, - "learning_rate": 3.589510489510489e-07, - "loss": 0.3722, - "step": 52590 - }, - { - "epoch": 45.58, - "learning_rate": 3.5825174825174826e-07, - "loss": 0.3467, - "step": 52600 - }, - { - "epoch": 45.59, - "learning_rate": 3.575524475524475e-07, - "loss": 0.2931, - "step": 52610 - }, - { - "epoch": 45.6, - "learning_rate": 3.5685314685314683e-07, - "loss": 0.391, - "step": 52620 - }, - { - "epoch": 45.61, - "learning_rate": 3.561538461538461e-07, - "loss": 0.3567, - "step": 52630 - }, - { - "epoch": 45.61, - "learning_rate": 3.5545454545454545e-07, - "loss": 0.3436, - "step": 52640 - }, - { - "epoch": 45.62, - "learning_rate": 3.5475524475524474e-07, - "loss": 0.3486, - "step": 52650 - }, - { - "epoch": 45.63, - "learning_rate": 3.54055944055944e-07, - "loss": 0.3513, - "step": 52660 - }, - { - "epoch": 45.64, - "learning_rate": 3.533566433566433e-07, - "loss": 0.3871, - "step": 52670 - }, - { - "epoch": 45.65, - "learning_rate": 3.5265734265734265e-07, - "loss": 0.3758, - "step": 52680 - }, - { - "epoch": 45.66, - "learning_rate": 3.51958041958042e-07, - "loss": 0.3677, - "step": 52690 - }, - { - "epoch": 45.67, - "learning_rate": 3.512587412587412e-07, - "loss": 0.3368, - "step": 52700 - }, - { - "epoch": 45.68, - "learning_rate": 3.5055944055944056e-07, - "loss": 0.3457, - "step": 52710 - }, - { - "epoch": 45.68, - "learning_rate": 3.4986013986013984e-07, - "loss": 0.3342, - "step": 52720 - }, - { - "epoch": 45.69, - "learning_rate": 3.491608391608392e-07, - "loss": 0.3456, - "step": 52730 - }, - { - "epoch": 45.7, - "learning_rate": 3.4846153846153846e-07, - "loss": 0.3281, - "step": 52740 - }, - { - "epoch": 45.71, - "learning_rate": 3.4776223776223775e-07, - "loss": 0.3023, - "step": 52750 - }, - { - "epoch": 45.72, - "learning_rate": 3.4706293706293703e-07, - "loss": 0.4121, - "step": 52760 - }, - { - "epoch": 45.73, - "learning_rate": 3.4636363636363637e-07, - "loss": 0.3656, - "step": 52770 - }, - { - "epoch": 45.74, - "learning_rate": 3.4566433566433566e-07, - "loss": 0.3331, - "step": 52780 - }, - { - "epoch": 45.74, - "learning_rate": 3.4496503496503494e-07, - "loss": 0.3769, - "step": 52790 - }, - { - "epoch": 45.75, - "learning_rate": 3.4426573426573423e-07, - "loss": 0.3901, - "step": 52800 - }, - { - "epoch": 45.76, - "learning_rate": 3.4356643356643357e-07, - "loss": 0.3108, - "step": 52810 - }, - { - "epoch": 45.77, - "learning_rate": 3.4286713286713285e-07, - "loss": 0.3604, - "step": 52820 - }, - { - "epoch": 45.78, - "learning_rate": 3.4216783216783214e-07, - "loss": 0.335, - "step": 52830 - }, - { - "epoch": 45.79, - "learning_rate": 3.414685314685314e-07, - "loss": 0.349, - "step": 52840 - }, - { - "epoch": 45.8, - "learning_rate": 3.4076923076923076e-07, - "loss": 0.3362, - "step": 52850 - }, - { - "epoch": 45.81, - "learning_rate": 3.4006993006993005e-07, - "loss": 0.3089, - "step": 52860 - }, - { - "epoch": 45.81, - "learning_rate": 3.393706293706294e-07, - "loss": 0.3587, - "step": 52870 - }, - { - "epoch": 45.82, - "learning_rate": 3.386713286713286e-07, - "loss": 0.3461, - "step": 52880 - }, - { - "epoch": 45.83, - "learning_rate": 3.3797202797202795e-07, - "loss": 0.3051, - "step": 52890 - }, - { - "epoch": 45.84, - "learning_rate": 3.3727272727272724e-07, - "loss": 0.3519, - "step": 52900 - }, - { - "epoch": 45.85, - "learning_rate": 3.365734265734266e-07, - "loss": 0.3095, - "step": 52910 - }, - { - "epoch": 45.86, - "learning_rate": 3.358741258741258e-07, - "loss": 0.3646, - "step": 52920 - }, - { - "epoch": 45.87, - "learning_rate": 3.3517482517482515e-07, - "loss": 0.3363, - "step": 52930 - }, - { - "epoch": 45.87, - "learning_rate": 3.344755244755245e-07, - "loss": 0.3295, - "step": 52940 - }, - { - "epoch": 45.88, - "learning_rate": 3.3377622377622377e-07, - "loss": 0.3362, - "step": 52950 - }, - { - "epoch": 45.89, - "learning_rate": 3.330769230769231e-07, - "loss": 0.4204, - "step": 52960 - }, - { - "epoch": 45.9, - "learning_rate": 3.3237762237762234e-07, - "loss": 0.3752, - "step": 52970 - }, - { - "epoch": 45.91, - "learning_rate": 3.316783216783217e-07, - "loss": 0.3524, - "step": 52980 - }, - { - "epoch": 45.92, - "learning_rate": 3.3097902097902096e-07, - "loss": 0.3185, - "step": 52990 - }, - { - "epoch": 45.93, - "learning_rate": 3.302797202797203e-07, - "loss": 0.3749, - "step": 53000 - }, - { - "epoch": 45.94, - "learning_rate": 3.2958041958041954e-07, - "loss": 0.3107, - "step": 53010 - }, - { - "epoch": 45.94, - "learning_rate": 3.2888111888111887e-07, - "loss": 0.3935, - "step": 53020 - }, - { - "epoch": 45.95, - "learning_rate": 3.2818181818181816e-07, - "loss": 0.3288, - "step": 53030 - }, - { - "epoch": 45.96, - "learning_rate": 3.274825174825175e-07, - "loss": 0.3549, - "step": 53040 - }, - { - "epoch": 45.97, - "learning_rate": 3.2678321678321673e-07, - "loss": 0.3727, - "step": 53050 - }, - { - "epoch": 45.98, - "learning_rate": 3.2608391608391607e-07, - "loss": 0.3913, - "step": 53060 - }, - { - "epoch": 45.99, - "learning_rate": 3.2538461538461535e-07, - "loss": 0.3895, - "step": 53070 - }, - { - "epoch": 46.0, - "learning_rate": 3.246853146853147e-07, - "loss": 0.4, - "step": 53080 - }, - { - "epoch": 46.0, - "eval_loss": 0.5598962903022766, - "eval_runtime": 136.728, - "eval_samples_per_second": 3.891, - "eval_steps_per_second": 1.945, - "eval_wer": 0.24291315806389407, - "step": 53084 - }, - { - "epoch": 46.01, - "learning_rate": 3.23986013986014e-07, - "loss": 0.338, - "step": 53090 - }, - { - "epoch": 46.01, - "learning_rate": 3.2328671328671326e-07, - "loss": 0.3319, - "step": 53100 - }, - { - "epoch": 46.02, - "learning_rate": 3.2258741258741255e-07, - "loss": 0.361, - "step": 53110 - }, - { - "epoch": 46.03, - "learning_rate": 3.218881118881119e-07, - "loss": 0.3428, - "step": 53120 - }, - { - "epoch": 46.04, - "learning_rate": 3.2118881118881117e-07, - "loss": 0.3781, - "step": 53130 - }, - { - "epoch": 46.05, - "learning_rate": 3.2048951048951045e-07, - "loss": 0.3949, - "step": 53140 - }, - { - "epoch": 46.06, - "learning_rate": 3.1979020979020974e-07, - "loss": 0.3512, - "step": 53150 - }, - { - "epoch": 46.07, - "learning_rate": 3.190909090909091e-07, - "loss": 0.3601, - "step": 53160 - }, - { - "epoch": 46.07, - "learning_rate": 3.183916083916084e-07, - "loss": 0.3801, - "step": 53170 - }, - { - "epoch": 46.08, - "learning_rate": 3.176923076923077e-07, - "loss": 0.3381, - "step": 53180 - }, - { - "epoch": 46.09, - "learning_rate": 3.16993006993007e-07, - "loss": 0.3352, - "step": 53190 - }, - { - "epoch": 46.1, - "learning_rate": 3.1629370629370627e-07, - "loss": 0.3853, - "step": 53200 - }, - { - "epoch": 46.11, - "learning_rate": 3.155944055944056e-07, - "loss": 0.3489, - "step": 53210 - }, - { - "epoch": 46.12, - "learning_rate": 3.148951048951049e-07, - "loss": 0.3868, - "step": 53220 - }, - { - "epoch": 46.13, - "learning_rate": 3.141958041958042e-07, - "loss": 0.293, - "step": 53230 - }, - { - "epoch": 46.14, - "learning_rate": 3.1349650349650346e-07, - "loss": 0.3221, - "step": 53240 - }, - { - "epoch": 46.14, - "learning_rate": 3.127972027972028e-07, - "loss": 0.3962, - "step": 53250 - }, - { - "epoch": 46.15, - "learning_rate": 3.120979020979021e-07, - "loss": 0.3337, - "step": 53260 - }, - { - "epoch": 46.16, - "learning_rate": 3.1139860139860137e-07, - "loss": 0.3624, - "step": 53270 - }, - { - "epoch": 46.17, - "learning_rate": 3.1069930069930066e-07, - "loss": 0.3983, - "step": 53280 - }, - { - "epoch": 46.18, - "learning_rate": 3.1e-07, - "loss": 0.3618, - "step": 53290 - }, - { - "epoch": 46.19, - "learning_rate": 3.093006993006993e-07, - "loss": 0.3796, - "step": 53300 - }, - { - "epoch": 46.2, - "learning_rate": 3.086013986013986e-07, - "loss": 0.3536, - "step": 53310 - }, - { - "epoch": 46.2, - "learning_rate": 3.0790209790209785e-07, - "loss": 0.362, - "step": 53320 - }, - { - "epoch": 46.21, - "learning_rate": 3.072027972027972e-07, - "loss": 0.3184, - "step": 53330 - }, - { - "epoch": 46.22, - "learning_rate": 3.065034965034965e-07, - "loss": 0.3803, - "step": 53340 - }, - { - "epoch": 46.23, - "learning_rate": 3.058041958041958e-07, - "loss": 0.3361, - "step": 53350 - }, - { - "epoch": 46.24, - "learning_rate": 3.0510489510489505e-07, - "loss": 0.3337, - "step": 53360 - }, - { - "epoch": 46.25, - "learning_rate": 3.044055944055944e-07, - "loss": 0.3476, - "step": 53370 - }, - { - "epoch": 46.26, - "learning_rate": 3.0370629370629367e-07, - "loss": 0.3582, - "step": 53380 - }, - { - "epoch": 46.27, - "learning_rate": 3.03006993006993e-07, - "loss": 0.3691, - "step": 53390 - }, - { - "epoch": 46.27, - "learning_rate": 3.0230769230769235e-07, - "loss": 0.3526, - "step": 53400 - }, - { - "epoch": 46.28, - "learning_rate": 3.016083916083916e-07, - "loss": 0.3684, - "step": 53410 - }, - { - "epoch": 46.29, - "learning_rate": 3.009090909090909e-07, - "loss": 0.4539, - "step": 53420 - }, - { - "epoch": 46.3, - "learning_rate": 3.002097902097902e-07, - "loss": 0.3908, - "step": 53430 - }, - { - "epoch": 46.31, - "learning_rate": 2.9951048951048954e-07, - "loss": 0.3204, - "step": 53440 - }, - { - "epoch": 46.32, - "learning_rate": 2.9881118881118877e-07, - "loss": 0.3961, - "step": 53450 - }, - { - "epoch": 46.33, - "learning_rate": 2.981118881118881e-07, - "loss": 0.335, - "step": 53460 - }, - { - "epoch": 46.33, - "learning_rate": 2.974125874125874e-07, - "loss": 0.374, - "step": 53470 - }, - { - "epoch": 46.34, - "learning_rate": 2.9671328671328673e-07, - "loss": 0.449, - "step": 53480 - }, - { - "epoch": 46.35, - "learning_rate": 2.96013986013986e-07, - "loss": 0.3361, - "step": 53490 - }, - { - "epoch": 46.36, - "learning_rate": 2.953146853146853e-07, - "loss": 0.3499, - "step": 53500 - }, - { - "epoch": 46.37, - "learning_rate": 2.946153846153846e-07, - "loss": 0.3204, - "step": 53510 - }, - { - "epoch": 46.38, - "learning_rate": 2.939160839160839e-07, - "loss": 0.3682, - "step": 53520 - }, - { - "epoch": 46.39, - "learning_rate": 2.932167832167832e-07, - "loss": 0.3741, - "step": 53530 - }, - { - "epoch": 46.39, - "learning_rate": 2.925174825174825e-07, - "loss": 0.3433, - "step": 53540 - }, - { - "epoch": 46.4, - "learning_rate": 2.918181818181818e-07, - "loss": 0.3687, - "step": 53550 - }, - { - "epoch": 46.41, - "learning_rate": 2.911188811188811e-07, - "loss": 0.319, - "step": 53560 - }, - { - "epoch": 46.42, - "learning_rate": 2.904195804195804e-07, - "loss": 0.3686, - "step": 53570 - }, - { - "epoch": 46.43, - "learning_rate": 2.897202797202797e-07, - "loss": 0.3313, - "step": 53580 - }, - { - "epoch": 46.44, - "learning_rate": 2.89020979020979e-07, - "loss": 0.3729, - "step": 53590 - }, - { - "epoch": 46.45, - "learning_rate": 2.883216783216783e-07, - "loss": 0.4025, - "step": 53600 - }, - { - "epoch": 46.46, - "learning_rate": 2.876223776223776e-07, - "loss": 0.2871, - "step": 53610 - }, - { - "epoch": 46.46, - "learning_rate": 2.8692307692307694e-07, - "loss": 0.3758, - "step": 53620 - }, - { - "epoch": 46.47, - "learning_rate": 2.8622377622377617e-07, - "loss": 0.3482, - "step": 53630 - }, - { - "epoch": 46.48, - "learning_rate": 2.855244755244755e-07, - "loss": 0.3169, - "step": 53640 - }, - { - "epoch": 46.49, - "learning_rate": 2.848251748251748e-07, - "loss": 0.3718, - "step": 53650 - }, - { - "epoch": 46.5, - "learning_rate": 2.8412587412587413e-07, - "loss": 0.2951, - "step": 53660 - }, - { - "epoch": 46.51, - "learning_rate": 2.834265734265734e-07, - "loss": 0.3914, - "step": 53670 - }, - { - "epoch": 46.52, - "learning_rate": 2.827272727272727e-07, - "loss": 0.3822, - "step": 53680 - }, - { - "epoch": 46.52, - "learning_rate": 2.8202797202797204e-07, - "loss": 0.3789, - "step": 53690 - }, - { - "epoch": 46.53, - "learning_rate": 2.813286713286713e-07, - "loss": 0.3486, - "step": 53700 - }, - { - "epoch": 46.54, - "learning_rate": 2.8062937062937066e-07, - "loss": 0.3458, - "step": 53710 - }, - { - "epoch": 46.55, - "learning_rate": 2.799300699300699e-07, - "loss": 0.3958, - "step": 53720 - }, - { - "epoch": 46.56, - "learning_rate": 2.7923076923076923e-07, - "loss": 0.3574, - "step": 53730 - }, - { - "epoch": 46.57, - "learning_rate": 2.785314685314685e-07, - "loss": 0.3624, - "step": 53740 - }, - { - "epoch": 46.58, - "learning_rate": 2.7783216783216786e-07, - "loss": 0.3705, - "step": 53750 - }, - { - "epoch": 46.59, - "learning_rate": 2.771328671328671e-07, - "loss": 0.3209, - "step": 53760 - }, - { - "epoch": 46.59, - "learning_rate": 2.764335664335664e-07, - "loss": 0.3529, - "step": 53770 - }, - { - "epoch": 46.6, - "learning_rate": 2.757342657342657e-07, - "loss": 0.3359, - "step": 53780 - }, - { - "epoch": 46.61, - "learning_rate": 2.7503496503496505e-07, - "loss": 0.3595, - "step": 53790 - }, - { - "epoch": 46.62, - "learning_rate": 2.743356643356643e-07, - "loss": 0.3597, - "step": 53800 - }, - { - "epoch": 46.63, - "learning_rate": 2.736363636363636e-07, - "loss": 0.3038, - "step": 53810 - }, - { - "epoch": 46.64, - "learning_rate": 2.729370629370629e-07, - "loss": 0.3261, - "step": 53820 - }, - { - "epoch": 46.65, - "learning_rate": 2.7223776223776224e-07, - "loss": 0.3323, - "step": 53830 - }, - { - "epoch": 46.65, - "learning_rate": 2.7153846153846153e-07, - "loss": 0.3983, - "step": 53840 - }, - { - "epoch": 46.66, - "learning_rate": 2.708391608391608e-07, - "loss": 0.373, - "step": 53850 - }, - { - "epoch": 46.67, - "learning_rate": 2.701398601398601e-07, - "loss": 0.3463, - "step": 53860 - }, - { - "epoch": 46.68, - "learning_rate": 2.6944055944055944e-07, - "loss": 0.3492, - "step": 53870 - }, - { - "epoch": 46.69, - "learning_rate": 2.687412587412587e-07, - "loss": 0.3555, - "step": 53880 - }, - { - "epoch": 46.7, - "learning_rate": 2.68041958041958e-07, - "loss": 0.3306, - "step": 53890 - }, - { - "epoch": 46.71, - "learning_rate": 2.673426573426573e-07, - "loss": 0.3866, - "step": 53900 - }, - { - "epoch": 46.72, - "learning_rate": 2.6664335664335663e-07, - "loss": 0.4149, - "step": 53910 - }, - { - "epoch": 46.72, - "learning_rate": 2.6594405594405597e-07, - "loss": 0.4307, - "step": 53920 - }, - { - "epoch": 46.73, - "learning_rate": 2.6524475524475525e-07, - "loss": 0.3798, - "step": 53930 - }, - { - "epoch": 46.74, - "learning_rate": 2.6454545454545454e-07, - "loss": 0.385, - "step": 53940 - }, - { - "epoch": 46.75, - "learning_rate": 2.638461538461538e-07, - "loss": 0.3675, - "step": 53950 - }, - { - "epoch": 46.76, - "learning_rate": 2.6314685314685316e-07, - "loss": 0.3411, - "step": 53960 - }, - { - "epoch": 46.77, - "learning_rate": 2.6244755244755245e-07, - "loss": 0.3486, - "step": 53970 - }, - { - "epoch": 46.78, - "learning_rate": 2.6174825174825173e-07, - "loss": 0.2884, - "step": 53980 - }, - { - "epoch": 46.78, - "learning_rate": 2.61048951048951e-07, - "loss": 0.3276, - "step": 53990 - }, - { - "epoch": 46.79, - "learning_rate": 2.6034965034965036e-07, - "loss": 0.3774, - "step": 54000 - }, - { - "epoch": 46.8, - "learning_rate": 2.5965034965034964e-07, - "loss": 0.3754, - "step": 54010 - }, - { - "epoch": 46.81, - "learning_rate": 2.58951048951049e-07, - "loss": 0.3675, - "step": 54020 - }, - { - "epoch": 46.82, - "learning_rate": 2.582517482517482e-07, - "loss": 0.3309, - "step": 54030 - }, - { - "epoch": 46.83, - "learning_rate": 2.5755244755244755e-07, - "loss": 0.3408, - "step": 54040 - }, - { - "epoch": 46.84, - "learning_rate": 2.5685314685314684e-07, - "loss": 0.334, - "step": 54050 - }, - { - "epoch": 46.85, - "learning_rate": 2.5615384615384617e-07, - "loss": 0.3203, - "step": 54060 - }, - { - "epoch": 46.85, - "learning_rate": 2.554545454545454e-07, - "loss": 0.3555, - "step": 54070 - }, - { - "epoch": 46.86, - "learning_rate": 2.5475524475524474e-07, - "loss": 0.366, - "step": 54080 - }, - { - "epoch": 46.87, - "learning_rate": 2.5405594405594403e-07, - "loss": 0.3755, - "step": 54090 - }, - { - "epoch": 46.88, - "learning_rate": 2.5335664335664337e-07, - "loss": 0.3058, - "step": 54100 - }, - { - "epoch": 46.89, - "learning_rate": 2.526573426573426e-07, - "loss": 0.3177, - "step": 54110 - }, - { - "epoch": 46.9, - "learning_rate": 2.5195804195804194e-07, - "loss": 0.3584, - "step": 54120 - }, - { - "epoch": 46.91, - "learning_rate": 2.512587412587412e-07, - "loss": 0.3873, - "step": 54130 - }, - { - "epoch": 46.91, - "learning_rate": 2.5055944055944056e-07, - "loss": 0.3423, - "step": 54140 - }, - { - "epoch": 46.92, - "learning_rate": 2.4986013986013985e-07, - "loss": 0.3947, - "step": 54150 - }, - { - "epoch": 46.93, - "learning_rate": 2.491608391608392e-07, - "loss": 0.288, - "step": 54160 - }, - { - "epoch": 46.94, - "learning_rate": 2.4846153846153847e-07, - "loss": 0.3879, - "step": 54170 - }, - { - "epoch": 46.95, - "learning_rate": 2.4776223776223775e-07, - "loss": 0.3688, - "step": 54180 - }, - { - "epoch": 46.96, - "learning_rate": 2.4706293706293704e-07, - "loss": 0.2977, - "step": 54190 - }, - { - "epoch": 46.97, - "learning_rate": 2.463636363636364e-07, - "loss": 0.3618, - "step": 54200 - }, - { - "epoch": 46.98, - "learning_rate": 2.4566433566433566e-07, - "loss": 0.3247, - "step": 54210 - }, - { - "epoch": 46.98, - "learning_rate": 2.4496503496503495e-07, - "loss": 0.3606, - "step": 54220 - }, - { - "epoch": 46.99, - "learning_rate": 2.4426573426573423e-07, - "loss": 0.4154, - "step": 54230 - }, - { - "epoch": 47.0, - "eval_loss": 0.5568397641181946, - "eval_runtime": 137.629, - "eval_samples_per_second": 3.865, - "eval_steps_per_second": 1.933, - "eval_wer": 0.24304171755479848, - "step": 54238 - }, - { - "epoch": 47.0, - "learning_rate": 2.4356643356643357e-07, - "loss": 0.3797, - "step": 54240 - }, - { - "epoch": 47.01, - "learning_rate": 2.4286713286713286e-07, - "loss": 0.3366, - "step": 54250 - }, - { - "epoch": 47.02, - "learning_rate": 2.4216783216783214e-07, - "loss": 0.3544, - "step": 54260 - }, - { - "epoch": 47.03, - "learning_rate": 2.414685314685315e-07, - "loss": 0.3364, - "step": 54270 - }, - { - "epoch": 47.04, - "learning_rate": 2.4076923076923076e-07, - "loss": 0.3394, - "step": 54280 - }, - { - "epoch": 47.05, - "learning_rate": 2.4006993006993005e-07, - "loss": 0.3604, - "step": 54290 - }, - { - "epoch": 47.05, - "learning_rate": 2.3937062937062934e-07, - "loss": 0.3669, - "step": 54300 - }, - { - "epoch": 47.06, - "learning_rate": 2.3867132867132867e-07, - "loss": 0.2888, - "step": 54310 - }, - { - "epoch": 47.07, - "learning_rate": 2.3797202797202796e-07, - "loss": 0.3718, - "step": 54320 - }, - { - "epoch": 47.08, - "learning_rate": 2.3727272727272727e-07, - "loss": 0.3313, - "step": 54330 - }, - { - "epoch": 47.09, - "learning_rate": 2.3657342657342656e-07, - "loss": 0.3984, - "step": 54340 - }, - { - "epoch": 47.1, - "learning_rate": 2.3587412587412587e-07, - "loss": 0.3705, - "step": 54350 - }, - { - "epoch": 47.11, - "learning_rate": 2.3517482517482518e-07, - "loss": 0.3335, - "step": 54360 - }, - { - "epoch": 47.11, - "learning_rate": 2.3447552447552446e-07, - "loss": 0.3551, - "step": 54370 - }, - { - "epoch": 47.12, - "learning_rate": 2.3377622377622378e-07, - "loss": 0.3671, - "step": 54380 - }, - { - "epoch": 47.13, - "learning_rate": 2.3307692307692306e-07, - "loss": 0.3905, - "step": 54390 - }, - { - "epoch": 47.14, - "learning_rate": 2.3237762237762237e-07, - "loss": 0.3684, - "step": 54400 - }, - { - "epoch": 47.15, - "learning_rate": 2.3167832167832166e-07, - "loss": 0.3137, - "step": 54410 - }, - { - "epoch": 47.16, - "learning_rate": 2.3097902097902097e-07, - "loss": 0.2697, - "step": 54420 - }, - { - "epoch": 47.17, - "learning_rate": 2.3027972027972025e-07, - "loss": 0.381, - "step": 54430 - }, - { - "epoch": 47.17, - "learning_rate": 2.2958041958041957e-07, - "loss": 0.366, - "step": 54440 - }, - { - "epoch": 47.18, - "learning_rate": 2.2888111888111888e-07, - "loss": 0.3381, - "step": 54450 - }, - { - "epoch": 47.19, - "learning_rate": 2.2818181818181816e-07, - "loss": 0.3675, - "step": 54460 - }, - { - "epoch": 47.2, - "learning_rate": 2.2748251748251747e-07, - "loss": 0.4371, - "step": 54470 - }, - { - "epoch": 47.21, - "learning_rate": 2.2678321678321676e-07, - "loss": 0.3368, - "step": 54480 - }, - { - "epoch": 47.22, - "learning_rate": 2.2608391608391607e-07, - "loss": 0.3477, - "step": 54490 - }, - { - "epoch": 47.23, - "learning_rate": 2.2538461538461536e-07, - "loss": 0.3952, - "step": 54500 - }, - { - "epoch": 47.24, - "learning_rate": 2.2468531468531467e-07, - "loss": 0.382, - "step": 54510 - }, - { - "epoch": 47.24, - "learning_rate": 2.2398601398601395e-07, - "loss": 0.3393, - "step": 54520 - }, - { - "epoch": 47.25, - "learning_rate": 2.232867132867133e-07, - "loss": 0.377, - "step": 54530 - }, - { - "epoch": 47.26, - "learning_rate": 2.2258741258741258e-07, - "loss": 0.3356, - "step": 54540 - }, - { - "epoch": 47.27, - "learning_rate": 2.218881118881119e-07, - "loss": 0.3276, - "step": 54550 - }, - { - "epoch": 47.28, - "learning_rate": 2.211888111888112e-07, - "loss": 0.3384, - "step": 54560 - }, - { - "epoch": 47.29, - "learning_rate": 2.2048951048951049e-07, - "loss": 0.3336, - "step": 54570 - }, - { - "epoch": 47.3, - "learning_rate": 2.197902097902098e-07, - "loss": 0.3849, - "step": 54580 - }, - { - "epoch": 47.3, - "learning_rate": 2.1909090909090908e-07, - "loss": 0.3696, - "step": 54590 - }, - { - "epoch": 47.31, - "learning_rate": 2.183916083916084e-07, - "loss": 0.3393, - "step": 54600 - }, - { - "epoch": 47.32, - "learning_rate": 2.1769230769230768e-07, - "loss": 0.3248, - "step": 54610 - }, - { - "epoch": 47.33, - "learning_rate": 2.16993006993007e-07, - "loss": 0.3582, - "step": 54620 - }, - { - "epoch": 47.34, - "learning_rate": 2.1629370629370628e-07, - "loss": 0.3992, - "step": 54630 - }, - { - "epoch": 47.35, - "learning_rate": 2.155944055944056e-07, - "loss": 0.3919, - "step": 54640 - }, - { - "epoch": 47.36, - "learning_rate": 2.1489510489510487e-07, - "loss": 0.3243, - "step": 54650 - }, - { - "epoch": 47.37, - "learning_rate": 2.1419580419580418e-07, - "loss": 0.3565, - "step": 54660 - }, - { - "epoch": 47.37, - "learning_rate": 2.134965034965035e-07, - "loss": 0.3303, - "step": 54670 - }, - { - "epoch": 47.38, - "learning_rate": 2.1279720279720278e-07, - "loss": 0.379, - "step": 54680 - }, - { - "epoch": 47.39, - "learning_rate": 2.120979020979021e-07, - "loss": 0.3638, - "step": 54690 - }, - { - "epoch": 47.4, - "learning_rate": 2.1139860139860138e-07, - "loss": 0.3546, - "step": 54700 - }, - { - "epoch": 47.41, - "learning_rate": 2.106993006993007e-07, - "loss": 0.3522, - "step": 54710 - }, - { - "epoch": 47.42, - "learning_rate": 2.0999999999999997e-07, - "loss": 0.3087, - "step": 54720 - }, - { - "epoch": 47.43, - "learning_rate": 2.0930069930069929e-07, - "loss": 0.3587, - "step": 54730 - }, - { - "epoch": 47.43, - "learning_rate": 2.0860139860139857e-07, - "loss": 0.3933, - "step": 54740 - }, - { - "epoch": 47.44, - "learning_rate": 2.0790209790209788e-07, - "loss": 0.3762, - "step": 54750 - }, - { - "epoch": 47.45, - "learning_rate": 2.0720279720279717e-07, - "loss": 0.2997, - "step": 54760 - }, - { - "epoch": 47.46, - "learning_rate": 2.065034965034965e-07, - "loss": 0.3557, - "step": 54770 - }, - { - "epoch": 47.47, - "learning_rate": 2.0580419580419582e-07, - "loss": 0.3875, - "step": 54780 - }, - { - "epoch": 47.48, - "learning_rate": 2.051048951048951e-07, - "loss": 0.3961, - "step": 54790 - }, - { - "epoch": 47.49, - "learning_rate": 2.0440559440559441e-07, - "loss": 0.3651, - "step": 54800 - }, - { - "epoch": 47.5, - "learning_rate": 2.037062937062937e-07, - "loss": 0.3966, - "step": 54810 - }, - { - "epoch": 47.5, - "learning_rate": 2.03006993006993e-07, - "loss": 0.3651, - "step": 54820 - }, - { - "epoch": 47.51, - "learning_rate": 2.023076923076923e-07, - "loss": 0.3566, - "step": 54830 - }, - { - "epoch": 47.52, - "learning_rate": 2.016083916083916e-07, - "loss": 0.3443, - "step": 54840 - }, - { - "epoch": 47.53, - "learning_rate": 2.009090909090909e-07, - "loss": 0.3262, - "step": 54850 - }, - { - "epoch": 47.54, - "learning_rate": 2.002097902097902e-07, - "loss": 0.3129, - "step": 54860 - }, - { - "epoch": 47.55, - "learning_rate": 1.995104895104895e-07, - "loss": 0.3609, - "step": 54870 - }, - { - "epoch": 47.56, - "learning_rate": 1.988111888111888e-07, - "loss": 0.2917, - "step": 54880 - }, - { - "epoch": 47.56, - "learning_rate": 1.9811188811188811e-07, - "loss": 0.391, - "step": 54890 - }, - { - "epoch": 47.57, - "learning_rate": 1.974125874125874e-07, - "loss": 0.3483, - "step": 54900 - }, - { - "epoch": 47.58, - "learning_rate": 1.967132867132867e-07, - "loss": 0.3754, - "step": 54910 - }, - { - "epoch": 47.59, - "learning_rate": 1.96013986013986e-07, - "loss": 0.3642, - "step": 54920 - }, - { - "epoch": 47.6, - "learning_rate": 1.953146853146853e-07, - "loss": 0.3519, - "step": 54930 - }, - { - "epoch": 47.61, - "learning_rate": 1.946153846153846e-07, - "loss": 0.4031, - "step": 54940 - }, - { - "epoch": 47.62, - "learning_rate": 1.939160839160839e-07, - "loss": 0.3196, - "step": 54950 - }, - { - "epoch": 47.63, - "learning_rate": 1.932167832167832e-07, - "loss": 0.3574, - "step": 54960 - }, - { - "epoch": 47.63, - "learning_rate": 1.925174825174825e-07, - "loss": 0.342, - "step": 54970 - }, - { - "epoch": 47.64, - "learning_rate": 1.9181818181818179e-07, - "loss": 0.3426, - "step": 54980 - }, - { - "epoch": 47.65, - "learning_rate": 1.911188811188811e-07, - "loss": 0.3166, - "step": 54990 - }, - { - "epoch": 47.66, - "learning_rate": 1.904195804195804e-07, - "loss": 0.3258, - "step": 55000 - }, - { - "epoch": 47.67, - "learning_rate": 1.897202797202797e-07, - "loss": 0.3332, - "step": 55010 - }, - { - "epoch": 47.68, - "learning_rate": 1.8902097902097903e-07, - "loss": 0.3769, - "step": 55020 - }, - { - "epoch": 47.69, - "learning_rate": 1.8832167832167832e-07, - "loss": 0.4165, - "step": 55030 - }, - { - "epoch": 47.69, - "learning_rate": 1.8769230769230767e-07, - "loss": 0.3893, - "step": 55040 - }, - { - "epoch": 47.7, - "learning_rate": 1.8699300699300699e-07, - "loss": 0.3782, - "step": 55050 - }, - { - "epoch": 47.71, - "learning_rate": 1.8629370629370627e-07, - "loss": 0.3125, - "step": 55060 - }, - { - "epoch": 47.72, - "learning_rate": 1.8559440559440558e-07, - "loss": 0.3644, - "step": 55070 - }, - { - "epoch": 47.73, - "learning_rate": 1.8489510489510487e-07, - "loss": 0.339, - "step": 55080 - }, - { - "epoch": 47.74, - "learning_rate": 1.8419580419580418e-07, - "loss": 0.3563, - "step": 55090 - }, - { - "epoch": 47.75, - "learning_rate": 1.834965034965035e-07, - "loss": 0.3465, - "step": 55100 - }, - { - "epoch": 47.76, - "learning_rate": 1.8279720279720278e-07, - "loss": 0.3255, - "step": 55110 - }, - { - "epoch": 47.76, - "learning_rate": 1.820979020979021e-07, - "loss": 0.3639, - "step": 55120 - }, - { - "epoch": 47.77, - "learning_rate": 1.8139860139860137e-07, - "loss": 0.3893, - "step": 55130 - }, - { - "epoch": 47.78, - "learning_rate": 1.806993006993007e-07, - "loss": 0.3311, - "step": 55140 - }, - { - "epoch": 47.79, - "learning_rate": 1.8e-07, - "loss": 0.3554, - "step": 55150 - }, - { - "epoch": 47.8, - "learning_rate": 1.793006993006993e-07, - "loss": 0.3587, - "step": 55160 - }, - { - "epoch": 47.81, - "learning_rate": 1.786013986013986e-07, - "loss": 0.301, - "step": 55170 - }, - { - "epoch": 47.82, - "learning_rate": 1.779020979020979e-07, - "loss": 0.3313, - "step": 55180 - }, - { - "epoch": 47.82, - "learning_rate": 1.772027972027972e-07, - "loss": 0.3896, - "step": 55190 - }, - { - "epoch": 47.83, - "learning_rate": 1.765034965034965e-07, - "loss": 0.3046, - "step": 55200 - }, - { - "epoch": 47.84, - "learning_rate": 1.7580419580419581e-07, - "loss": 0.3305, - "step": 55210 - }, - { - "epoch": 47.85, - "learning_rate": 1.751048951048951e-07, - "loss": 0.3427, - "step": 55220 - }, - { - "epoch": 47.86, - "learning_rate": 1.744055944055944e-07, - "loss": 0.3899, - "step": 55230 - }, - { - "epoch": 47.87, - "learning_rate": 1.737062937062937e-07, - "loss": 0.3873, - "step": 55240 - }, - { - "epoch": 47.88, - "learning_rate": 1.73006993006993e-07, - "loss": 0.3425, - "step": 55250 - }, - { - "epoch": 47.89, - "learning_rate": 1.723076923076923e-07, - "loss": 0.3016, - "step": 55260 - }, - { - "epoch": 47.89, - "learning_rate": 1.716083916083916e-07, - "loss": 0.3186, - "step": 55270 - }, - { - "epoch": 47.9, - "learning_rate": 1.709090909090909e-07, - "loss": 0.3615, - "step": 55280 - }, - { - "epoch": 47.91, - "learning_rate": 1.702097902097902e-07, - "loss": 0.3495, - "step": 55290 - }, - { - "epoch": 47.92, - "learning_rate": 1.6951048951048949e-07, - "loss": 0.317, - "step": 55300 - }, - { - "epoch": 47.93, - "learning_rate": 1.688111888111888e-07, - "loss": 0.4341, - "step": 55310 - }, - { - "epoch": 47.94, - "learning_rate": 1.681118881118881e-07, - "loss": 0.3467, - "step": 55320 - }, - { - "epoch": 47.95, - "learning_rate": 1.674125874125874e-07, - "loss": 0.3802, - "step": 55330 - }, - { - "epoch": 47.95, - "learning_rate": 1.667132867132867e-07, - "loss": 0.3541, - "step": 55340 - }, - { - "epoch": 47.96, - "learning_rate": 1.66013986013986e-07, - "loss": 0.3015, - "step": 55350 - }, - { - "epoch": 47.97, - "learning_rate": 1.653146853146853e-07, - "loss": 0.3601, - "step": 55360 - }, - { - "epoch": 47.98, - "learning_rate": 1.646153846153846e-07, - "loss": 0.3906, - "step": 55370 - }, - { - "epoch": 47.99, - "learning_rate": 1.6391608391608393e-07, - "loss": 0.3486, - "step": 55380 - }, - { - "epoch": 48.0, - "learning_rate": 1.632167832167832e-07, - "loss": 0.3158, - "step": 55390 - }, - { - "epoch": 48.0, - "eval_loss": 0.560836672782898, - "eval_runtime": 134.7766, - "eval_samples_per_second": 3.947, - "eval_steps_per_second": 1.974, - "eval_wer": 0.24284887831844185, - "step": 55392 - }, - { - "epoch": 48.01, - "learning_rate": 1.6251748251748252e-07, - "loss": 0.3843, - "step": 55400 - }, - { - "epoch": 48.02, - "learning_rate": 1.618181818181818e-07, - "loss": 0.4182, - "step": 55410 - }, - { - "epoch": 48.02, - "learning_rate": 1.6111888111888112e-07, - "loss": 0.2969, - "step": 55420 - }, - { - "epoch": 48.03, - "learning_rate": 1.6041958041958043e-07, - "loss": 0.3782, - "step": 55430 - }, - { - "epoch": 48.04, - "learning_rate": 1.5972027972027972e-07, - "loss": 0.3769, - "step": 55440 - }, - { - "epoch": 48.05, - "learning_rate": 1.5902097902097903e-07, - "loss": 0.3307, - "step": 55450 - }, - { - "epoch": 48.06, - "learning_rate": 1.5832167832167831e-07, - "loss": 0.3369, - "step": 55460 - }, - { - "epoch": 48.07, - "learning_rate": 1.5762237762237763e-07, - "loss": 0.3782, - "step": 55470 - }, - { - "epoch": 48.08, - "learning_rate": 1.569230769230769e-07, - "loss": 0.389, - "step": 55480 - }, - { - "epoch": 48.08, - "learning_rate": 1.5622377622377622e-07, - "loss": 0.3859, - "step": 55490 - }, - { - "epoch": 48.09, - "learning_rate": 1.555244755244755e-07, - "loss": 0.3444, - "step": 55500 - }, - { - "epoch": 48.1, - "learning_rate": 1.5482517482517482e-07, - "loss": 0.3688, - "step": 55510 - }, - { - "epoch": 48.11, - "learning_rate": 1.541258741258741e-07, - "loss": 0.3124, - "step": 55520 - }, - { - "epoch": 48.12, - "learning_rate": 1.5342657342657342e-07, - "loss": 0.303, - "step": 55530 - }, - { - "epoch": 48.13, - "learning_rate": 1.5272727272727273e-07, - "loss": 0.3582, - "step": 55540 - }, - { - "epoch": 48.14, - "learning_rate": 1.5202797202797201e-07, - "loss": 0.351, - "step": 55550 - }, - { - "epoch": 48.15, - "learning_rate": 1.5132867132867132e-07, - "loss": 0.41, - "step": 55560 - }, - { - "epoch": 48.15, - "learning_rate": 1.506293706293706e-07, - "loss": 0.3245, - "step": 55570 - }, - { - "epoch": 48.16, - "learning_rate": 1.4993006993006992e-07, - "loss": 0.3326, - "step": 55580 - }, - { - "epoch": 48.17, - "learning_rate": 1.492307692307692e-07, - "loss": 0.3845, - "step": 55590 - }, - { - "epoch": 48.18, - "learning_rate": 1.4853146853146852e-07, - "loss": 0.3734, - "step": 55600 - }, - { - "epoch": 48.19, - "learning_rate": 1.478321678321678e-07, - "loss": 0.3646, - "step": 55610 - }, - { - "epoch": 48.2, - "learning_rate": 1.4713286713286712e-07, - "loss": 0.3872, - "step": 55620 - }, - { - "epoch": 48.21, - "learning_rate": 1.464335664335664e-07, - "loss": 0.4069, - "step": 55630 - }, - { - "epoch": 48.21, - "learning_rate": 1.4573426573426574e-07, - "loss": 0.4001, - "step": 55640 - }, - { - "epoch": 48.22, - "learning_rate": 1.4503496503496505e-07, - "loss": 0.3788, - "step": 55650 - }, - { - "epoch": 48.23, - "learning_rate": 1.4433566433566434e-07, - "loss": 0.3732, - "step": 55660 - }, - { - "epoch": 48.24, - "learning_rate": 1.4363636363636365e-07, - "loss": 0.3641, - "step": 55670 - }, - { - "epoch": 48.25, - "learning_rate": 1.4293706293706293e-07, - "loss": 0.3531, - "step": 55680 - }, - { - "epoch": 48.26, - "learning_rate": 1.4223776223776224e-07, - "loss": 0.3396, - "step": 55690 - }, - { - "epoch": 48.27, - "learning_rate": 1.4153846153846153e-07, - "loss": 0.379, - "step": 55700 - }, - { - "epoch": 48.28, - "learning_rate": 1.4083916083916084e-07, - "loss": 0.3456, - "step": 55710 - }, - { - "epoch": 48.28, - "learning_rate": 1.4013986013986013e-07, - "loss": 0.2917, - "step": 55720 - }, - { - "epoch": 48.29, - "learning_rate": 1.3944055944055944e-07, - "loss": 0.3777, - "step": 55730 - }, - { - "epoch": 48.3, - "learning_rate": 1.3874125874125875e-07, - "loss": 0.3455, - "step": 55740 - }, - { - "epoch": 48.31, - "learning_rate": 1.3804195804195803e-07, - "loss": 0.3494, - "step": 55750 - }, - { - "epoch": 48.32, - "learning_rate": 1.3734265734265735e-07, - "loss": 0.3303, - "step": 55760 - }, - { - "epoch": 48.33, - "learning_rate": 1.3664335664335663e-07, - "loss": 0.3415, - "step": 55770 - }, - { - "epoch": 48.34, - "learning_rate": 1.3594405594405594e-07, - "loss": 0.3074, - "step": 55780 - }, - { - "epoch": 48.34, - "learning_rate": 1.3524475524475523e-07, - "loss": 0.4096, - "step": 55790 - }, - { - "epoch": 48.35, - "learning_rate": 1.3454545454545454e-07, - "loss": 0.3875, - "step": 55800 - }, - { - "epoch": 48.36, - "learning_rate": 1.3384615384615383e-07, - "loss": 0.344, - "step": 55810 - }, - { - "epoch": 48.37, - "learning_rate": 1.3314685314685314e-07, - "loss": 0.2696, - "step": 55820 - }, - { - "epoch": 48.38, - "learning_rate": 1.3244755244755242e-07, - "loss": 0.339, - "step": 55830 - }, - { - "epoch": 48.39, - "learning_rate": 1.3174825174825173e-07, - "loss": 0.354, - "step": 55840 - }, - { - "epoch": 48.4, - "learning_rate": 1.3104895104895105e-07, - "loss": 0.3863, - "step": 55850 - }, - { - "epoch": 48.41, - "learning_rate": 1.3034965034965033e-07, - "loss": 0.3484, - "step": 55860 - }, - { - "epoch": 48.41, - "learning_rate": 1.2965034965034964e-07, - "loss": 0.4278, - "step": 55870 - }, - { - "epoch": 48.42, - "learning_rate": 1.2895104895104895e-07, - "loss": 0.3246, - "step": 55880 - }, - { - "epoch": 48.43, - "learning_rate": 1.2825174825174827e-07, - "loss": 0.3766, - "step": 55890 - }, - { - "epoch": 48.44, - "learning_rate": 1.2755244755244755e-07, - "loss": 0.3238, - "step": 55900 - }, - { - "epoch": 48.45, - "learning_rate": 1.2685314685314686e-07, - "loss": 0.4097, - "step": 55910 - }, - { - "epoch": 48.46, - "learning_rate": 1.2615384615384615e-07, - "loss": 0.3207, - "step": 55920 - }, - { - "epoch": 48.47, - "learning_rate": 1.2545454545454546e-07, - "loss": 0.3636, - "step": 55930 - }, - { - "epoch": 48.47, - "learning_rate": 1.2475524475524474e-07, - "loss": 0.359, - "step": 55940 - }, - { - "epoch": 48.48, - "learning_rate": 1.2405594405594406e-07, - "loss": 0.3375, - "step": 55950 - }, - { - "epoch": 48.49, - "learning_rate": 1.2335664335664334e-07, - "loss": 0.3635, - "step": 55960 - }, - { - "epoch": 48.5, - "learning_rate": 1.2265734265734265e-07, - "loss": 0.2793, - "step": 55970 - }, - { - "epoch": 48.51, - "learning_rate": 1.2195804195804194e-07, - "loss": 0.41, - "step": 55980 - }, - { - "epoch": 48.52, - "learning_rate": 1.2125874125874125e-07, - "loss": 0.39, - "step": 55990 - }, - { - "epoch": 48.53, - "learning_rate": 1.2055944055944053e-07, - "loss": 0.3814, - "step": 56000 - }, - { - "epoch": 48.54, - "learning_rate": 1.1986013986013987e-07, - "loss": 0.3057, - "step": 56010 - }, - { - "epoch": 48.54, - "learning_rate": 1.1916083916083916e-07, - "loss": 0.3332, - "step": 56020 - }, - { - "epoch": 48.55, - "learning_rate": 1.1846153846153846e-07, - "loss": 0.3852, - "step": 56030 - }, - { - "epoch": 48.56, - "learning_rate": 1.1776223776223775e-07, - "loss": 0.4011, - "step": 56040 - }, - { - "epoch": 48.57, - "learning_rate": 1.1706293706293705e-07, - "loss": 0.3123, - "step": 56050 - }, - { - "epoch": 48.58, - "learning_rate": 1.1636363636363636e-07, - "loss": 0.3529, - "step": 56060 - }, - { - "epoch": 48.59, - "learning_rate": 1.1566433566433566e-07, - "loss": 0.3336, - "step": 56070 - }, - { - "epoch": 48.6, - "learning_rate": 1.1496503496503496e-07, - "loss": 0.3159, - "step": 56080 - }, - { - "epoch": 48.6, - "learning_rate": 1.1426573426573426e-07, - "loss": 0.3929, - "step": 56090 - }, - { - "epoch": 48.61, - "learning_rate": 1.1356643356643356e-07, - "loss": 0.3498, - "step": 56100 - }, - { - "epoch": 48.62, - "learning_rate": 1.1286713286713286e-07, - "loss": 0.3591, - "step": 56110 - }, - { - "epoch": 48.63, - "learning_rate": 1.1216783216783217e-07, - "loss": 0.3466, - "step": 56120 - }, - { - "epoch": 48.64, - "learning_rate": 1.1146853146853147e-07, - "loss": 0.3921, - "step": 56130 - }, - { - "epoch": 48.65, - "learning_rate": 1.1076923076923077e-07, - "loss": 0.42, - "step": 56140 - }, - { - "epoch": 48.66, - "learning_rate": 1.1006993006993006e-07, - "loss": 0.3855, - "step": 56150 - }, - { - "epoch": 48.67, - "learning_rate": 1.0937062937062936e-07, - "loss": 0.3384, - "step": 56160 - }, - { - "epoch": 48.67, - "learning_rate": 1.0867132867132866e-07, - "loss": 0.3103, - "step": 56170 - }, - { - "epoch": 48.68, - "learning_rate": 1.0797202797202796e-07, - "loss": 0.3521, - "step": 56180 - }, - { - "epoch": 48.69, - "learning_rate": 1.0727272727272727e-07, - "loss": 0.3497, - "step": 56190 - }, - { - "epoch": 48.7, - "learning_rate": 1.0657342657342657e-07, - "loss": 0.371, - "step": 56200 - }, - { - "epoch": 48.71, - "learning_rate": 1.0587412587412587e-07, - "loss": 0.324, - "step": 56210 - }, - { - "epoch": 48.72, - "learning_rate": 1.0517482517482518e-07, - "loss": 0.3263, - "step": 56220 - }, - { - "epoch": 48.73, - "learning_rate": 1.0447552447552448e-07, - "loss": 0.3513, - "step": 56230 - }, - { - "epoch": 48.73, - "learning_rate": 1.0377622377622378e-07, - "loss": 0.3406, - "step": 56240 - }, - { - "epoch": 48.74, - "learning_rate": 1.0307692307692307e-07, - "loss": 0.3813, - "step": 56250 - }, - { - "epoch": 48.75, - "learning_rate": 1.0237762237762237e-07, - "loss": 0.391, - "step": 56260 - }, - { - "epoch": 48.76, - "learning_rate": 1.0167832167832167e-07, - "loss": 0.3442, - "step": 56270 - }, - { - "epoch": 48.77, - "learning_rate": 1.0097902097902097e-07, - "loss": 0.375, - "step": 56280 - }, - { - "epoch": 48.78, - "learning_rate": 1.0027972027972027e-07, - "loss": 0.3793, - "step": 56290 - }, - { - "epoch": 48.79, - "learning_rate": 9.958041958041957e-08, - "loss": 0.31, - "step": 56300 - }, - { - "epoch": 48.8, - "learning_rate": 9.888111888111888e-08, - "loss": 0.3603, - "step": 56310 - }, - { - "epoch": 48.8, - "learning_rate": 9.818181818181818e-08, - "loss": 0.3785, - "step": 56320 - }, - { - "epoch": 48.81, - "learning_rate": 9.748251748251749e-08, - "loss": 0.3666, - "step": 56330 - }, - { - "epoch": 48.82, - "learning_rate": 9.678321678321679e-08, - "loss": 0.3912, - "step": 56340 - }, - { - "epoch": 48.83, - "learning_rate": 9.608391608391609e-08, - "loss": 0.3119, - "step": 56350 - }, - { - "epoch": 48.84, - "learning_rate": 9.538461538461538e-08, - "loss": 0.3483, - "step": 56360 - }, - { - "epoch": 48.85, - "learning_rate": 9.468531468531468e-08, - "loss": 0.3031, - "step": 56370 - }, - { - "epoch": 48.86, - "learning_rate": 9.398601398601398e-08, - "loss": 0.3225, - "step": 56380 - }, - { - "epoch": 48.86, - "learning_rate": 9.328671328671328e-08, - "loss": 0.3636, - "step": 56390 - }, - { - "epoch": 48.87, - "learning_rate": 9.258741258741258e-08, - "loss": 0.2924, - "step": 56400 - }, - { - "epoch": 48.88, - "learning_rate": 9.188811188811188e-08, - "loss": 0.333, - "step": 56410 - }, - { - "epoch": 48.89, - "learning_rate": 9.118881118881117e-08, - "loss": 0.3425, - "step": 56420 - }, - { - "epoch": 48.9, - "learning_rate": 9.048951048951047e-08, - "loss": 0.3841, - "step": 56430 - }, - { - "epoch": 48.91, - "learning_rate": 8.97902097902098e-08, - "loss": 0.3724, - "step": 56440 - }, - { - "epoch": 48.92, - "learning_rate": 8.90909090909091e-08, - "loss": 0.3315, - "step": 56450 - }, - { - "epoch": 48.93, - "learning_rate": 8.83916083916084e-08, - "loss": 0.3965, - "step": 56460 - }, - { - "epoch": 48.93, - "learning_rate": 8.769230769230769e-08, - "loss": 0.3083, - "step": 56470 - }, - { - "epoch": 48.94, - "learning_rate": 8.699300699300699e-08, - "loss": 0.3607, - "step": 56480 - }, - { - "epoch": 48.95, - "learning_rate": 8.629370629370629e-08, - "loss": 0.3723, - "step": 56490 - }, - { - "epoch": 48.96, - "learning_rate": 8.559440559440559e-08, - "loss": 0.388, - "step": 56500 - }, - { - "epoch": 48.97, - "learning_rate": 8.489510489510489e-08, - "loss": 0.3396, - "step": 56510 - }, - { - "epoch": 48.98, - "learning_rate": 8.419580419580418e-08, - "loss": 0.2864, - "step": 56520 - }, - { - "epoch": 48.99, - "learning_rate": 8.349650349650348e-08, - "loss": 0.3396, - "step": 56530 - }, - { - "epoch": 48.99, - "learning_rate": 8.27972027972028e-08, - "loss": 0.3577, - "step": 56540 - }, - { - "epoch": 49.0, - "eval_loss": 0.5593469738960266, - "eval_runtime": 135.5272, - "eval_samples_per_second": 3.925, - "eval_steps_per_second": 1.963, - "eval_wer": 0.24117760493668444, - "step": 56546 - }, - { - "epoch": 49.0, - "learning_rate": 8.209790209790209e-08, - "loss": 0.3164, - "step": 56550 - }, - { - "epoch": 49.01, - "learning_rate": 8.13986013986014e-08, - "loss": 0.3259, - "step": 56560 - }, - { - "epoch": 49.02, - "learning_rate": 8.06993006993007e-08, - "loss": 0.3391, - "step": 56570 - }, - { - "epoch": 49.03, - "learning_rate": 8e-08, - "loss": 0.3855, - "step": 56580 - }, - { - "epoch": 49.04, - "learning_rate": 7.93006993006993e-08, - "loss": 0.3719, - "step": 56590 - }, - { - "epoch": 49.05, - "learning_rate": 7.86013986013986e-08, - "loss": 0.3446, - "step": 56600 - }, - { - "epoch": 49.06, - "learning_rate": 7.79020979020979e-08, - "loss": 0.291, - "step": 56610 - }, - { - "epoch": 49.06, - "learning_rate": 7.72027972027972e-08, - "loss": 0.3151, - "step": 56620 - }, - { - "epoch": 49.07, - "learning_rate": 7.65034965034965e-08, - "loss": 0.3284, - "step": 56630 - }, - { - "epoch": 49.08, - "learning_rate": 7.580419580419579e-08, - "loss": 0.386, - "step": 56640 - }, - { - "epoch": 49.09, - "learning_rate": 7.51048951048951e-08, - "loss": 0.3983, - "step": 56650 - }, - { - "epoch": 49.1, - "learning_rate": 7.44055944055944e-08, - "loss": 0.4279, - "step": 56660 - }, - { - "epoch": 49.11, - "learning_rate": 7.37062937062937e-08, - "loss": 0.3545, - "step": 56670 - }, - { - "epoch": 49.12, - "learning_rate": 7.300699300699301e-08, - "loss": 0.3488, - "step": 56680 - }, - { - "epoch": 49.12, - "learning_rate": 7.230769230769231e-08, - "loss": 0.336, - "step": 56690 - }, - { - "epoch": 49.13, - "learning_rate": 7.160839160839161e-08, - "loss": 0.2867, - "step": 56700 - }, - { - "epoch": 49.14, - "learning_rate": 7.090909090909091e-08, - "loss": 0.3295, - "step": 56710 - }, - { - "epoch": 49.15, - "learning_rate": 7.02097902097902e-08, - "loss": 0.3409, - "step": 56720 - }, - { - "epoch": 49.16, - "learning_rate": 6.95104895104895e-08, - "loss": 0.3139, - "step": 56730 - }, - { - "epoch": 49.17, - "learning_rate": 6.88111888111888e-08, - "loss": 0.3372, - "step": 56740 - }, - { - "epoch": 49.18, - "learning_rate": 6.81118881118881e-08, - "loss": 0.3601, - "step": 56750 - }, - { - "epoch": 49.19, - "learning_rate": 6.741258741258741e-08, - "loss": 0.4306, - "step": 56760 - }, - { - "epoch": 49.19, - "learning_rate": 6.671328671328671e-08, - "loss": 0.3192, - "step": 56770 - }, - { - "epoch": 49.2, - "learning_rate": 6.601398601398601e-08, - "loss": 0.4052, - "step": 56780 - }, - { - "epoch": 49.21, - "learning_rate": 6.531468531468531e-08, - "loss": 0.3666, - "step": 56790 - }, - { - "epoch": 49.22, - "learning_rate": 6.461538461538462e-08, - "loss": 0.3323, - "step": 56800 - }, - { - "epoch": 49.23, - "learning_rate": 6.391608391608392e-08, - "loss": 0.3665, - "step": 56810 - }, - { - "epoch": 49.24, - "learning_rate": 6.321678321678322e-08, - "loss": 0.3556, - "step": 56820 - }, - { - "epoch": 49.25, - "learning_rate": 6.251748251748252e-08, - "loss": 0.3442, - "step": 56830 - }, - { - "epoch": 49.25, - "learning_rate": 6.181818181818181e-08, - "loss": 0.3433, - "step": 56840 - }, - { - "epoch": 49.26, - "learning_rate": 6.111888111888111e-08, - "loss": 0.2919, - "step": 56850 - }, - { - "epoch": 49.27, - "learning_rate": 6.041958041958041e-08, - "loss": 0.3386, - "step": 56860 - }, - { - "epoch": 49.28, - "learning_rate": 5.972027972027972e-08, - "loss": 0.3452, - "step": 56870 - }, - { - "epoch": 49.29, - "learning_rate": 5.9020979020979014e-08, - "loss": 0.3379, - "step": 56880 - }, - { - "epoch": 49.3, - "learning_rate": 5.832167832167832e-08, - "loss": 0.3258, - "step": 56890 - }, - { - "epoch": 49.31, - "learning_rate": 5.7622377622377624e-08, - "loss": 0.4041, - "step": 56900 - }, - { - "epoch": 49.32, - "learning_rate": 5.692307692307692e-08, - "loss": 0.3279, - "step": 56910 - }, - { - "epoch": 49.32, - "learning_rate": 5.622377622377622e-08, - "loss": 0.3576, - "step": 56920 - }, - { - "epoch": 49.33, - "learning_rate": 5.552447552447552e-08, - "loss": 0.31, - "step": 56930 - }, - { - "epoch": 49.34, - "learning_rate": 5.4825174825174824e-08, - "loss": 0.3643, - "step": 56940 - }, - { - "epoch": 49.35, - "learning_rate": 5.412587412587412e-08, - "loss": 0.368, - "step": 56950 - }, - { - "epoch": 49.36, - "learning_rate": 5.342657342657343e-08, - "loss": 0.3732, - "step": 56960 - }, - { - "epoch": 49.37, - "learning_rate": 5.2727272727272726e-08, - "loss": 0.3594, - "step": 56970 - }, - { - "epoch": 49.38, - "learning_rate": 5.2027972027972024e-08, - "loss": 0.3388, - "step": 56980 - }, - { - "epoch": 49.38, - "learning_rate": 5.132867132867132e-08, - "loss": 0.4067, - "step": 56990 - }, - { - "epoch": 49.39, - "learning_rate": 5.062937062937063e-08, - "loss": 0.3645, - "step": 57000 - }, - { - "epoch": 49.4, - "learning_rate": 4.9930069930069926e-08, - "loss": 0.387, - "step": 57010 - }, - { - "epoch": 49.41, - "learning_rate": 4.923076923076923e-08, - "loss": 0.347, - "step": 57020 - }, - { - "epoch": 49.42, - "learning_rate": 4.853146853146853e-08, - "loss": 0.3459, - "step": 57030 - }, - { - "epoch": 49.43, - "learning_rate": 4.783216783216783e-08, - "loss": 0.3654, - "step": 57040 - }, - { - "epoch": 49.44, - "learning_rate": 4.713286713286713e-08, - "loss": 0.3412, - "step": 57050 - }, - { - "epoch": 49.45, - "learning_rate": 4.643356643356643e-08, - "loss": 0.3725, - "step": 57060 - }, - { - "epoch": 49.45, - "learning_rate": 4.573426573426573e-08, - "loss": 0.2922, - "step": 57070 - }, - { - "epoch": 49.46, - "learning_rate": 4.5034965034965035e-08, - "loss": 0.3583, - "step": 57080 - }, - { - "epoch": 49.47, - "learning_rate": 4.4335664335664333e-08, - "loss": 0.3585, - "step": 57090 - }, - { - "epoch": 49.48, - "learning_rate": 4.363636363636364e-08, - "loss": 0.3408, - "step": 57100 - }, - { - "epoch": 49.49, - "learning_rate": 4.293706293706294e-08, - "loss": 0.3853, - "step": 57110 - }, - { - "epoch": 49.5, - "learning_rate": 4.2237762237762235e-08, - "loss": 0.323, - "step": 57120 - }, - { - "epoch": 49.51, - "learning_rate": 4.1538461538461534e-08, - "loss": 0.3322, - "step": 57130 - }, - { - "epoch": 49.51, - "learning_rate": 4.083916083916084e-08, - "loss": 0.3715, - "step": 57140 - }, - { - "epoch": 49.52, - "learning_rate": 4.013986013986014e-08, - "loss": 0.3399, - "step": 57150 - }, - { - "epoch": 49.53, - "learning_rate": 3.944055944055944e-08, - "loss": 0.3108, - "step": 57160 - }, - { - "epoch": 49.54, - "learning_rate": 3.874125874125874e-08, - "loss": 0.3839, - "step": 57170 - }, - { - "epoch": 49.55, - "learning_rate": 3.804195804195804e-08, - "loss": 0.3441, - "step": 57180 - }, - { - "epoch": 49.56, - "learning_rate": 3.734265734265734e-08, - "loss": 0.3805, - "step": 57190 - }, - { - "epoch": 49.57, - "learning_rate": 3.6643356643356636e-08, - "loss": 0.357, - "step": 57200 - }, - { - "epoch": 49.58, - "learning_rate": 3.594405594405595e-08, - "loss": 0.3623, - "step": 57210 - }, - { - "epoch": 49.58, - "learning_rate": 3.5244755244755246e-08, - "loss": 0.3106, - "step": 57220 - }, - { - "epoch": 49.59, - "learning_rate": 3.4545454545454544e-08, - "loss": 0.3441, - "step": 57230 - }, - { - "epoch": 49.6, - "learning_rate": 3.384615384615384e-08, - "loss": 0.3801, - "step": 57240 - }, - { - "epoch": 49.61, - "learning_rate": 3.314685314685314e-08, - "loss": 0.4127, - "step": 57250 - }, - { - "epoch": 49.62, - "learning_rate": 3.2447552447552446e-08, - "loss": 0.3755, - "step": 57260 - }, - { - "epoch": 49.63, - "learning_rate": 3.174825174825175e-08, - "loss": 0.3613, - "step": 57270 - }, - { - "epoch": 49.64, - "learning_rate": 3.104895104895105e-08, - "loss": 0.3935, - "step": 57280 - }, - { - "epoch": 49.64, - "learning_rate": 3.034965034965035e-08, - "loss": 0.398, - "step": 57290 - }, - { - "epoch": 49.65, - "learning_rate": 2.965034965034965e-08, - "loss": 0.3381, - "step": 57300 - }, - { - "epoch": 49.66, - "learning_rate": 2.895104895104895e-08, - "loss": 0.3744, - "step": 57310 - }, - { - "epoch": 49.67, - "learning_rate": 2.825174825174825e-08, - "loss": 0.354, - "step": 57320 - }, - { - "epoch": 49.68, - "learning_rate": 2.7552447552447552e-08, - "loss": 0.3696, - "step": 57330 - }, - { - "epoch": 49.69, - "learning_rate": 2.6853146853146853e-08, - "loss": 0.351, - "step": 57340 - }, - { - "epoch": 49.7, - "learning_rate": 2.6153846153846152e-08, - "loss": 0.3758, - "step": 57350 - }, - { - "epoch": 49.71, - "learning_rate": 2.5454545454545454e-08, - "loss": 0.3705, - "step": 57360 - }, - { - "epoch": 49.71, - "learning_rate": 2.4755244755244755e-08, - "loss": 0.3173, - "step": 57370 - }, - { - "epoch": 49.72, - "learning_rate": 2.4055944055944057e-08, - "loss": 0.3319, - "step": 57380 - }, - { - "epoch": 49.73, - "learning_rate": 2.3356643356643355e-08, - "loss": 0.3558, - "step": 57390 - }, - { - "epoch": 49.74, - "learning_rate": 2.2657342657342654e-08, - "loss": 0.3602, - "step": 57400 - }, - { - "epoch": 49.75, - "learning_rate": 2.195804195804196e-08, - "loss": 0.3973, - "step": 57410 - }, - { - "epoch": 49.76, - "learning_rate": 2.1258741258741257e-08, - "loss": 0.3605, - "step": 57420 - }, - { - "epoch": 49.77, - "learning_rate": 2.0559440559440556e-08, - "loss": 0.3571, - "step": 57430 - }, - { - "epoch": 49.77, - "learning_rate": 1.986013986013986e-08, - "loss": 0.3679, - "step": 57440 - }, - { - "epoch": 49.78, - "learning_rate": 1.916083916083916e-08, - "loss": 0.3385, - "step": 57450 - }, - { - "epoch": 49.79, - "learning_rate": 1.846153846153846e-08, - "loss": 0.3208, - "step": 57460 - }, - { - "epoch": 49.8, - "learning_rate": 1.7762237762237763e-08, - "loss": 0.3961, - "step": 57470 - }, - { - "epoch": 49.81, - "learning_rate": 1.706293706293706e-08, - "loss": 0.4047, - "step": 57480 - }, - { - "epoch": 49.82, - "learning_rate": 1.6363636363636363e-08, - "loss": 0.417, - "step": 57490 - }, - { - "epoch": 49.83, - "learning_rate": 1.5664335664335665e-08, - "loss": 0.3229, - "step": 57500 - }, - { - "epoch": 49.83, - "learning_rate": 1.4965034965034966e-08, - "loss": 0.3654, - "step": 57510 - }, - { - "epoch": 49.84, - "learning_rate": 1.4265734265734266e-08, - "loss": 0.3457, - "step": 57520 - }, - { - "epoch": 49.85, - "learning_rate": 1.3566433566433565e-08, - "loss": 0.2899, - "step": 57530 - }, - { - "epoch": 49.86, - "learning_rate": 1.2867132867132866e-08, - "loss": 0.3838, - "step": 57540 - }, - { - "epoch": 49.87, - "learning_rate": 1.2167832167832168e-08, - "loss": 0.3387, - "step": 57550 - }, - { - "epoch": 49.88, - "learning_rate": 1.1468531468531468e-08, - "loss": 0.3008, - "step": 57560 - }, - { - "epoch": 49.89, - "learning_rate": 1.0769230769230768e-08, - "loss": 0.3183, - "step": 57570 - }, - { - "epoch": 49.9, - "learning_rate": 1.006993006993007e-08, - "loss": 0.3564, - "step": 57580 - }, - { - "epoch": 49.9, - "learning_rate": 9.37062937062937e-09, - "loss": 0.394, - "step": 57590 - }, - { - "epoch": 49.91, - "learning_rate": 8.671328671328672e-09, - "loss": 0.3434, - "step": 57600 - }, - { - "epoch": 49.92, - "learning_rate": 7.972027972027972e-09, - "loss": 0.3544, - "step": 57610 - }, - { - "epoch": 49.93, - "learning_rate": 7.272727272727273e-09, - "loss": 0.3326, - "step": 57620 - }, - { - "epoch": 49.94, - "learning_rate": 6.573426573426574e-09, - "loss": 0.3242, - "step": 57630 - }, - { - "epoch": 49.95, - "learning_rate": 5.874125874125874e-09, - "loss": 0.3569, - "step": 57640 - }, - { - "epoch": 49.96, - "learning_rate": 5.174825174825175e-09, - "loss": 0.3385, - "step": 57650 - }, - { - "epoch": 49.96, - "learning_rate": 4.4755244755244756e-09, - "loss": 0.3149, - "step": 57660 - }, - { - "epoch": 49.97, - "learning_rate": 3.776223776223776e-09, - "loss": 0.3932, - "step": 57670 - }, - { - "epoch": 49.98, - "learning_rate": 3.076923076923077e-09, - "loss": 0.3831, - "step": 57680 - }, - { - "epoch": 49.99, - "learning_rate": 2.3776223776223774e-09, - "loss": 0.3698, - "step": 57690 - }, - { - "epoch": 50.0, - "learning_rate": 1.6783216783216783e-09, - "loss": 0.3456, - "step": 57700 - }, { "epoch": 50.0, - "eval_loss": 0.5582728385925293, - "eval_runtime": 137.2226, - "eval_samples_per_second": 3.877, - "eval_steps_per_second": 1.938, - "eval_wer": 0.24034196824580575, - "step": 57700 + "eval_loss": 0.5403211116790771, + "eval_runtime": 128.4757, + "eval_samples_per_second": 4.141, + "eval_steps_per_second": 0.521, + "eval_wer": 0.24606286559105225, + "step": 3600 }, { "epoch": 50.0, - "step": 57700, - "total_flos": 1.359460060199037e+20, - "train_loss": 0.38523074480235264, - "train_runtime": 114469.7461, - "train_samples_per_second": 2.017, - "train_steps_per_second": 0.504 + "step": 3600, + "total_flos": 1.3601359172236221e+20, + "train_loss": 0.3682790127065447, + "train_runtime": 95293.0206, + "train_samples_per_second": 2.423, + "train_steps_per_second": 0.038 } ], - "max_steps": 57700, + "max_steps": 3600, "num_train_epochs": 50, - "total_flos": 1.359460060199037e+20, + "total_flos": 1.3601359172236221e+20, "trial_name": null, "trial_params": null }