{ "best_metric": 0.5390881299972534, "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v1/checkpoint-26542", "epoch": 49.999566912083154, "global_step": 57700, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 7.2e-08, "loss": 0.4498, "step": 10 }, { "epoch": 0.02, "learning_rate": 1.5199999999999998e-07, "loss": 0.389, "step": 20 }, { "epoch": 0.03, "learning_rate": 2.24e-07, "loss": 0.4604, "step": 30 }, { "epoch": 0.03, "learning_rate": 3.0399999999999997e-07, "loss": 0.369, "step": 40 }, { "epoch": 0.04, "learning_rate": 3.84e-07, "loss": 0.4513, "step": 50 }, { "epoch": 0.05, "learning_rate": 4.64e-07, "loss": 0.4209, "step": 60 }, { "epoch": 0.06, "learning_rate": 5.44e-07, "loss": 0.4298, "step": 70 }, { "epoch": 0.07, "learning_rate": 6.24e-07, "loss": 0.4385, "step": 80 }, { "epoch": 0.08, "learning_rate": 7.04e-07, "loss": 0.4532, "step": 90 }, { "epoch": 0.09, "learning_rate": 7.84e-07, "loss": 0.4732, "step": 100 }, { "epoch": 0.1, "learning_rate": 8.639999999999999e-07, "loss": 0.4583, "step": 110 }, { "epoch": 0.1, "learning_rate": 9.439999999999999e-07, "loss": 0.403, "step": 120 }, { "epoch": 0.11, "learning_rate": 1.024e-06, "loss": 0.3758, "step": 130 }, { "epoch": 0.12, "learning_rate": 1.1040000000000001e-06, "loss": 0.417, "step": 140 }, { "epoch": 0.13, "learning_rate": 1.1839999999999998e-06, "loss": 0.4178, "step": 150 }, { "epoch": 0.14, "learning_rate": 1.2639999999999999e-06, "loss": 0.4161, "step": 160 }, { "epoch": 0.15, "learning_rate": 1.344e-06, "loss": 0.3947, "step": 170 }, { "epoch": 0.16, "learning_rate": 1.4239999999999998e-06, "loss": 0.4235, "step": 180 }, { "epoch": 0.16, "learning_rate": 1.504e-06, "loss": 0.4218, "step": 190 }, { "epoch": 0.17, "learning_rate": 1.576e-06, "loss": 0.5228, "step": 200 }, { "epoch": 0.18, "learning_rate": 1.656e-06, "loss": 0.3904, "step": 210 }, { "epoch": 0.19, "learning_rate": 1.736e-06, "loss": 0.3903, "step": 220 }, { "epoch": 0.2, "learning_rate": 1.816e-06, "loss": 0.4197, "step": 230 }, { "epoch": 0.21, "learning_rate": 1.8959999999999997e-06, "loss": 0.3821, "step": 240 }, { "epoch": 0.22, "learning_rate": 1.976e-06, "loss": 0.4262, "step": 250 }, { "epoch": 0.23, "learning_rate": 2.056e-06, "loss": 0.4515, "step": 260 }, { "epoch": 0.23, "learning_rate": 2.136e-06, "loss": 0.4216, "step": 270 }, { "epoch": 0.24, "learning_rate": 2.216e-06, "loss": 0.3975, "step": 280 }, { "epoch": 0.25, "learning_rate": 2.2959999999999997e-06, "loss": 0.4543, "step": 290 }, { "epoch": 0.26, "learning_rate": 2.3759999999999998e-06, "loss": 0.4256, "step": 300 }, { "epoch": 0.27, "learning_rate": 2.456e-06, "loss": 0.4268, "step": 310 }, { "epoch": 0.28, "learning_rate": 2.536e-06, "loss": 0.4296, "step": 320 }, { "epoch": 0.29, "learning_rate": 2.616e-06, "loss": 0.4022, "step": 330 }, { "epoch": 0.29, "learning_rate": 2.696e-06, "loss": 0.395, "step": 340 }, { "epoch": 0.3, "learning_rate": 2.7759999999999998e-06, "loss": 0.4097, "step": 350 }, { "epoch": 0.31, "learning_rate": 2.856e-06, "loss": 0.459, "step": 360 }, { "epoch": 0.32, "learning_rate": 2.936e-06, "loss": 0.4474, "step": 370 }, { "epoch": 0.33, "learning_rate": 3.016e-06, "loss": 0.478, "step": 380 }, { "epoch": 0.34, "learning_rate": 3.096e-06, "loss": 0.4229, "step": 390 }, { "epoch": 0.35, "learning_rate": 3.176e-06, "loss": 0.4721, "step": 400 }, { "epoch": 0.36, "learning_rate": 3.256e-06, "loss": 0.4086, "step": 410 }, { "epoch": 0.36, "learning_rate": 3.336e-06, "loss": 0.403, "step": 420 }, { "epoch": 0.37, "learning_rate": 3.4159999999999996e-06, "loss": 0.4572, "step": 430 }, { "epoch": 0.38, "learning_rate": 3.4959999999999996e-06, "loss": 0.4601, "step": 440 }, { "epoch": 0.39, "learning_rate": 3.5759999999999997e-06, "loss": 0.3899, "step": 450 }, { "epoch": 0.4, "learning_rate": 3.656e-06, "loss": 0.4057, "step": 460 }, { "epoch": 0.41, "learning_rate": 3.736e-06, "loss": 0.4259, "step": 470 }, { "epoch": 0.42, "learning_rate": 3.8159999999999995e-06, "loss": 0.4377, "step": 480 }, { "epoch": 0.42, "learning_rate": 3.896e-06, "loss": 0.4794, "step": 490 }, { "epoch": 0.43, "learning_rate": 3.976e-06, "loss": 0.3526, "step": 500 }, { "epoch": 0.44, "learning_rate": 3.999510489510489e-06, "loss": 0.4127, "step": 510 }, { "epoch": 0.45, "learning_rate": 3.998811188811188e-06, "loss": 0.4779, "step": 520 }, { "epoch": 0.46, "learning_rate": 3.998111888111888e-06, "loss": 0.4301, "step": 530 }, { "epoch": 0.47, "learning_rate": 3.997412587412587e-06, "loss": 0.4345, "step": 540 }, { "epoch": 0.48, "learning_rate": 3.996713286713287e-06, "loss": 0.4821, "step": 550 }, { "epoch": 0.49, "learning_rate": 3.996013986013986e-06, "loss": 0.4621, "step": 560 }, { "epoch": 0.49, "learning_rate": 3.995314685314685e-06, "loss": 0.4367, "step": 570 }, { "epoch": 0.5, "learning_rate": 3.994615384615384e-06, "loss": 0.476, "step": 580 }, { "epoch": 0.51, "learning_rate": 3.993916083916084e-06, "loss": 0.4139, "step": 590 }, { "epoch": 0.52, "learning_rate": 3.993216783216783e-06, "loss": 0.4758, "step": 600 }, { "epoch": 0.53, "learning_rate": 3.992517482517483e-06, "loss": 0.4698, "step": 610 }, { "epoch": 0.54, "learning_rate": 3.9918181818181816e-06, "loss": 0.4321, "step": 620 }, { "epoch": 0.55, "learning_rate": 3.991118881118881e-06, "loss": 0.3903, "step": 630 }, { "epoch": 0.55, "learning_rate": 3.9904195804195806e-06, "loss": 0.4298, "step": 640 }, { "epoch": 0.56, "learning_rate": 3.989720279720279e-06, "loss": 0.4029, "step": 650 }, { "epoch": 0.57, "learning_rate": 3.989020979020979e-06, "loss": 0.3981, "step": 660 }, { "epoch": 0.58, "learning_rate": 3.988321678321678e-06, "loss": 0.4351, "step": 670 }, { "epoch": 0.59, "learning_rate": 3.987622377622378e-06, "loss": 0.3695, "step": 680 }, { "epoch": 0.6, "learning_rate": 3.986923076923076e-06, "loss": 0.3704, "step": 690 }, { "epoch": 0.61, "learning_rate": 3.986223776223776e-06, "loss": 0.473, "step": 700 }, { "epoch": 0.61, "learning_rate": 3.985524475524475e-06, "loss": 0.4391, "step": 710 }, { "epoch": 0.62, "learning_rate": 3.984825174825175e-06, "loss": 0.5259, "step": 720 }, { "epoch": 0.63, "learning_rate": 3.9841258741258735e-06, "loss": 0.3641, "step": 730 }, { "epoch": 0.64, "learning_rate": 3.983426573426573e-06, "loss": 0.4462, "step": 740 }, { "epoch": 0.65, "learning_rate": 3.9827272727272725e-06, "loss": 0.4094, "step": 750 }, { "epoch": 0.66, "learning_rate": 3.982027972027972e-06, "loss": 0.4254, "step": 760 }, { "epoch": 0.67, "learning_rate": 3.9813286713286715e-06, "loss": 0.4275, "step": 770 }, { "epoch": 0.68, "learning_rate": 3.98062937062937e-06, "loss": 0.4205, "step": 780 }, { "epoch": 0.68, "learning_rate": 3.97993006993007e-06, "loss": 0.3875, "step": 790 }, { "epoch": 0.69, "learning_rate": 3.979230769230769e-06, "loss": 0.3841, "step": 800 }, { "epoch": 0.7, "learning_rate": 3.978531468531469e-06, "loss": 0.441, "step": 810 }, { "epoch": 0.71, "learning_rate": 3.977832167832168e-06, "loss": 0.384, "step": 820 }, { "epoch": 0.72, "learning_rate": 3.977132867132867e-06, "loss": 0.4162, "step": 830 }, { "epoch": 0.73, "learning_rate": 3.976433566433566e-06, "loss": 0.4469, "step": 840 }, { "epoch": 0.74, "learning_rate": 3.975734265734266e-06, "loss": 0.4394, "step": 850 }, { "epoch": 0.74, "learning_rate": 3.975034965034965e-06, "loss": 0.3957, "step": 860 }, { "epoch": 0.75, "learning_rate": 3.974335664335664e-06, "loss": 0.4293, "step": 870 }, { "epoch": 0.76, "learning_rate": 3.973636363636363e-06, "loss": 0.3948, "step": 880 }, { "epoch": 0.77, "learning_rate": 3.972937062937063e-06, "loss": 0.4366, "step": 890 }, { "epoch": 0.78, "learning_rate": 3.9722377622377615e-06, "loss": 0.4388, "step": 900 }, { "epoch": 0.79, "learning_rate": 3.971538461538461e-06, "loss": 0.3781, "step": 910 }, { "epoch": 0.8, "learning_rate": 3.9708391608391605e-06, "loss": 0.4174, "step": 920 }, { "epoch": 0.81, "learning_rate": 3.97013986013986e-06, "loss": 0.393, "step": 930 }, { "epoch": 0.81, "learning_rate": 3.9694405594405595e-06, "loss": 0.4458, "step": 940 }, { "epoch": 0.82, "learning_rate": 3.968741258741258e-06, "loss": 0.4534, "step": 950 }, { "epoch": 0.83, "learning_rate": 3.968041958041958e-06, "loss": 0.4391, "step": 960 }, { "epoch": 0.84, "learning_rate": 3.967342657342657e-06, "loss": 0.4267, "step": 970 }, { "epoch": 0.85, "learning_rate": 3.966643356643357e-06, "loss": 0.4302, "step": 980 }, { "epoch": 0.86, "learning_rate": 3.965944055944056e-06, "loss": 0.4674, "step": 990 }, { "epoch": 0.87, "learning_rate": 3.965244755244755e-06, "loss": 0.4632, "step": 1000 }, { "epoch": 0.87, "learning_rate": 3.964545454545454e-06, "loss": 0.4233, "step": 1010 }, { "epoch": 0.88, "learning_rate": 3.963846153846154e-06, "loss": 0.4044, "step": 1020 }, { "epoch": 0.89, "learning_rate": 3.963146853146853e-06, "loss": 0.4616, "step": 1030 }, { "epoch": 0.9, "learning_rate": 3.962447552447553e-06, "loss": 0.4386, "step": 1040 }, { "epoch": 0.91, "learning_rate": 3.9617482517482515e-06, "loss": 0.4154, "step": 1050 }, { "epoch": 0.92, "learning_rate": 3.961048951048951e-06, "loss": 0.4102, "step": 1060 }, { "epoch": 0.93, "learning_rate": 3.9603496503496505e-06, "loss": 0.4106, "step": 1070 }, { "epoch": 0.94, "learning_rate": 3.959650349650349e-06, "loss": 0.449, "step": 1080 }, { "epoch": 0.94, "learning_rate": 3.958951048951049e-06, "loss": 0.4715, "step": 1090 }, { "epoch": 0.95, "learning_rate": 3.958251748251748e-06, "loss": 0.4988, "step": 1100 }, { "epoch": 0.96, "learning_rate": 3.957552447552448e-06, "loss": 0.4438, "step": 1110 }, { "epoch": 0.97, "learning_rate": 3.956853146853146e-06, "loss": 0.4058, "step": 1120 }, { "epoch": 0.98, "learning_rate": 3.956153846153846e-06, "loss": 0.3781, "step": 1130 }, { "epoch": 0.99, "learning_rate": 3.955454545454545e-06, "loss": 0.3865, "step": 1140 }, { "epoch": 1.0, "learning_rate": 3.954755244755245e-06, "loss": 0.4806, "step": 1150 }, { "epoch": 1.0, "eval_loss": 0.5673575401306152, "eval_runtime": 131.9861, "eval_samples_per_second": 4.031, "eval_steps_per_second": 2.015, "eval_wer": 0.26997493089927366, "step": 1154 }, { "epoch": 1.01, "learning_rate": 3.954055944055943e-06, "loss": 0.4652, "step": 1160 }, { "epoch": 1.01, "learning_rate": 3.953356643356643e-06, "loss": 0.4642, "step": 1170 }, { "epoch": 1.02, "learning_rate": 3.952657342657342e-06, "loss": 0.4661, "step": 1180 }, { "epoch": 1.03, "learning_rate": 3.951958041958042e-06, "loss": 0.435, "step": 1190 }, { "epoch": 1.04, "learning_rate": 3.951258741258741e-06, "loss": 0.4269, "step": 1200 }, { "epoch": 1.05, "learning_rate": 3.950559440559441e-06, "loss": 0.4067, "step": 1210 }, { "epoch": 1.06, "learning_rate": 3.9498601398601395e-06, "loss": 0.397, "step": 1220 }, { "epoch": 1.07, "learning_rate": 3.949160839160839e-06, "loss": 0.3716, "step": 1230 }, { "epoch": 1.07, "learning_rate": 3.9484615384615385e-06, "loss": 0.446, "step": 1240 }, { "epoch": 1.08, "learning_rate": 3.947762237762238e-06, "loss": 0.4251, "step": 1250 }, { "epoch": 1.09, "learning_rate": 3.947062937062937e-06, "loss": 0.4264, "step": 1260 }, { "epoch": 1.1, "learning_rate": 3.946363636363636e-06, "loss": 0.4241, "step": 1270 }, { "epoch": 1.11, "learning_rate": 3.945664335664336e-06, "loss": 0.3776, "step": 1280 }, { "epoch": 1.12, "learning_rate": 3.944965034965035e-06, "loss": 0.4869, "step": 1290 }, { "epoch": 1.13, "learning_rate": 3.944265734265734e-06, "loss": 0.4406, "step": 1300 }, { "epoch": 1.14, "learning_rate": 3.943566433566433e-06, "loss": 0.3714, "step": 1310 }, { "epoch": 1.14, "learning_rate": 3.942867132867133e-06, "loss": 0.4296, "step": 1320 }, { "epoch": 1.15, "learning_rate": 3.9421678321678314e-06, "loss": 0.4316, "step": 1330 }, { "epoch": 1.16, "learning_rate": 3.941468531468531e-06, "loss": 0.407, "step": 1340 }, { "epoch": 1.17, "learning_rate": 3.9407692307692304e-06, "loss": 0.4837, "step": 1350 }, { "epoch": 1.18, "learning_rate": 3.94006993006993e-06, "loss": 0.4113, "step": 1360 }, { "epoch": 1.19, "learning_rate": 3.9393706293706294e-06, "loss": 0.4394, "step": 1370 }, { "epoch": 1.2, "learning_rate": 3.938671328671328e-06, "loss": 0.4117, "step": 1380 }, { "epoch": 1.2, "learning_rate": 3.937972027972028e-06, "loss": 0.4547, "step": 1390 }, { "epoch": 1.21, "learning_rate": 3.937272727272727e-06, "loss": 0.42, "step": 1400 }, { "epoch": 1.22, "learning_rate": 3.9365734265734266e-06, "loss": 0.5635, "step": 1410 }, { "epoch": 1.23, "learning_rate": 3.935874125874126e-06, "loss": 0.363, "step": 1420 }, { "epoch": 1.24, "learning_rate": 3.935174825174825e-06, "loss": 0.3753, "step": 1430 }, { "epoch": 1.25, "learning_rate": 3.934475524475524e-06, "loss": 0.414, "step": 1440 }, { "epoch": 1.26, "learning_rate": 3.933776223776224e-06, "loss": 0.4094, "step": 1450 }, { "epoch": 1.27, "learning_rate": 3.933076923076923e-06, "loss": 0.4114, "step": 1460 }, { "epoch": 1.27, "learning_rate": 3.932377622377623e-06, "loss": 0.44, "step": 1470 }, { "epoch": 1.28, "learning_rate": 3.931678321678321e-06, "loss": 0.4268, "step": 1480 }, { "epoch": 1.29, "learning_rate": 3.930979020979021e-06, "loss": 0.4548, "step": 1490 }, { "epoch": 1.3, "learning_rate": 3.93027972027972e-06, "loss": 0.4305, "step": 1500 }, { "epoch": 1.31, "learning_rate": 3.929580419580419e-06, "loss": 0.4156, "step": 1510 }, { "epoch": 1.32, "learning_rate": 3.9288811188811185e-06, "loss": 0.3706, "step": 1520 }, { "epoch": 1.33, "learning_rate": 3.928181818181818e-06, "loss": 0.4603, "step": 1530 }, { "epoch": 1.33, "learning_rate": 3.9274825174825175e-06, "loss": 0.4222, "step": 1540 }, { "epoch": 1.34, "learning_rate": 3.926783216783216e-06, "loss": 0.436, "step": 1550 }, { "epoch": 1.35, "learning_rate": 3.926083916083916e-06, "loss": 0.4884, "step": 1560 }, { "epoch": 1.36, "learning_rate": 3.925384615384615e-06, "loss": 0.3887, "step": 1570 }, { "epoch": 1.37, "learning_rate": 3.924685314685315e-06, "loss": 0.3735, "step": 1580 }, { "epoch": 1.38, "learning_rate": 3.923986013986013e-06, "loss": 0.3924, "step": 1590 }, { "epoch": 1.39, "learning_rate": 3.923286713286713e-06, "loss": 0.4278, "step": 1600 }, { "epoch": 1.39, "learning_rate": 3.922587412587412e-06, "loss": 0.4174, "step": 1610 }, { "epoch": 1.4, "learning_rate": 3.921888111888112e-06, "loss": 0.3733, "step": 1620 }, { "epoch": 1.41, "learning_rate": 3.921188811188811e-06, "loss": 0.4129, "step": 1630 }, { "epoch": 1.42, "learning_rate": 3.920489510489511e-06, "loss": 0.3954, "step": 1640 }, { "epoch": 1.43, "learning_rate": 3.919790209790209e-06, "loss": 0.4381, "step": 1650 }, { "epoch": 1.44, "learning_rate": 3.919090909090909e-06, "loss": 0.4233, "step": 1660 }, { "epoch": 1.45, "learning_rate": 3.918391608391608e-06, "loss": 0.4528, "step": 1670 }, { "epoch": 1.46, "learning_rate": 3.917692307692308e-06, "loss": 0.4385, "step": 1680 }, { "epoch": 1.46, "learning_rate": 3.9169930069930066e-06, "loss": 0.4328, "step": 1690 }, { "epoch": 1.47, "learning_rate": 3.916293706293706e-06, "loss": 0.4573, "step": 1700 }, { "epoch": 1.48, "learning_rate": 3.9155944055944056e-06, "loss": 0.483, "step": 1710 }, { "epoch": 1.49, "learning_rate": 3.914895104895105e-06, "loss": 0.4303, "step": 1720 }, { "epoch": 1.5, "learning_rate": 3.914195804195804e-06, "loss": 0.37, "step": 1730 }, { "epoch": 1.51, "learning_rate": 3.913496503496503e-06, "loss": 0.3627, "step": 1740 }, { "epoch": 1.52, "learning_rate": 3.912797202797203e-06, "loss": 0.4677, "step": 1750 }, { "epoch": 1.52, "learning_rate": 3.912097902097902e-06, "loss": 0.3917, "step": 1760 }, { "epoch": 1.53, "learning_rate": 3.911398601398601e-06, "loss": 0.3872, "step": 1770 }, { "epoch": 1.54, "learning_rate": 3.9106993006993e-06, "loss": 0.4367, "step": 1780 }, { "epoch": 1.55, "learning_rate": 3.91e-06, "loss": 0.3843, "step": 1790 }, { "epoch": 1.56, "learning_rate": 3.909300699300699e-06, "loss": 0.4319, "step": 1800 }, { "epoch": 1.57, "learning_rate": 3.908601398601398e-06, "loss": 0.4144, "step": 1810 }, { "epoch": 1.58, "learning_rate": 3.9079020979020975e-06, "loss": 0.4558, "step": 1820 }, { "epoch": 1.59, "learning_rate": 3.907202797202797e-06, "loss": 0.4162, "step": 1830 }, { "epoch": 1.59, "learning_rate": 3.9065034965034965e-06, "loss": 0.4819, "step": 1840 }, { "epoch": 1.6, "learning_rate": 3.905804195804196e-06, "loss": 0.4162, "step": 1850 }, { "epoch": 1.61, "learning_rate": 3.9051048951048955e-06, "loss": 0.4193, "step": 1860 }, { "epoch": 1.62, "learning_rate": 3.904405594405594e-06, "loss": 0.4649, "step": 1870 }, { "epoch": 1.63, "learning_rate": 3.903706293706294e-06, "loss": 0.4096, "step": 1880 }, { "epoch": 1.64, "learning_rate": 3.903006993006993e-06, "loss": 0.4651, "step": 1890 }, { "epoch": 1.65, "learning_rate": 3.902307692307693e-06, "loss": 0.4042, "step": 1900 }, { "epoch": 1.65, "learning_rate": 3.901608391608391e-06, "loss": 0.4365, "step": 1910 }, { "epoch": 1.66, "learning_rate": 3.900909090909091e-06, "loss": 0.4693, "step": 1920 }, { "epoch": 1.67, "learning_rate": 3.90020979020979e-06, "loss": 0.3902, "step": 1930 }, { "epoch": 1.68, "learning_rate": 3.89951048951049e-06, "loss": 0.4166, "step": 1940 }, { "epoch": 1.69, "learning_rate": 3.898811188811188e-06, "loss": 0.4452, "step": 1950 }, { "epoch": 1.7, "learning_rate": 3.898111888111888e-06, "loss": 0.4268, "step": 1960 }, { "epoch": 1.71, "learning_rate": 3.897412587412587e-06, "loss": 0.4681, "step": 1970 }, { "epoch": 1.72, "learning_rate": 3.896713286713286e-06, "loss": 0.4049, "step": 1980 }, { "epoch": 1.72, "learning_rate": 3.8960139860139855e-06, "loss": 0.471, "step": 1990 }, { "epoch": 1.73, "learning_rate": 3.895314685314685e-06, "loss": 0.4484, "step": 2000 }, { "epoch": 1.74, "learning_rate": 3.8946153846153845e-06, "loss": 0.4749, "step": 2010 }, { "epoch": 1.75, "learning_rate": 3.893916083916084e-06, "loss": 0.4929, "step": 2020 }, { "epoch": 1.76, "learning_rate": 3.893216783216783e-06, "loss": 0.4125, "step": 2030 }, { "epoch": 1.77, "learning_rate": 3.892517482517482e-06, "loss": 0.4171, "step": 2040 }, { "epoch": 1.78, "learning_rate": 3.891818181818182e-06, "loss": 0.5211, "step": 2050 }, { "epoch": 1.78, "learning_rate": 3.891118881118881e-06, "loss": 0.4221, "step": 2060 }, { "epoch": 1.79, "learning_rate": 3.890419580419581e-06, "loss": 0.4622, "step": 2070 }, { "epoch": 1.8, "learning_rate": 3.889720279720279e-06, "loss": 0.403, "step": 2080 }, { "epoch": 1.81, "learning_rate": 3.889020979020979e-06, "loss": 0.432, "step": 2090 }, { "epoch": 1.82, "learning_rate": 3.888321678321678e-06, "loss": 0.439, "step": 2100 }, { "epoch": 1.83, "learning_rate": 3.887622377622378e-06, "loss": 0.4619, "step": 2110 }, { "epoch": 1.84, "learning_rate": 3.8869230769230765e-06, "loss": 0.4404, "step": 2120 }, { "epoch": 1.85, "learning_rate": 3.886223776223776e-06, "loss": 0.4447, "step": 2130 }, { "epoch": 1.85, "learning_rate": 3.8855244755244755e-06, "loss": 0.4246, "step": 2140 }, { "epoch": 1.86, "learning_rate": 3.884825174825175e-06, "loss": 0.4289, "step": 2150 }, { "epoch": 1.87, "learning_rate": 3.884125874125874e-06, "loss": 0.5245, "step": 2160 }, { "epoch": 1.88, "learning_rate": 3.883426573426573e-06, "loss": 0.405, "step": 2170 }, { "epoch": 1.89, "learning_rate": 3.882727272727273e-06, "loss": 0.4307, "step": 2180 }, { "epoch": 1.9, "learning_rate": 3.882027972027972e-06, "loss": 0.4372, "step": 2190 }, { "epoch": 1.91, "learning_rate": 3.881328671328671e-06, "loss": 0.4754, "step": 2200 }, { "epoch": 1.91, "learning_rate": 3.88062937062937e-06, "loss": 0.4121, "step": 2210 }, { "epoch": 1.92, "learning_rate": 3.88e-06, "loss": 0.44, "step": 2220 }, { "epoch": 1.93, "learning_rate": 3.879300699300699e-06, "loss": 0.4103, "step": 2230 }, { "epoch": 1.94, "learning_rate": 3.878601398601398e-06, "loss": 0.4443, "step": 2240 }, { "epoch": 1.95, "learning_rate": 3.877902097902098e-06, "loss": 0.4186, "step": 2250 }, { "epoch": 1.96, "learning_rate": 3.877202797202797e-06, "loss": 0.4083, "step": 2260 }, { "epoch": 1.97, "learning_rate": 3.876503496503497e-06, "loss": 0.4846, "step": 2270 }, { "epoch": 1.98, "learning_rate": 3.875804195804195e-06, "loss": 0.4019, "step": 2280 }, { "epoch": 1.98, "learning_rate": 3.875104895104895e-06, "loss": 0.4598, "step": 2290 }, { "epoch": 1.99, "learning_rate": 3.874405594405594e-06, "loss": 0.4109, "step": 2300 }, { "epoch": 2.0, "eval_loss": 0.5667211413383484, "eval_runtime": 132.8098, "eval_samples_per_second": 4.006, "eval_steps_per_second": 2.003, "eval_wer": 0.2739602751173105, "step": 2308 }, { "epoch": 2.0, "learning_rate": 3.873706293706294e-06, "loss": 0.4696, "step": 2310 }, { "epoch": 2.01, "learning_rate": 3.8730069930069925e-06, "loss": 0.4279, "step": 2320 }, { "epoch": 2.02, "learning_rate": 3.872307692307692e-06, "loss": 0.4668, "step": 2330 }, { "epoch": 2.03, "learning_rate": 3.8716083916083915e-06, "loss": 0.3705, "step": 2340 }, { "epoch": 2.04, "learning_rate": 3.870909090909091e-06, "loss": 0.4757, "step": 2350 }, { "epoch": 2.05, "learning_rate": 3.87020979020979e-06, "loss": 0.4652, "step": 2360 }, { "epoch": 2.05, "learning_rate": 3.869510489510489e-06, "loss": 0.4144, "step": 2370 }, { "epoch": 2.06, "learning_rate": 3.868811188811189e-06, "loss": 0.4441, "step": 2380 }, { "epoch": 2.07, "learning_rate": 3.868111888111888e-06, "loss": 0.4188, "step": 2390 }, { "epoch": 2.08, "learning_rate": 3.867412587412587e-06, "loss": 0.4725, "step": 2400 }, { "epoch": 2.09, "learning_rate": 3.866713286713286e-06, "loss": 0.4527, "step": 2410 }, { "epoch": 2.1, "learning_rate": 3.866013986013986e-06, "loss": 0.4182, "step": 2420 }, { "epoch": 2.11, "learning_rate": 3.865314685314685e-06, "loss": 0.3844, "step": 2430 }, { "epoch": 2.11, "learning_rate": 3.864615384615384e-06, "loss": 0.4113, "step": 2440 }, { "epoch": 2.12, "learning_rate": 3.8639160839160835e-06, "loss": 0.4282, "step": 2450 }, { "epoch": 2.13, "learning_rate": 3.863216783216783e-06, "loss": 0.4842, "step": 2460 }, { "epoch": 2.14, "learning_rate": 3.8625174825174825e-06, "loss": 0.4822, "step": 2470 }, { "epoch": 2.15, "learning_rate": 3.861818181818182e-06, "loss": 0.3696, "step": 2480 }, { "epoch": 2.16, "learning_rate": 3.8611188811188815e-06, "loss": 0.4124, "step": 2490 }, { "epoch": 2.17, "learning_rate": 3.86041958041958e-06, "loss": 0.4624, "step": 2500 }, { "epoch": 2.17, "learning_rate": 3.85972027972028e-06, "loss": 0.3711, "step": 2510 }, { "epoch": 2.18, "learning_rate": 3.859020979020979e-06, "loss": 0.4044, "step": 2520 }, { "epoch": 2.19, "learning_rate": 3.858321678321679e-06, "loss": 0.4136, "step": 2530 }, { "epoch": 2.2, "learning_rate": 3.857622377622377e-06, "loss": 0.3982, "step": 2540 }, { "epoch": 2.21, "learning_rate": 3.856923076923077e-06, "loss": 0.4259, "step": 2550 }, { "epoch": 2.22, "learning_rate": 3.856223776223776e-06, "loss": 0.4588, "step": 2560 }, { "epoch": 2.23, "learning_rate": 3.855524475524475e-06, "loss": 0.4043, "step": 2570 }, { "epoch": 2.24, "learning_rate": 3.854825174825174e-06, "loss": 0.4745, "step": 2580 }, { "epoch": 2.24, "learning_rate": 3.854125874125874e-06, "loss": 0.3965, "step": 2590 }, { "epoch": 2.25, "learning_rate": 3.853426573426573e-06, "loss": 0.449, "step": 2600 }, { "epoch": 2.26, "learning_rate": 3.852727272727272e-06, "loss": 0.4828, "step": 2610 }, { "epoch": 2.27, "learning_rate": 3.8520279720279715e-06, "loss": 0.4536, "step": 2620 }, { "epoch": 2.28, "learning_rate": 3.851328671328671e-06, "loss": 0.4621, "step": 2630 }, { "epoch": 2.29, "learning_rate": 3.8506293706293705e-06, "loss": 0.396, "step": 2640 }, { "epoch": 2.3, "learning_rate": 3.84993006993007e-06, "loss": 0.4883, "step": 2650 }, { "epoch": 2.3, "learning_rate": 3.849230769230769e-06, "loss": 0.4217, "step": 2660 }, { "epoch": 2.31, "learning_rate": 3.848531468531468e-06, "loss": 0.479, "step": 2670 }, { "epoch": 2.32, "learning_rate": 3.847832167832168e-06, "loss": 0.4179, "step": 2680 }, { "epoch": 2.33, "learning_rate": 3.847132867132867e-06, "loss": 0.4314, "step": 2690 }, { "epoch": 2.34, "learning_rate": 3.846433566433567e-06, "loss": 0.4006, "step": 2700 }, { "epoch": 2.35, "learning_rate": 3.845734265734266e-06, "loss": 0.4523, "step": 2710 }, { "epoch": 2.36, "learning_rate": 3.845034965034965e-06, "loss": 0.4371, "step": 2720 }, { "epoch": 2.37, "learning_rate": 3.844335664335664e-06, "loss": 0.4165, "step": 2730 }, { "epoch": 2.37, "learning_rate": 3.843636363636364e-06, "loss": 0.4169, "step": 2740 }, { "epoch": 2.38, "learning_rate": 3.8429370629370624e-06, "loss": 0.4272, "step": 2750 }, { "epoch": 2.39, "learning_rate": 3.842237762237762e-06, "loss": 0.4621, "step": 2760 }, { "epoch": 2.4, "learning_rate": 3.8415384615384614e-06, "loss": 0.4041, "step": 2770 }, { "epoch": 2.41, "learning_rate": 3.840839160839161e-06, "loss": 0.4403, "step": 2780 }, { "epoch": 2.42, "learning_rate": 3.84013986013986e-06, "loss": 0.4194, "step": 2790 }, { "epoch": 2.43, "learning_rate": 3.839440559440559e-06, "loss": 0.447, "step": 2800 }, { "epoch": 2.43, "learning_rate": 3.838741258741259e-06, "loss": 0.3986, "step": 2810 }, { "epoch": 2.44, "learning_rate": 3.838041958041958e-06, "loss": 0.4245, "step": 2820 }, { "epoch": 2.45, "learning_rate": 3.837342657342657e-06, "loss": 0.4412, "step": 2830 }, { "epoch": 2.46, "learning_rate": 3.836643356643356e-06, "loss": 0.4128, "step": 2840 }, { "epoch": 2.47, "learning_rate": 3.835944055944056e-06, "loss": 0.4236, "step": 2850 }, { "epoch": 2.48, "learning_rate": 3.835244755244755e-06, "loss": 0.5051, "step": 2860 }, { "epoch": 2.49, "learning_rate": 3.834545454545455e-06, "loss": 0.3899, "step": 2870 }, { "epoch": 2.5, "learning_rate": 3.833846153846153e-06, "loss": 0.402, "step": 2880 }, { "epoch": 2.5, "learning_rate": 3.833146853146853e-06, "loss": 0.4073, "step": 2890 }, { "epoch": 2.51, "learning_rate": 3.832447552447552e-06, "loss": 0.4324, "step": 2900 }, { "epoch": 2.52, "learning_rate": 3.831748251748252e-06, "loss": 0.4846, "step": 2910 }, { "epoch": 2.53, "learning_rate": 3.831048951048951e-06, "loss": 0.4426, "step": 2920 }, { "epoch": 2.54, "learning_rate": 3.83034965034965e-06, "loss": 0.3916, "step": 2930 }, { "epoch": 2.55, "learning_rate": 3.8296503496503495e-06, "loss": 0.3975, "step": 2940 }, { "epoch": 2.56, "learning_rate": 3.828951048951049e-06, "loss": 0.439, "step": 2950 }, { "epoch": 2.56, "learning_rate": 3.8282517482517485e-06, "loss": 0.4785, "step": 2960 }, { "epoch": 2.57, "learning_rate": 3.827552447552447e-06, "loss": 0.4355, "step": 2970 }, { "epoch": 2.58, "learning_rate": 3.826853146853147e-06, "loss": 0.3911, "step": 2980 }, { "epoch": 2.59, "learning_rate": 3.826153846153846e-06, "loss": 0.4459, "step": 2990 }, { "epoch": 2.6, "learning_rate": 3.825454545454546e-06, "loss": 0.4879, "step": 3000 }, { "epoch": 2.61, "learning_rate": 3.824755244755244e-06, "loss": 0.4449, "step": 3010 }, { "epoch": 2.62, "learning_rate": 3.824055944055944e-06, "loss": 0.4061, "step": 3020 }, { "epoch": 2.63, "learning_rate": 3.823356643356643e-06, "loss": 0.3946, "step": 3030 }, { "epoch": 2.63, "learning_rate": 3.822657342657342e-06, "loss": 0.4905, "step": 3040 }, { "epoch": 2.64, "learning_rate": 3.8219580419580414e-06, "loss": 0.4251, "step": 3050 }, { "epoch": 2.65, "learning_rate": 3.821258741258741e-06, "loss": 0.4532, "step": 3060 }, { "epoch": 2.66, "learning_rate": 3.82055944055944e-06, "loss": 0.3845, "step": 3070 }, { "epoch": 2.67, "learning_rate": 3.81986013986014e-06, "loss": 0.4218, "step": 3080 }, { "epoch": 2.68, "learning_rate": 3.8191608391608386e-06, "loss": 0.3965, "step": 3090 }, { "epoch": 2.69, "learning_rate": 3.818461538461538e-06, "loss": 0.4261, "step": 3100 }, { "epoch": 2.69, "learning_rate": 3.8177622377622376e-06, "loss": 0.3952, "step": 3110 }, { "epoch": 2.7, "learning_rate": 3.817062937062937e-06, "loss": 0.4337, "step": 3120 }, { "epoch": 2.71, "learning_rate": 3.8163636363636366e-06, "loss": 0.3518, "step": 3130 }, { "epoch": 2.72, "learning_rate": 3.815664335664336e-06, "loss": 0.4675, "step": 3140 }, { "epoch": 2.73, "learning_rate": 3.814965034965035e-06, "loss": 0.4442, "step": 3150 }, { "epoch": 2.74, "learning_rate": 3.814265734265734e-06, "loss": 0.4365, "step": 3160 }, { "epoch": 2.75, "learning_rate": 3.8135664335664333e-06, "loss": 0.3938, "step": 3170 }, { "epoch": 2.76, "learning_rate": 3.8128671328671328e-06, "loss": 0.3778, "step": 3180 }, { "epoch": 2.76, "learning_rate": 3.812167832167832e-06, "loss": 0.43, "step": 3190 }, { "epoch": 2.77, "learning_rate": 3.8114685314685313e-06, "loss": 0.3924, "step": 3200 }, { "epoch": 2.78, "learning_rate": 3.810769230769231e-06, "loss": 0.4437, "step": 3210 }, { "epoch": 2.79, "learning_rate": 3.81006993006993e-06, "loss": 0.4305, "step": 3220 }, { "epoch": 2.8, "learning_rate": 3.809370629370629e-06, "loss": 0.4576, "step": 3230 }, { "epoch": 2.81, "learning_rate": 3.8086713286713285e-06, "loss": 0.4286, "step": 3240 }, { "epoch": 2.82, "learning_rate": 3.807972027972028e-06, "loss": 0.4298, "step": 3250 }, { "epoch": 2.82, "learning_rate": 3.807272727272727e-06, "loss": 0.4584, "step": 3260 }, { "epoch": 2.83, "learning_rate": 3.8065734265734265e-06, "loss": 0.4241, "step": 3270 }, { "epoch": 2.84, "learning_rate": 3.8058741258741256e-06, "loss": 0.44, "step": 3280 }, { "epoch": 2.85, "learning_rate": 3.8051748251748247e-06, "loss": 0.3742, "step": 3290 }, { "epoch": 2.86, "learning_rate": 3.804475524475524e-06, "loss": 0.3989, "step": 3300 }, { "epoch": 2.87, "learning_rate": 3.8037762237762237e-06, "loss": 0.44, "step": 3310 }, { "epoch": 2.88, "learning_rate": 3.803076923076923e-06, "loss": 0.4348, "step": 3320 }, { "epoch": 2.89, "learning_rate": 3.8023776223776223e-06, "loss": 0.424, "step": 3330 }, { "epoch": 2.89, "learning_rate": 3.8016783216783213e-06, "loss": 0.3793, "step": 3340 }, { "epoch": 2.9, "learning_rate": 3.800979020979021e-06, "loss": 0.4532, "step": 3350 }, { "epoch": 2.91, "learning_rate": 3.8002797202797203e-06, "loss": 0.4313, "step": 3360 }, { "epoch": 2.92, "learning_rate": 3.7995804195804194e-06, "loss": 0.4326, "step": 3370 }, { "epoch": 2.93, "learning_rate": 3.798881118881119e-06, "loss": 0.3999, "step": 3380 }, { "epoch": 2.94, "learning_rate": 3.798181818181818e-06, "loss": 0.4128, "step": 3390 }, { "epoch": 2.95, "learning_rate": 3.797482517482517e-06, "loss": 0.4218, "step": 3400 }, { "epoch": 2.95, "learning_rate": 3.7967832167832165e-06, "loss": 0.4248, "step": 3410 }, { "epoch": 2.96, "learning_rate": 3.796083916083916e-06, "loss": 0.3458, "step": 3420 }, { "epoch": 2.97, "learning_rate": 3.7953846153846155e-06, "loss": 0.4079, "step": 3430 }, { "epoch": 2.98, "learning_rate": 3.794685314685314e-06, "loss": 0.43, "step": 3440 }, { "epoch": 2.99, "learning_rate": 3.7939860139860137e-06, "loss": 0.4257, "step": 3450 }, { "epoch": 3.0, "learning_rate": 3.793286713286713e-06, "loss": 0.4183, "step": 3460 }, { "epoch": 3.0, "eval_loss": 0.5650942921638489, "eval_runtime": 133.5311, "eval_samples_per_second": 3.984, "eval_steps_per_second": 1.992, "eval_wer": 0.2742173940991194, "step": 3462 }, { "epoch": 3.01, "learning_rate": 3.7925874125874123e-06, "loss": 0.4397, "step": 3470 }, { "epoch": 3.02, "learning_rate": 3.7918881118881117e-06, "loss": 0.4497, "step": 3480 }, { "epoch": 3.02, "learning_rate": 3.7911888111888112e-06, "loss": 0.4424, "step": 3490 }, { "epoch": 3.03, "learning_rate": 3.7904895104895103e-06, "loss": 0.5406, "step": 3500 }, { "epoch": 3.04, "learning_rate": 3.7897902097902094e-06, "loss": 0.5165, "step": 3510 }, { "epoch": 3.05, "learning_rate": 3.789090909090909e-06, "loss": 0.388, "step": 3520 }, { "epoch": 3.06, "learning_rate": 3.7883916083916084e-06, "loss": 0.3958, "step": 3530 }, { "epoch": 3.07, "learning_rate": 3.787692307692308e-06, "loss": 0.3826, "step": 3540 }, { "epoch": 3.08, "learning_rate": 3.7869930069930065e-06, "loss": 0.4399, "step": 3550 }, { "epoch": 3.08, "learning_rate": 3.786293706293706e-06, "loss": 0.4987, "step": 3560 }, { "epoch": 3.09, "learning_rate": 3.7855944055944055e-06, "loss": 0.4862, "step": 3570 }, { "epoch": 3.1, "learning_rate": 3.7848951048951046e-06, "loss": 0.4197, "step": 3580 }, { "epoch": 3.11, "learning_rate": 3.784195804195804e-06, "loss": 0.4305, "step": 3590 }, { "epoch": 3.12, "learning_rate": 3.7834965034965036e-06, "loss": 0.4473, "step": 3600 }, { "epoch": 3.13, "learning_rate": 3.7827972027972027e-06, "loss": 0.4162, "step": 3610 }, { "epoch": 3.14, "learning_rate": 3.7820979020979017e-06, "loss": 0.4128, "step": 3620 }, { "epoch": 3.15, "learning_rate": 3.7813986013986012e-06, "loss": 0.4461, "step": 3630 }, { "epoch": 3.15, "learning_rate": 3.7806993006993007e-06, "loss": 0.3405, "step": 3640 }, { "epoch": 3.16, "learning_rate": 3.78e-06, "loss": 0.4331, "step": 3650 }, { "epoch": 3.17, "learning_rate": 3.779300699300699e-06, "loss": 0.4181, "step": 3660 }, { "epoch": 3.18, "learning_rate": 3.7786013986013984e-06, "loss": 0.4451, "step": 3670 }, { "epoch": 3.19, "learning_rate": 3.777902097902098e-06, "loss": 0.4119, "step": 3680 }, { "epoch": 3.2, "learning_rate": 3.777202797202797e-06, "loss": 0.4076, "step": 3690 }, { "epoch": 3.21, "learning_rate": 3.7765034965034964e-06, "loss": 0.4246, "step": 3700 }, { "epoch": 3.21, "learning_rate": 3.775804195804196e-06, "loss": 0.4545, "step": 3710 }, { "epoch": 3.22, "learning_rate": 3.7751048951048946e-06, "loss": 0.4589, "step": 3720 }, { "epoch": 3.23, "learning_rate": 3.774405594405594e-06, "loss": 0.3718, "step": 3730 }, { "epoch": 3.24, "learning_rate": 3.7737062937062936e-06, "loss": 0.4376, "step": 3740 }, { "epoch": 3.25, "learning_rate": 3.773006993006993e-06, "loss": 0.4793, "step": 3750 }, { "epoch": 3.26, "learning_rate": 3.772307692307692e-06, "loss": 0.4543, "step": 3760 }, { "epoch": 3.27, "learning_rate": 3.7716083916083912e-06, "loss": 0.4228, "step": 3770 }, { "epoch": 3.28, "learning_rate": 3.7709090909090907e-06, "loss": 0.4624, "step": 3780 }, { "epoch": 3.28, "learning_rate": 3.7702097902097902e-06, "loss": 0.4135, "step": 3790 }, { "epoch": 3.29, "learning_rate": 3.7695104895104893e-06, "loss": 0.3678, "step": 3800 }, { "epoch": 3.3, "learning_rate": 3.768811188811189e-06, "loss": 0.5265, "step": 3810 }, { "epoch": 3.31, "learning_rate": 3.768111888111888e-06, "loss": 0.4423, "step": 3820 }, { "epoch": 3.32, "learning_rate": 3.767412587412587e-06, "loss": 0.3714, "step": 3830 }, { "epoch": 3.33, "learning_rate": 3.7667132867132864e-06, "loss": 0.4268, "step": 3840 }, { "epoch": 3.34, "learning_rate": 3.766013986013986e-06, "loss": 0.4489, "step": 3850 }, { "epoch": 3.34, "learning_rate": 3.7653146853146854e-06, "loss": 0.5035, "step": 3860 }, { "epoch": 3.35, "learning_rate": 3.7646153846153845e-06, "loss": 0.4687, "step": 3870 }, { "epoch": 3.36, "learning_rate": 3.7639160839160836e-06, "loss": 0.4121, "step": 3880 }, { "epoch": 3.37, "learning_rate": 3.763216783216783e-06, "loss": 0.369, "step": 3890 }, { "epoch": 3.38, "learning_rate": 3.762517482517482e-06, "loss": 0.4527, "step": 3900 }, { "epoch": 3.39, "learning_rate": 3.7618181818181816e-06, "loss": 0.4308, "step": 3910 }, { "epoch": 3.4, "learning_rate": 3.761118881118881e-06, "loss": 0.4128, "step": 3920 }, { "epoch": 3.41, "learning_rate": 3.7604195804195802e-06, "loss": 0.521, "step": 3930 }, { "epoch": 3.41, "learning_rate": 3.7597202797202793e-06, "loss": 0.4238, "step": 3940 }, { "epoch": 3.42, "learning_rate": 3.7590209790209788e-06, "loss": 0.4704, "step": 3950 }, { "epoch": 3.43, "learning_rate": 3.7583216783216783e-06, "loss": 0.4642, "step": 3960 }, { "epoch": 3.44, "learning_rate": 3.7576223776223778e-06, "loss": 0.4667, "step": 3970 }, { "epoch": 3.45, "learning_rate": 3.7569230769230764e-06, "loss": 0.4269, "step": 3980 }, { "epoch": 3.46, "learning_rate": 3.756223776223776e-06, "loss": 0.4289, "step": 3990 }, { "epoch": 3.47, "learning_rate": 3.7555244755244754e-06, "loss": 0.4133, "step": 4000 }, { "epoch": 3.47, "learning_rate": 3.7548251748251745e-06, "loss": 0.421, "step": 4010 }, { "epoch": 3.48, "learning_rate": 3.754125874125874e-06, "loss": 0.4431, "step": 4020 }, { "epoch": 3.49, "learning_rate": 3.7534265734265735e-06, "loss": 0.42, "step": 4030 }, { "epoch": 3.5, "learning_rate": 3.7527272727272726e-06, "loss": 0.3878, "step": 4040 }, { "epoch": 3.51, "learning_rate": 3.7520279720279716e-06, "loss": 0.4353, "step": 4050 }, { "epoch": 3.52, "learning_rate": 3.751328671328671e-06, "loss": 0.4756, "step": 4060 }, { "epoch": 3.53, "learning_rate": 3.7506293706293706e-06, "loss": 0.4126, "step": 4070 }, { "epoch": 3.54, "learning_rate": 3.7499300699300697e-06, "loss": 0.4228, "step": 4080 }, { "epoch": 3.54, "learning_rate": 3.7492307692307688e-06, "loss": 0.4061, "step": 4090 }, { "epoch": 3.55, "learning_rate": 3.7485314685314683e-06, "loss": 0.4199, "step": 4100 }, { "epoch": 3.56, "learning_rate": 3.7478321678321678e-06, "loss": 0.3854, "step": 4110 }, { "epoch": 3.57, "learning_rate": 3.747132867132867e-06, "loss": 0.4457, "step": 4120 }, { "epoch": 3.58, "learning_rate": 3.7464335664335663e-06, "loss": 0.4599, "step": 4130 }, { "epoch": 3.59, "learning_rate": 3.745734265734266e-06, "loss": 0.4054, "step": 4140 }, { "epoch": 3.6, "learning_rate": 3.745034965034965e-06, "loss": 0.3808, "step": 4150 }, { "epoch": 3.6, "learning_rate": 3.744335664335664e-06, "loss": 0.4587, "step": 4160 }, { "epoch": 3.61, "learning_rate": 3.7436363636363635e-06, "loss": 0.4025, "step": 4170 }, { "epoch": 3.62, "learning_rate": 3.742937062937063e-06, "loss": 0.4518, "step": 4180 }, { "epoch": 3.63, "learning_rate": 3.742237762237762e-06, "loss": 0.4274, "step": 4190 }, { "epoch": 3.64, "learning_rate": 3.741538461538461e-06, "loss": 0.3934, "step": 4200 }, { "epoch": 3.65, "learning_rate": 3.7408391608391606e-06, "loss": 0.4389, "step": 4210 }, { "epoch": 3.66, "learning_rate": 3.74013986013986e-06, "loss": 0.4551, "step": 4220 }, { "epoch": 3.67, "learning_rate": 3.739440559440559e-06, "loss": 0.437, "step": 4230 }, { "epoch": 3.67, "learning_rate": 3.7387412587412587e-06, "loss": 0.3626, "step": 4240 }, { "epoch": 3.68, "learning_rate": 3.738041958041958e-06, "loss": 0.4564, "step": 4250 }, { "epoch": 3.69, "learning_rate": 3.737342657342657e-06, "loss": 0.4565, "step": 4260 }, { "epoch": 3.7, "learning_rate": 3.7366433566433563e-06, "loss": 0.3513, "step": 4270 }, { "epoch": 3.71, "learning_rate": 3.735944055944056e-06, "loss": 0.4132, "step": 4280 }, { "epoch": 3.72, "learning_rate": 3.7352447552447553e-06, "loss": 0.4435, "step": 4290 }, { "epoch": 3.73, "learning_rate": 3.7345454545454544e-06, "loss": 0.4355, "step": 4300 }, { "epoch": 3.73, "learning_rate": 3.7338461538461535e-06, "loss": 0.4505, "step": 4310 }, { "epoch": 3.74, "learning_rate": 3.733146853146853e-06, "loss": 0.4314, "step": 4320 }, { "epoch": 3.75, "learning_rate": 3.7324475524475525e-06, "loss": 0.4169, "step": 4330 }, { "epoch": 3.76, "learning_rate": 3.7317482517482515e-06, "loss": 0.4096, "step": 4340 }, { "epoch": 3.77, "learning_rate": 3.731048951048951e-06, "loss": 0.4357, "step": 4350 }, { "epoch": 3.78, "learning_rate": 3.73034965034965e-06, "loss": 0.4208, "step": 4360 }, { "epoch": 3.79, "learning_rate": 3.729650349650349e-06, "loss": 0.4181, "step": 4370 }, { "epoch": 3.8, "learning_rate": 3.7289510489510487e-06, "loss": 0.3545, "step": 4380 }, { "epoch": 3.8, "learning_rate": 3.728251748251748e-06, "loss": 0.4258, "step": 4390 }, { "epoch": 3.81, "learning_rate": 3.7275524475524477e-06, "loss": 0.435, "step": 4400 }, { "epoch": 3.82, "learning_rate": 3.7268531468531468e-06, "loss": 0.4027, "step": 4410 }, { "epoch": 3.83, "learning_rate": 3.726153846153846e-06, "loss": 0.3978, "step": 4420 }, { "epoch": 3.84, "learning_rate": 3.7254545454545453e-06, "loss": 0.4087, "step": 4430 }, { "epoch": 3.85, "learning_rate": 3.7247552447552444e-06, "loss": 0.4328, "step": 4440 }, { "epoch": 3.86, "learning_rate": 3.724055944055944e-06, "loss": 0.4419, "step": 4450 }, { "epoch": 3.86, "learning_rate": 3.7233566433566434e-06, "loss": 0.4289, "step": 4460 }, { "epoch": 3.87, "learning_rate": 3.7226573426573425e-06, "loss": 0.4208, "step": 4470 }, { "epoch": 3.88, "learning_rate": 3.7219580419580415e-06, "loss": 0.3757, "step": 4480 }, { "epoch": 3.89, "learning_rate": 3.721258741258741e-06, "loss": 0.4707, "step": 4490 }, { "epoch": 3.9, "learning_rate": 3.7205594405594405e-06, "loss": 0.4446, "step": 4500 }, { "epoch": 3.91, "learning_rate": 3.71986013986014e-06, "loss": 0.4387, "step": 4510 }, { "epoch": 3.92, "learning_rate": 3.719160839160839e-06, "loss": 0.3761, "step": 4520 }, { "epoch": 3.93, "learning_rate": 3.718461538461538e-06, "loss": 0.3772, "step": 4530 }, { "epoch": 3.93, "learning_rate": 3.7177622377622377e-06, "loss": 0.3546, "step": 4540 }, { "epoch": 3.94, "learning_rate": 3.7170629370629367e-06, "loss": 0.3831, "step": 4550 }, { "epoch": 3.95, "learning_rate": 3.7163636363636362e-06, "loss": 0.4194, "step": 4560 }, { "epoch": 3.96, "learning_rate": 3.7156643356643357e-06, "loss": 0.3452, "step": 4570 }, { "epoch": 3.97, "learning_rate": 3.714965034965035e-06, "loss": 0.426, "step": 4580 }, { "epoch": 3.98, "learning_rate": 3.714265734265734e-06, "loss": 0.4237, "step": 4590 }, { "epoch": 3.99, "learning_rate": 3.7135664335664334e-06, "loss": 0.4047, "step": 4600 }, { "epoch": 3.99, "learning_rate": 3.712867132867133e-06, "loss": 0.4618, "step": 4610 }, { "epoch": 4.0, "eval_loss": 0.5653170347213745, "eval_runtime": 133.4467, "eval_samples_per_second": 3.987, "eval_steps_per_second": 1.993, "eval_wer": 0.2675323005720897, "step": 4616 }, { "epoch": 4.0, "learning_rate": 3.712167832167832e-06, "loss": 0.4252, "step": 4620 }, { "epoch": 4.01, "learning_rate": 3.711468531468531e-06, "loss": 0.4812, "step": 4630 }, { "epoch": 4.02, "learning_rate": 3.7107692307692305e-06, "loss": 0.3366, "step": 4640 }, { "epoch": 4.03, "learning_rate": 3.71006993006993e-06, "loss": 0.4217, "step": 4650 }, { "epoch": 4.04, "learning_rate": 3.709370629370629e-06, "loss": 0.459, "step": 4660 }, { "epoch": 4.05, "learning_rate": 3.7086713286713286e-06, "loss": 0.4434, "step": 4670 }, { "epoch": 4.06, "learning_rate": 3.707972027972028e-06, "loss": 0.4243, "step": 4680 }, { "epoch": 4.06, "learning_rate": 3.7072727272727267e-06, "loss": 0.4106, "step": 4690 }, { "epoch": 4.07, "learning_rate": 3.7065734265734262e-06, "loss": 0.4261, "step": 4700 }, { "epoch": 4.08, "learning_rate": 3.7058741258741257e-06, "loss": 0.4321, "step": 4710 }, { "epoch": 4.09, "learning_rate": 3.7051748251748252e-06, "loss": 0.4066, "step": 4720 }, { "epoch": 4.1, "learning_rate": 3.7044755244755243e-06, "loss": 0.3874, "step": 4730 }, { "epoch": 4.11, "learning_rate": 3.7037762237762234e-06, "loss": 0.3956, "step": 4740 }, { "epoch": 4.12, "learning_rate": 3.703076923076923e-06, "loss": 0.3823, "step": 4750 }, { "epoch": 4.12, "learning_rate": 3.7023776223776224e-06, "loss": 0.3953, "step": 4760 }, { "epoch": 4.13, "learning_rate": 3.7016783216783214e-06, "loss": 0.4628, "step": 4770 }, { "epoch": 4.14, "learning_rate": 3.700979020979021e-06, "loss": 0.4156, "step": 4780 }, { "epoch": 4.15, "learning_rate": 3.7002797202797204e-06, "loss": 0.3769, "step": 4790 }, { "epoch": 4.16, "learning_rate": 3.699580419580419e-06, "loss": 0.3838, "step": 4800 }, { "epoch": 4.17, "learning_rate": 3.6988811188811186e-06, "loss": 0.3492, "step": 4810 }, { "epoch": 4.18, "learning_rate": 3.698181818181818e-06, "loss": 0.3568, "step": 4820 }, { "epoch": 4.19, "learning_rate": 3.6974825174825176e-06, "loss": 0.4544, "step": 4830 }, { "epoch": 4.19, "learning_rate": 3.6967832167832167e-06, "loss": 0.3981, "step": 4840 }, { "epoch": 4.2, "learning_rate": 3.6960839160839157e-06, "loss": 0.4105, "step": 4850 }, { "epoch": 4.21, "learning_rate": 3.6953846153846152e-06, "loss": 0.422, "step": 4860 }, { "epoch": 4.22, "learning_rate": 3.6946853146853143e-06, "loss": 0.3775, "step": 4870 }, { "epoch": 4.23, "learning_rate": 3.693986013986014e-06, "loss": 0.4763, "step": 4880 }, { "epoch": 4.24, "learning_rate": 3.6932867132867133e-06, "loss": 0.3996, "step": 4890 }, { "epoch": 4.25, "learning_rate": 3.6925874125874128e-06, "loss": 0.4157, "step": 4900 }, { "epoch": 4.25, "learning_rate": 3.6918881118881114e-06, "loss": 0.4038, "step": 4910 }, { "epoch": 4.26, "learning_rate": 3.691188811188811e-06, "loss": 0.4375, "step": 4920 }, { "epoch": 4.27, "learning_rate": 3.6904895104895104e-06, "loss": 0.3983, "step": 4930 }, { "epoch": 4.28, "learning_rate": 3.68979020979021e-06, "loss": 0.376, "step": 4940 }, { "epoch": 4.29, "learning_rate": 3.689090909090909e-06, "loss": 0.4349, "step": 4950 }, { "epoch": 4.3, "learning_rate": 3.688391608391608e-06, "loss": 0.4193, "step": 4960 }, { "epoch": 4.31, "learning_rate": 3.6876923076923076e-06, "loss": 0.4872, "step": 4970 }, { "epoch": 4.32, "learning_rate": 3.6869930069930066e-06, "loss": 0.4245, "step": 4980 }, { "epoch": 4.32, "learning_rate": 3.686293706293706e-06, "loss": 0.3797, "step": 4990 }, { "epoch": 4.33, "learning_rate": 3.6855944055944056e-06, "loss": 0.3833, "step": 5000 }, { "epoch": 4.34, "learning_rate": 3.6848951048951047e-06, "loss": 0.4412, "step": 5010 }, { "epoch": 4.35, "learning_rate": 3.6841958041958038e-06, "loss": 0.4183, "step": 5020 }, { "epoch": 4.36, "learning_rate": 3.6834965034965033e-06, "loss": 0.3991, "step": 5030 }, { "epoch": 4.37, "learning_rate": 3.6827972027972028e-06, "loss": 0.4045, "step": 5040 }, { "epoch": 4.38, "learning_rate": 3.682097902097902e-06, "loss": 0.419, "step": 5050 }, { "epoch": 4.38, "learning_rate": 3.6814685314685313e-06, "loss": 0.4751, "step": 5060 }, { "epoch": 4.39, "learning_rate": 3.6807692307692304e-06, "loss": 0.4423, "step": 5070 }, { "epoch": 4.4, "learning_rate": 3.68006993006993e-06, "loss": 0.4421, "step": 5080 }, { "epoch": 4.41, "learning_rate": 3.6793706293706294e-06, "loss": 0.4682, "step": 5090 }, { "epoch": 4.42, "learning_rate": 3.678671328671329e-06, "loss": 0.4166, "step": 5100 }, { "epoch": 4.43, "learning_rate": 3.6779720279720275e-06, "loss": 0.3662, "step": 5110 }, { "epoch": 4.44, "learning_rate": 3.677272727272727e-06, "loss": 0.4312, "step": 5120 }, { "epoch": 4.45, "learning_rate": 3.6765734265734265e-06, "loss": 0.4069, "step": 5130 }, { "epoch": 4.45, "learning_rate": 3.6758741258741256e-06, "loss": 0.3921, "step": 5140 }, { "epoch": 4.46, "learning_rate": 3.675174825174825e-06, "loss": 0.4333, "step": 5150 }, { "epoch": 4.47, "learning_rate": 3.674475524475524e-06, "loss": 0.4416, "step": 5160 }, { "epoch": 4.48, "learning_rate": 3.6737762237762237e-06, "loss": 0.4463, "step": 5170 }, { "epoch": 4.49, "learning_rate": 3.6730769230769227e-06, "loss": 0.439, "step": 5180 }, { "epoch": 4.5, "learning_rate": 3.6723776223776222e-06, "loss": 0.4153, "step": 5190 }, { "epoch": 4.51, "learning_rate": 3.6716783216783217e-06, "loss": 0.4236, "step": 5200 }, { "epoch": 4.51, "learning_rate": 3.670979020979021e-06, "loss": 0.4354, "step": 5210 }, { "epoch": 4.52, "learning_rate": 3.67027972027972e-06, "loss": 0.4321, "step": 5220 }, { "epoch": 4.53, "learning_rate": 3.6695804195804194e-06, "loss": 0.4584, "step": 5230 }, { "epoch": 4.54, "learning_rate": 3.668881118881119e-06, "loss": 0.4637, "step": 5240 }, { "epoch": 4.55, "learning_rate": 3.668181818181818e-06, "loss": 0.414, "step": 5250 }, { "epoch": 4.56, "learning_rate": 3.6674825174825174e-06, "loss": 0.4954, "step": 5260 }, { "epoch": 4.57, "learning_rate": 3.6667832167832165e-06, "loss": 0.3738, "step": 5270 }, { "epoch": 4.58, "learning_rate": 3.666083916083916e-06, "loss": 0.3884, "step": 5280 }, { "epoch": 4.58, "learning_rate": 3.665384615384615e-06, "loss": 0.3681, "step": 5290 }, { "epoch": 4.59, "learning_rate": 3.6646853146853146e-06, "loss": 0.4485, "step": 5300 }, { "epoch": 4.6, "learning_rate": 3.663986013986014e-06, "loss": 0.4244, "step": 5310 }, { "epoch": 4.61, "learning_rate": 3.6632867132867127e-06, "loss": 0.3891, "step": 5320 }, { "epoch": 4.62, "learning_rate": 3.6625874125874122e-06, "loss": 0.4124, "step": 5330 }, { "epoch": 4.63, "learning_rate": 3.6618881118881117e-06, "loss": 0.3761, "step": 5340 }, { "epoch": 4.64, "learning_rate": 3.6611888111888112e-06, "loss": 0.3659, "step": 5350 }, { "epoch": 4.64, "learning_rate": 3.6604895104895103e-06, "loss": 0.4604, "step": 5360 }, { "epoch": 4.65, "learning_rate": 3.65979020979021e-06, "loss": 0.4532, "step": 5370 }, { "epoch": 4.66, "learning_rate": 3.659090909090909e-06, "loss": 0.4347, "step": 5380 }, { "epoch": 4.67, "learning_rate": 3.6583916083916084e-06, "loss": 0.4212, "step": 5390 }, { "epoch": 4.68, "learning_rate": 3.6576923076923074e-06, "loss": 0.457, "step": 5400 }, { "epoch": 4.69, "learning_rate": 3.656993006993007e-06, "loss": 0.5144, "step": 5410 }, { "epoch": 4.7, "learning_rate": 3.6562937062937064e-06, "loss": 0.4147, "step": 5420 }, { "epoch": 4.71, "learning_rate": 3.655594405594405e-06, "loss": 0.4336, "step": 5430 }, { "epoch": 4.71, "learning_rate": 3.6548951048951046e-06, "loss": 0.4126, "step": 5440 }, { "epoch": 4.72, "learning_rate": 3.654195804195804e-06, "loss": 0.4083, "step": 5450 }, { "epoch": 4.73, "learning_rate": 3.6534965034965036e-06, "loss": 0.444, "step": 5460 }, { "epoch": 4.74, "learning_rate": 3.6527972027972026e-06, "loss": 0.4407, "step": 5470 }, { "epoch": 4.75, "learning_rate": 3.6520979020979017e-06, "loss": 0.4018, "step": 5480 }, { "epoch": 4.76, "learning_rate": 3.651398601398601e-06, "loss": 0.4195, "step": 5490 }, { "epoch": 4.77, "learning_rate": 3.6506993006993003e-06, "loss": 0.4083, "step": 5500 }, { "epoch": 4.77, "learning_rate": 3.6499999999999998e-06, "loss": 0.4352, "step": 5510 }, { "epoch": 4.78, "learning_rate": 3.6493006993006993e-06, "loss": 0.451, "step": 5520 }, { "epoch": 4.79, "learning_rate": 3.6486013986013988e-06, "loss": 0.3954, "step": 5530 }, { "epoch": 4.8, "learning_rate": 3.6479020979020974e-06, "loss": 0.4088, "step": 5540 }, { "epoch": 4.81, "learning_rate": 3.647202797202797e-06, "loss": 0.3787, "step": 5550 }, { "epoch": 4.82, "learning_rate": 3.6465034965034964e-06, "loss": 0.4491, "step": 5560 }, { "epoch": 4.83, "learning_rate": 3.645804195804196e-06, "loss": 0.476, "step": 5570 }, { "epoch": 4.83, "learning_rate": 3.645104895104895e-06, "loss": 0.4762, "step": 5580 }, { "epoch": 4.84, "learning_rate": 3.644405594405594e-06, "loss": 0.3717, "step": 5590 }, { "epoch": 4.85, "learning_rate": 3.6437062937062936e-06, "loss": 0.447, "step": 5600 }, { "epoch": 4.86, "learning_rate": 3.6430069930069926e-06, "loss": 0.427, "step": 5610 }, { "epoch": 4.87, "learning_rate": 3.642307692307692e-06, "loss": 0.4573, "step": 5620 }, { "epoch": 4.88, "learning_rate": 3.6416083916083916e-06, "loss": 0.4257, "step": 5630 }, { "epoch": 4.89, "learning_rate": 3.640909090909091e-06, "loss": 0.4192, "step": 5640 }, { "epoch": 4.9, "learning_rate": 3.6402097902097898e-06, "loss": 0.4273, "step": 5650 }, { "epoch": 4.9, "learning_rate": 3.6395104895104893e-06, "loss": 0.4011, "step": 5660 }, { "epoch": 4.91, "learning_rate": 3.6388111888111888e-06, "loss": 0.4335, "step": 5670 }, { "epoch": 4.92, "learning_rate": 3.638111888111888e-06, "loss": 0.4133, "step": 5680 }, { "epoch": 4.93, "learning_rate": 3.6374125874125873e-06, "loss": 0.4318, "step": 5690 }, { "epoch": 4.94, "learning_rate": 3.6367132867132864e-06, "loss": 0.4009, "step": 5700 }, { "epoch": 4.95, "learning_rate": 3.636013986013986e-06, "loss": 0.37, "step": 5710 }, { "epoch": 4.96, "learning_rate": 3.635314685314685e-06, "loss": 0.5268, "step": 5720 }, { "epoch": 4.96, "learning_rate": 3.6346153846153845e-06, "loss": 0.3504, "step": 5730 }, { "epoch": 4.97, "learning_rate": 3.633916083916084e-06, "loss": 0.4493, "step": 5740 }, { "epoch": 4.98, "learning_rate": 3.6332167832167835e-06, "loss": 0.4104, "step": 5750 }, { "epoch": 4.99, "learning_rate": 3.632517482517482e-06, "loss": 0.4701, "step": 5760 }, { "epoch": 5.0, "learning_rate": 3.6318181818181816e-06, "loss": 0.4179, "step": 5770 }, { "epoch": 5.0, "eval_loss": 0.5541394352912903, "eval_runtime": 132.2755, "eval_samples_per_second": 4.022, "eval_steps_per_second": 2.011, "eval_wer": 0.2696535321720126, "step": 5770 }, { "epoch": 5.01, "learning_rate": 3.631118881118881e-06, "loss": 0.4515, "step": 5780 }, { "epoch": 5.02, "learning_rate": 3.63041958041958e-06, "loss": 0.3908, "step": 5790 }, { "epoch": 5.03, "learning_rate": 3.6297202797202797e-06, "loss": 0.3718, "step": 5800 }, { "epoch": 5.03, "learning_rate": 3.6290209790209788e-06, "loss": 0.4033, "step": 5810 }, { "epoch": 5.04, "learning_rate": 3.6283216783216783e-06, "loss": 0.4639, "step": 5820 }, { "epoch": 5.05, "learning_rate": 3.6276223776223773e-06, "loss": 0.4132, "step": 5830 }, { "epoch": 5.06, "learning_rate": 3.626923076923077e-06, "loss": 0.3738, "step": 5840 }, { "epoch": 5.07, "learning_rate": 3.6262237762237763e-06, "loss": 0.3811, "step": 5850 }, { "epoch": 5.08, "learning_rate": 3.625524475524475e-06, "loss": 0.3906, "step": 5860 }, { "epoch": 5.09, "learning_rate": 3.6248251748251745e-06, "loss": 0.456, "step": 5870 }, { "epoch": 5.1, "learning_rate": 3.624125874125874e-06, "loss": 0.4335, "step": 5880 }, { "epoch": 5.1, "learning_rate": 3.6234265734265735e-06, "loss": 0.4065, "step": 5890 }, { "epoch": 5.11, "learning_rate": 3.6227272727272725e-06, "loss": 0.3946, "step": 5900 }, { "epoch": 5.12, "learning_rate": 3.622027972027972e-06, "loss": 0.4255, "step": 5910 }, { "epoch": 5.13, "learning_rate": 3.621328671328671e-06, "loss": 0.5383, "step": 5920 }, { "epoch": 5.14, "learning_rate": 3.6206293706293706e-06, "loss": 0.4545, "step": 5930 }, { "epoch": 5.15, "learning_rate": 3.6199300699300697e-06, "loss": 0.4416, "step": 5940 }, { "epoch": 5.16, "learning_rate": 3.619230769230769e-06, "loss": 0.3873, "step": 5950 }, { "epoch": 5.16, "learning_rate": 3.6185314685314687e-06, "loss": 0.4583, "step": 5960 }, { "epoch": 5.17, "learning_rate": 3.6178321678321673e-06, "loss": 0.4221, "step": 5970 }, { "epoch": 5.18, "learning_rate": 3.617132867132867e-06, "loss": 0.3759, "step": 5980 }, { "epoch": 5.19, "learning_rate": 3.6164335664335663e-06, "loss": 0.3778, "step": 5990 }, { "epoch": 5.2, "learning_rate": 3.615734265734266e-06, "loss": 0.3657, "step": 6000 }, { "epoch": 5.21, "learning_rate": 3.615034965034965e-06, "loss": 0.4768, "step": 6010 }, { "epoch": 5.22, "learning_rate": 3.614335664335664e-06, "loss": 0.4704, "step": 6020 }, { "epoch": 5.23, "learning_rate": 3.6136363636363635e-06, "loss": 0.4471, "step": 6030 }, { "epoch": 5.23, "learning_rate": 3.6129370629370625e-06, "loss": 0.4016, "step": 6040 }, { "epoch": 5.24, "learning_rate": 3.612237762237762e-06, "loss": 0.3933, "step": 6050 }, { "epoch": 5.25, "learning_rate": 3.6115384615384615e-06, "loss": 0.4244, "step": 6060 }, { "epoch": 5.26, "learning_rate": 3.610839160839161e-06, "loss": 0.4475, "step": 6070 }, { "epoch": 5.27, "learning_rate": 3.6101398601398597e-06, "loss": 0.4473, "step": 6080 }, { "epoch": 5.28, "learning_rate": 3.609440559440559e-06, "loss": 0.454, "step": 6090 }, { "epoch": 5.29, "learning_rate": 3.6087412587412587e-06, "loss": 0.4177, "step": 6100 }, { "epoch": 5.29, "learning_rate": 3.608041958041958e-06, "loss": 0.4084, "step": 6110 }, { "epoch": 5.3, "learning_rate": 3.6073426573426572e-06, "loss": 0.4163, "step": 6120 }, { "epoch": 5.31, "learning_rate": 3.6066433566433563e-06, "loss": 0.4717, "step": 6130 }, { "epoch": 5.32, "learning_rate": 3.605944055944056e-06, "loss": 0.3936, "step": 6140 }, { "epoch": 5.33, "learning_rate": 3.605244755244755e-06, "loss": 0.3789, "step": 6150 }, { "epoch": 5.34, "learning_rate": 3.6045454545454544e-06, "loss": 0.4144, "step": 6160 }, { "epoch": 5.35, "learning_rate": 3.603846153846154e-06, "loss": 0.3966, "step": 6170 }, { "epoch": 5.36, "learning_rate": 3.6031468531468534e-06, "loss": 0.4479, "step": 6180 }, { "epoch": 5.36, "learning_rate": 3.602447552447552e-06, "loss": 0.37, "step": 6190 }, { "epoch": 5.37, "learning_rate": 3.6017482517482515e-06, "loss": 0.366, "step": 6200 }, { "epoch": 5.38, "learning_rate": 3.601048951048951e-06, "loss": 0.443, "step": 6210 }, { "epoch": 5.39, "learning_rate": 3.60034965034965e-06, "loss": 0.3772, "step": 6220 }, { "epoch": 5.4, "learning_rate": 3.5996503496503496e-06, "loss": 0.4389, "step": 6230 }, { "epoch": 5.41, "learning_rate": 3.5989510489510487e-06, "loss": 0.4294, "step": 6240 }, { "epoch": 5.42, "learning_rate": 3.598251748251748e-06, "loss": 0.4025, "step": 6250 }, { "epoch": 5.42, "learning_rate": 3.5975524475524472e-06, "loss": 0.4683, "step": 6260 }, { "epoch": 5.43, "learning_rate": 3.5968531468531467e-06, "loss": 0.4215, "step": 6270 }, { "epoch": 5.44, "learning_rate": 3.5961538461538462e-06, "loss": 0.3982, "step": 6280 }, { "epoch": 5.45, "learning_rate": 3.595454545454545e-06, "loss": 0.3678, "step": 6290 }, { "epoch": 5.46, "learning_rate": 3.5947552447552444e-06, "loss": 0.3787, "step": 6300 }, { "epoch": 5.47, "learning_rate": 3.594055944055944e-06, "loss": 0.4167, "step": 6310 }, { "epoch": 5.48, "learning_rate": 3.5933566433566434e-06, "loss": 0.4013, "step": 6320 }, { "epoch": 5.49, "learning_rate": 3.5926573426573424e-06, "loss": 0.3849, "step": 6330 }, { "epoch": 5.49, "learning_rate": 3.591958041958042e-06, "loss": 0.4911, "step": 6340 }, { "epoch": 5.5, "learning_rate": 3.591258741258741e-06, "loss": 0.3917, "step": 6350 }, { "epoch": 5.51, "learning_rate": 3.5905594405594405e-06, "loss": 0.4331, "step": 6360 }, { "epoch": 5.52, "learning_rate": 3.5898601398601396e-06, "loss": 0.4441, "step": 6370 }, { "epoch": 5.53, "learning_rate": 3.589160839160839e-06, "loss": 0.404, "step": 6380 }, { "epoch": 5.54, "learning_rate": 3.5884615384615386e-06, "loss": 0.3654, "step": 6390 }, { "epoch": 5.55, "learning_rate": 3.5877622377622372e-06, "loss": 0.3759, "step": 6400 }, { "epoch": 5.55, "learning_rate": 3.5870629370629367e-06, "loss": 0.3972, "step": 6410 }, { "epoch": 5.56, "learning_rate": 3.5863636363636362e-06, "loss": 0.4738, "step": 6420 }, { "epoch": 5.57, "learning_rate": 3.5856643356643357e-06, "loss": 0.3825, "step": 6430 }, { "epoch": 5.58, "learning_rate": 3.5849650349650348e-06, "loss": 0.4313, "step": 6440 }, { "epoch": 5.59, "learning_rate": 3.5842657342657343e-06, "loss": 0.4117, "step": 6450 }, { "epoch": 5.6, "learning_rate": 3.5835664335664334e-06, "loss": 0.4463, "step": 6460 }, { "epoch": 5.61, "learning_rate": 3.5828671328671324e-06, "loss": 0.4928, "step": 6470 }, { "epoch": 5.61, "learning_rate": 3.582167832167832e-06, "loss": 0.3977, "step": 6480 }, { "epoch": 5.62, "learning_rate": 3.5814685314685314e-06, "loss": 0.43, "step": 6490 }, { "epoch": 5.63, "learning_rate": 3.580769230769231e-06, "loss": 0.3967, "step": 6500 }, { "epoch": 5.64, "learning_rate": 3.5800699300699296e-06, "loss": 0.4091, "step": 6510 }, { "epoch": 5.65, "learning_rate": 3.579370629370629e-06, "loss": 0.4269, "step": 6520 }, { "epoch": 5.66, "learning_rate": 3.5786713286713286e-06, "loss": 0.4157, "step": 6530 }, { "epoch": 5.67, "learning_rate": 3.577972027972028e-06, "loss": 0.4275, "step": 6540 }, { "epoch": 5.68, "learning_rate": 3.577272727272727e-06, "loss": 0.4638, "step": 6550 }, { "epoch": 5.68, "learning_rate": 3.5765734265734266e-06, "loss": 0.4441, "step": 6560 }, { "epoch": 5.69, "learning_rate": 3.5758741258741257e-06, "loss": 0.4582, "step": 6570 }, { "epoch": 5.7, "learning_rate": 3.5751748251748248e-06, "loss": 0.4679, "step": 6580 }, { "epoch": 5.71, "learning_rate": 3.5744755244755243e-06, "loss": 0.4212, "step": 6590 }, { "epoch": 5.72, "learning_rate": 3.5737762237762238e-06, "loss": 0.4247, "step": 6600 }, { "epoch": 5.73, "learning_rate": 3.5730769230769233e-06, "loss": 0.4173, "step": 6610 }, { "epoch": 5.74, "learning_rate": 3.572377622377622e-06, "loss": 0.4359, "step": 6620 }, { "epoch": 5.74, "learning_rate": 3.5716783216783214e-06, "loss": 0.4385, "step": 6630 }, { "epoch": 5.75, "learning_rate": 3.570979020979021e-06, "loss": 0.4632, "step": 6640 }, { "epoch": 5.76, "learning_rate": 3.57027972027972e-06, "loss": 0.4045, "step": 6650 }, { "epoch": 5.77, "learning_rate": 3.5695804195804195e-06, "loss": 0.4145, "step": 6660 }, { "epoch": 5.78, "learning_rate": 3.5688811188811186e-06, "loss": 0.393, "step": 6670 }, { "epoch": 5.79, "learning_rate": 3.568181818181818e-06, "loss": 0.4025, "step": 6680 }, { "epoch": 5.8, "learning_rate": 3.567482517482517e-06, "loss": 0.378, "step": 6690 }, { "epoch": 5.81, "learning_rate": 3.5667832167832166e-06, "loss": 0.4254, "step": 6700 }, { "epoch": 5.81, "learning_rate": 3.566083916083916e-06, "loss": 0.4688, "step": 6710 }, { "epoch": 5.82, "learning_rate": 3.5653846153846156e-06, "loss": 0.4761, "step": 6720 }, { "epoch": 5.83, "learning_rate": 3.5646853146853143e-06, "loss": 0.4667, "step": 6730 }, { "epoch": 5.84, "learning_rate": 3.5639860139860138e-06, "loss": 0.5203, "step": 6740 }, { "epoch": 5.85, "learning_rate": 3.5632867132867133e-06, "loss": 0.4006, "step": 6750 }, { "epoch": 5.86, "learning_rate": 3.5625874125874123e-06, "loss": 0.4119, "step": 6760 }, { "epoch": 5.87, "learning_rate": 3.561888111888112e-06, "loss": 0.4235, "step": 6770 }, { "epoch": 5.87, "learning_rate": 3.561188811188811e-06, "loss": 0.3927, "step": 6780 }, { "epoch": 5.88, "learning_rate": 3.5604895104895104e-06, "loss": 0.4529, "step": 6790 }, { "epoch": 5.89, "learning_rate": 3.5597902097902095e-06, "loss": 0.4006, "step": 6800 }, { "epoch": 5.9, "learning_rate": 3.559090909090909e-06, "loss": 0.4497, "step": 6810 }, { "epoch": 5.91, "learning_rate": 3.5583916083916085e-06, "loss": 0.4493, "step": 6820 }, { "epoch": 5.92, "learning_rate": 3.557692307692307e-06, "loss": 0.3804, "step": 6830 }, { "epoch": 5.93, "learning_rate": 3.5569930069930066e-06, "loss": 0.3847, "step": 6840 }, { "epoch": 5.94, "learning_rate": 3.556293706293706e-06, "loss": 0.4154, "step": 6850 }, { "epoch": 5.94, "learning_rate": 3.5555944055944056e-06, "loss": 0.3667, "step": 6860 }, { "epoch": 5.95, "learning_rate": 3.5548951048951047e-06, "loss": 0.4174, "step": 6870 }, { "epoch": 5.96, "learning_rate": 3.554195804195804e-06, "loss": 0.424, "step": 6880 }, { "epoch": 5.97, "learning_rate": 3.5534965034965033e-06, "loss": 0.4112, "step": 6890 }, { "epoch": 5.98, "learning_rate": 3.5528671328671327e-06, "loss": 0.4325, "step": 6900 }, { "epoch": 5.99, "learning_rate": 3.5521678321678322e-06, "loss": 0.4382, "step": 6910 }, { "epoch": 6.0, "learning_rate": 3.5514685314685313e-06, "loss": 0.4376, "step": 6920 }, { "epoch": 6.0, "eval_loss": 0.5798775553703308, "eval_runtime": 131.9415, "eval_samples_per_second": 4.032, "eval_steps_per_second": 2.016, "eval_wer": 0.26913929420839494, "step": 6924 }, { "epoch": 6.01, "learning_rate": 3.5507692307692304e-06, "loss": 0.4753, "step": 6930 }, { "epoch": 6.01, "learning_rate": 3.55006993006993e-06, "loss": 0.4354, "step": 6940 }, { "epoch": 6.02, "learning_rate": 3.5493706293706294e-06, "loss": 0.4241, "step": 6950 }, { "epoch": 6.03, "learning_rate": 3.5486713286713284e-06, "loss": 0.4086, "step": 6960 }, { "epoch": 6.04, "learning_rate": 3.547972027972028e-06, "loss": 0.4, "step": 6970 }, { "epoch": 6.05, "learning_rate": 3.547272727272727e-06, "loss": 0.4019, "step": 6980 }, { "epoch": 6.06, "learning_rate": 3.5465734265734265e-06, "loss": 0.457, "step": 6990 }, { "epoch": 6.07, "learning_rate": 3.5458741258741256e-06, "loss": 0.3821, "step": 7000 }, { "epoch": 6.07, "learning_rate": 3.545174825174825e-06, "loss": 0.4102, "step": 7010 }, { "epoch": 6.08, "learning_rate": 3.5444755244755246e-06, "loss": 0.4352, "step": 7020 }, { "epoch": 6.09, "learning_rate": 3.5437762237762236e-06, "loss": 0.3816, "step": 7030 }, { "epoch": 6.1, "learning_rate": 3.5430769230769227e-06, "loss": 0.4442, "step": 7040 }, { "epoch": 6.11, "learning_rate": 3.542377622377622e-06, "loss": 0.4007, "step": 7050 }, { "epoch": 6.12, "learning_rate": 3.5416783216783217e-06, "loss": 0.4247, "step": 7060 }, { "epoch": 6.13, "learning_rate": 3.5409790209790208e-06, "loss": 0.4067, "step": 7070 }, { "epoch": 6.14, "learning_rate": 3.5403496503496502e-06, "loss": 0.3995, "step": 7080 }, { "epoch": 6.14, "learning_rate": 3.5396503496503493e-06, "loss": 0.4824, "step": 7090 }, { "epoch": 6.15, "learning_rate": 3.538951048951049e-06, "loss": 0.3947, "step": 7100 }, { "epoch": 6.16, "learning_rate": 3.5382517482517483e-06, "loss": 0.3508, "step": 7110 }, { "epoch": 6.17, "learning_rate": 3.5375524475524474e-06, "loss": 0.4147, "step": 7120 }, { "epoch": 6.18, "learning_rate": 3.5368531468531465e-06, "loss": 0.3916, "step": 7130 }, { "epoch": 6.19, "learning_rate": 3.536153846153846e-06, "loss": 0.4855, "step": 7140 }, { "epoch": 6.2, "learning_rate": 3.5354545454545454e-06, "loss": 0.3445, "step": 7150 }, { "epoch": 6.2, "learning_rate": 3.5347552447552445e-06, "loss": 0.4443, "step": 7160 }, { "epoch": 6.21, "learning_rate": 3.534055944055944e-06, "loss": 0.4426, "step": 7170 }, { "epoch": 6.22, "learning_rate": 3.533356643356643e-06, "loss": 0.4079, "step": 7180 }, { "epoch": 6.23, "learning_rate": 3.532657342657342e-06, "loss": 0.3727, "step": 7190 }, { "epoch": 6.24, "learning_rate": 3.5319580419580417e-06, "loss": 0.362, "step": 7200 }, { "epoch": 6.25, "learning_rate": 3.531258741258741e-06, "loss": 0.424, "step": 7210 }, { "epoch": 6.26, "learning_rate": 3.5305594405594407e-06, "loss": 0.4108, "step": 7220 }, { "epoch": 6.27, "learning_rate": 3.5298601398601397e-06, "loss": 0.4526, "step": 7230 }, { "epoch": 6.27, "learning_rate": 3.529160839160839e-06, "loss": 0.417, "step": 7240 }, { "epoch": 6.28, "learning_rate": 3.5284615384615383e-06, "loss": 0.4048, "step": 7250 }, { "epoch": 6.29, "learning_rate": 3.527762237762238e-06, "loss": 0.421, "step": 7260 }, { "epoch": 6.3, "learning_rate": 3.527062937062937e-06, "loss": 0.4592, "step": 7270 }, { "epoch": 6.31, "learning_rate": 3.5263636363636364e-06, "loss": 0.4749, "step": 7280 }, { "epoch": 6.32, "learning_rate": 3.5256643356643354e-06, "loss": 0.426, "step": 7290 }, { "epoch": 6.33, "learning_rate": 3.5249650349650345e-06, "loss": 0.3914, "step": 7300 }, { "epoch": 6.33, "learning_rate": 3.524265734265734e-06, "loss": 0.4809, "step": 7310 }, { "epoch": 6.34, "learning_rate": 3.5235664335664335e-06, "loss": 0.4657, "step": 7320 }, { "epoch": 6.35, "learning_rate": 3.522867132867133e-06, "loss": 0.37, "step": 7330 }, { "epoch": 6.36, "learning_rate": 3.5221678321678317e-06, "loss": 0.4217, "step": 7340 }, { "epoch": 6.37, "learning_rate": 3.521468531468531e-06, "loss": 0.4398, "step": 7350 }, { "epoch": 6.38, "learning_rate": 3.5207692307692306e-06, "loss": 0.462, "step": 7360 }, { "epoch": 6.39, "learning_rate": 3.5200699300699297e-06, "loss": 0.3877, "step": 7370 }, { "epoch": 6.39, "learning_rate": 3.5193706293706292e-06, "loss": 0.4435, "step": 7380 }, { "epoch": 6.4, "learning_rate": 3.5186713286713287e-06, "loss": 0.411, "step": 7390 }, { "epoch": 6.41, "learning_rate": 3.517972027972028e-06, "loss": 0.4068, "step": 7400 }, { "epoch": 6.42, "learning_rate": 3.517272727272727e-06, "loss": 0.4755, "step": 7410 }, { "epoch": 6.43, "learning_rate": 3.5165734265734264e-06, "loss": 0.386, "step": 7420 }, { "epoch": 6.44, "learning_rate": 3.515874125874126e-06, "loss": 0.3746, "step": 7430 }, { "epoch": 6.45, "learning_rate": 3.5151748251748254e-06, "loss": 0.3711, "step": 7440 }, { "epoch": 6.46, "learning_rate": 3.514475524475524e-06, "loss": 0.4024, "step": 7450 }, { "epoch": 6.46, "learning_rate": 3.5137762237762235e-06, "loss": 0.4098, "step": 7460 }, { "epoch": 6.47, "learning_rate": 3.513076923076923e-06, "loss": 0.3528, "step": 7470 }, { "epoch": 6.48, "learning_rate": 3.512377622377622e-06, "loss": 0.5305, "step": 7480 }, { "epoch": 6.49, "learning_rate": 3.5116783216783216e-06, "loss": 0.4691, "step": 7490 }, { "epoch": 6.5, "learning_rate": 3.510979020979021e-06, "loss": 0.4021, "step": 7500 }, { "epoch": 6.51, "learning_rate": 3.51027972027972e-06, "loss": 0.4125, "step": 7510 }, { "epoch": 6.52, "learning_rate": 3.509580419580419e-06, "loss": 0.386, "step": 7520 }, { "epoch": 6.52, "learning_rate": 3.5088811188811187e-06, "loss": 0.4242, "step": 7530 }, { "epoch": 6.53, "learning_rate": 3.508181818181818e-06, "loss": 0.4123, "step": 7540 }, { "epoch": 6.54, "learning_rate": 3.5074825174825173e-06, "loss": 0.4487, "step": 7550 }, { "epoch": 6.55, "learning_rate": 3.5067832167832164e-06, "loss": 0.4478, "step": 7560 }, { "epoch": 6.56, "learning_rate": 3.506083916083916e-06, "loss": 0.4163, "step": 7570 }, { "epoch": 6.57, "learning_rate": 3.5053846153846153e-06, "loss": 0.4304, "step": 7580 }, { "epoch": 6.58, "learning_rate": 3.5046853146853144e-06, "loss": 0.4456, "step": 7590 }, { "epoch": 6.59, "learning_rate": 3.503986013986014e-06, "loss": 0.4465, "step": 7600 }, { "epoch": 6.59, "learning_rate": 3.5032867132867134e-06, "loss": 0.3964, "step": 7610 }, { "epoch": 6.6, "learning_rate": 3.5025874125874125e-06, "loss": 0.4074, "step": 7620 }, { "epoch": 6.61, "learning_rate": 3.5018881118881116e-06, "loss": 0.4124, "step": 7630 }, { "epoch": 6.62, "learning_rate": 3.501188811188811e-06, "loss": 0.4041, "step": 7640 }, { "epoch": 6.63, "learning_rate": 3.5004895104895106e-06, "loss": 0.402, "step": 7650 }, { "epoch": 6.64, "learning_rate": 3.4997902097902096e-06, "loss": 0.4579, "step": 7660 }, { "epoch": 6.65, "learning_rate": 3.4990909090909087e-06, "loss": 0.4575, "step": 7670 }, { "epoch": 6.65, "learning_rate": 3.498391608391608e-06, "loss": 0.3933, "step": 7680 }, { "epoch": 6.66, "learning_rate": 3.4976923076923077e-06, "loss": 0.3882, "step": 7690 }, { "epoch": 6.67, "learning_rate": 3.4969930069930068e-06, "loss": 0.3905, "step": 7700 }, { "epoch": 6.68, "learning_rate": 3.4962937062937063e-06, "loss": 0.4503, "step": 7710 }, { "epoch": 6.69, "learning_rate": 3.4955944055944053e-06, "loss": 0.411, "step": 7720 }, { "epoch": 6.7, "learning_rate": 3.4948951048951044e-06, "loss": 0.4377, "step": 7730 }, { "epoch": 6.71, "learning_rate": 3.494195804195804e-06, "loss": 0.4029, "step": 7740 }, { "epoch": 6.72, "learning_rate": 3.4934965034965034e-06, "loss": 0.4286, "step": 7750 }, { "epoch": 6.72, "learning_rate": 3.492797202797203e-06, "loss": 0.4271, "step": 7760 }, { "epoch": 6.73, "learning_rate": 3.492097902097902e-06, "loss": 0.411, "step": 7770 }, { "epoch": 6.74, "learning_rate": 3.491398601398601e-06, "loss": 0.4059, "step": 7780 }, { "epoch": 6.75, "learning_rate": 3.4906993006993005e-06, "loss": 0.3642, "step": 7790 }, { "epoch": 6.76, "learning_rate": 3.49e-06, "loss": 0.3648, "step": 7800 }, { "epoch": 6.77, "learning_rate": 3.489300699300699e-06, "loss": 0.4237, "step": 7810 }, { "epoch": 6.78, "learning_rate": 3.4886013986013986e-06, "loss": 0.4553, "step": 7820 }, { "epoch": 6.78, "learning_rate": 3.4879020979020977e-06, "loss": 0.4313, "step": 7830 }, { "epoch": 6.79, "learning_rate": 3.4872027972027968e-06, "loss": 0.3817, "step": 7840 }, { "epoch": 6.8, "learning_rate": 3.4865034965034963e-06, "loss": 0.4534, "step": 7850 }, { "epoch": 6.81, "learning_rate": 3.4858041958041958e-06, "loss": 0.4108, "step": 7860 }, { "epoch": 6.82, "learning_rate": 3.4851048951048953e-06, "loss": 0.4737, "step": 7870 }, { "epoch": 6.83, "learning_rate": 3.4844055944055943e-06, "loss": 0.4346, "step": 7880 }, { "epoch": 6.84, "learning_rate": 3.4837062937062934e-06, "loss": 0.4078, "step": 7890 }, { "epoch": 6.85, "learning_rate": 3.483006993006993e-06, "loss": 0.4898, "step": 7900 }, { "epoch": 6.85, "learning_rate": 3.482307692307692e-06, "loss": 0.4099, "step": 7910 }, { "epoch": 6.86, "learning_rate": 3.4816083916083915e-06, "loss": 0.4807, "step": 7920 }, { "epoch": 6.87, "learning_rate": 3.480909090909091e-06, "loss": 0.3721, "step": 7930 }, { "epoch": 6.88, "learning_rate": 3.48020979020979e-06, "loss": 0.4563, "step": 7940 }, { "epoch": 6.89, "learning_rate": 3.479510489510489e-06, "loss": 0.3941, "step": 7950 }, { "epoch": 6.9, "learning_rate": 3.4788111888111886e-06, "loss": 0.3597, "step": 7960 }, { "epoch": 6.91, "learning_rate": 3.478111888111888e-06, "loss": 0.4191, "step": 7970 }, { "epoch": 6.91, "learning_rate": 3.4774125874125876e-06, "loss": 0.4304, "step": 7980 }, { "epoch": 6.92, "learning_rate": 3.4767132867132862e-06, "loss": 0.371, "step": 7990 }, { "epoch": 6.93, "learning_rate": 3.4760139860139857e-06, "loss": 0.4132, "step": 8000 }, { "epoch": 6.94, "learning_rate": 3.4753146853146852e-06, "loss": 0.3688, "step": 8010 }, { "epoch": 6.95, "learning_rate": 3.4746153846153843e-06, "loss": 0.4284, "step": 8020 }, { "epoch": 6.96, "learning_rate": 3.473916083916084e-06, "loss": 0.4216, "step": 8030 }, { "epoch": 6.97, "learning_rate": 3.4732167832167833e-06, "loss": 0.4085, "step": 8040 }, { "epoch": 6.98, "learning_rate": 3.4725174825174824e-06, "loss": 0.3671, "step": 8050 }, { "epoch": 6.98, "learning_rate": 3.4718181818181815e-06, "loss": 0.4413, "step": 8060 }, { "epoch": 6.99, "learning_rate": 3.471118881118881e-06, "loss": 0.4341, "step": 8070 }, { "epoch": 7.0, "eval_loss": 0.5593249201774597, "eval_runtime": 132.6281, "eval_samples_per_second": 4.011, "eval_steps_per_second": 2.006, "eval_wer": 0.2648968310085492, "step": 8078 }, { "epoch": 7.0, "learning_rate": 3.4704195804195805e-06, "loss": 0.3919, "step": 8080 }, { "epoch": 7.01, "learning_rate": 3.4697202797202795e-06, "loss": 0.4472, "step": 8090 }, { "epoch": 7.02, "learning_rate": 3.4690209790209786e-06, "loss": 0.4076, "step": 8100 }, { "epoch": 7.03, "learning_rate": 3.468321678321678e-06, "loss": 0.4004, "step": 8110 }, { "epoch": 7.04, "learning_rate": 3.4676223776223776e-06, "loss": 0.4262, "step": 8120 }, { "epoch": 7.05, "learning_rate": 3.4669230769230767e-06, "loss": 0.3604, "step": 8130 }, { "epoch": 7.05, "learning_rate": 3.466223776223776e-06, "loss": 0.4613, "step": 8140 }, { "epoch": 7.06, "learning_rate": 3.4655244755244757e-06, "loss": 0.4261, "step": 8150 }, { "epoch": 7.07, "learning_rate": 3.4648251748251747e-06, "loss": 0.4473, "step": 8160 }, { "epoch": 7.08, "learning_rate": 3.464125874125874e-06, "loss": 0.3835, "step": 8170 }, { "epoch": 7.09, "learning_rate": 3.4634265734265733e-06, "loss": 0.4308, "step": 8180 }, { "epoch": 7.1, "learning_rate": 3.462727272727273e-06, "loss": 0.43, "step": 8190 }, { "epoch": 7.11, "learning_rate": 3.462027972027972e-06, "loss": 0.3746, "step": 8200 }, { "epoch": 7.11, "learning_rate": 3.461328671328671e-06, "loss": 0.3715, "step": 8210 }, { "epoch": 7.12, "learning_rate": 3.4606293706293704e-06, "loss": 0.4403, "step": 8220 }, { "epoch": 7.13, "learning_rate": 3.45993006993007e-06, "loss": 0.4333, "step": 8230 }, { "epoch": 7.14, "learning_rate": 3.459230769230769e-06, "loss": 0.3821, "step": 8240 }, { "epoch": 7.15, "learning_rate": 3.4585314685314685e-06, "loss": 0.399, "step": 8250 }, { "epoch": 7.16, "learning_rate": 3.457832167832168e-06, "loss": 0.3684, "step": 8260 }, { "epoch": 7.17, "learning_rate": 3.4571328671328667e-06, "loss": 0.4255, "step": 8270 }, { "epoch": 7.17, "learning_rate": 3.456433566433566e-06, "loss": 0.4221, "step": 8280 }, { "epoch": 7.18, "learning_rate": 3.4557342657342657e-06, "loss": 0.4537, "step": 8290 }, { "epoch": 7.19, "learning_rate": 3.455034965034965e-06, "loss": 0.4006, "step": 8300 }, { "epoch": 7.2, "learning_rate": 3.4543356643356642e-06, "loss": 0.4107, "step": 8310 }, { "epoch": 7.21, "learning_rate": 3.4536363636363633e-06, "loss": 0.466, "step": 8320 }, { "epoch": 7.22, "learning_rate": 3.452937062937063e-06, "loss": 0.4655, "step": 8330 }, { "epoch": 7.23, "learning_rate": 3.452237762237762e-06, "loss": 0.4353, "step": 8340 }, { "epoch": 7.24, "learning_rate": 3.4515384615384614e-06, "loss": 0.3783, "step": 8350 }, { "epoch": 7.24, "learning_rate": 3.450839160839161e-06, "loss": 0.3839, "step": 8360 }, { "epoch": 7.25, "learning_rate": 3.45013986013986e-06, "loss": 0.4209, "step": 8370 }, { "epoch": 7.26, "learning_rate": 3.449440559440559e-06, "loss": 0.3719, "step": 8380 }, { "epoch": 7.27, "learning_rate": 3.4487412587412585e-06, "loss": 0.4884, "step": 8390 }, { "epoch": 7.28, "learning_rate": 3.448041958041958e-06, "loss": 0.4634, "step": 8400 }, { "epoch": 7.29, "learning_rate": 3.4473426573426575e-06, "loss": 0.3454, "step": 8410 }, { "epoch": 7.3, "learning_rate": 3.4466433566433566e-06, "loss": 0.3983, "step": 8420 }, { "epoch": 7.3, "learning_rate": 3.4459440559440556e-06, "loss": 0.3874, "step": 8430 }, { "epoch": 7.31, "learning_rate": 3.445244755244755e-06, "loss": 0.396, "step": 8440 }, { "epoch": 7.32, "learning_rate": 3.4445454545454542e-06, "loss": 0.4124, "step": 8450 }, { "epoch": 7.33, "learning_rate": 3.4438461538461537e-06, "loss": 0.3665, "step": 8460 }, { "epoch": 7.34, "learning_rate": 3.443146853146853e-06, "loss": 0.3893, "step": 8470 }, { "epoch": 7.35, "learning_rate": 3.4424475524475523e-06, "loss": 0.5006, "step": 8480 }, { "epoch": 7.36, "learning_rate": 3.4417482517482514e-06, "loss": 0.3679, "step": 8490 }, { "epoch": 7.37, "learning_rate": 3.441048951048951e-06, "loss": 0.3859, "step": 8500 }, { "epoch": 7.37, "learning_rate": 3.4403496503496503e-06, "loss": 0.3818, "step": 8510 }, { "epoch": 7.38, "learning_rate": 3.4396503496503494e-06, "loss": 0.3795, "step": 8520 }, { "epoch": 7.39, "learning_rate": 3.4389510489510485e-06, "loss": 0.4211, "step": 8530 }, { "epoch": 7.4, "learning_rate": 3.438251748251748e-06, "loss": 0.4148, "step": 8540 }, { "epoch": 7.41, "learning_rate": 3.4375524475524475e-06, "loss": 0.412, "step": 8550 }, { "epoch": 7.42, "learning_rate": 3.4368531468531466e-06, "loss": 0.4597, "step": 8560 }, { "epoch": 7.43, "learning_rate": 3.436153846153846e-06, "loss": 0.3923, "step": 8570 }, { "epoch": 7.43, "learning_rate": 3.4354545454545456e-06, "loss": 0.4104, "step": 8580 }, { "epoch": 7.44, "learning_rate": 3.4347552447552446e-06, "loss": 0.4049, "step": 8590 }, { "epoch": 7.45, "learning_rate": 3.4340559440559437e-06, "loss": 0.436, "step": 8600 }, { "epoch": 7.46, "learning_rate": 3.433356643356643e-06, "loss": 0.3974, "step": 8610 }, { "epoch": 7.47, "learning_rate": 3.4326573426573427e-06, "loss": 0.4191, "step": 8620 }, { "epoch": 7.48, "learning_rate": 3.4319580419580418e-06, "loss": 0.5061, "step": 8630 }, { "epoch": 7.49, "learning_rate": 3.431258741258741e-06, "loss": 0.4298, "step": 8640 }, { "epoch": 7.5, "learning_rate": 3.4305594405594403e-06, "loss": 0.3958, "step": 8650 }, { "epoch": 7.5, "learning_rate": 3.42986013986014e-06, "loss": 0.4406, "step": 8660 }, { "epoch": 7.51, "learning_rate": 3.429160839160839e-06, "loss": 0.3959, "step": 8670 }, { "epoch": 7.52, "learning_rate": 3.4284615384615384e-06, "loss": 0.4711, "step": 8680 }, { "epoch": 7.53, "learning_rate": 3.427762237762238e-06, "loss": 0.4468, "step": 8690 }, { "epoch": 7.54, "learning_rate": 3.4270629370629366e-06, "loss": 0.3709, "step": 8700 }, { "epoch": 7.55, "learning_rate": 3.426363636363636e-06, "loss": 0.3925, "step": 8710 }, { "epoch": 7.56, "learning_rate": 3.4256643356643356e-06, "loss": 0.4129, "step": 8720 }, { "epoch": 7.56, "learning_rate": 3.424965034965035e-06, "loss": 0.3852, "step": 8730 }, { "epoch": 7.57, "learning_rate": 3.424265734265734e-06, "loss": 0.4379, "step": 8740 }, { "epoch": 7.58, "learning_rate": 3.423566433566433e-06, "loss": 0.4254, "step": 8750 }, { "epoch": 7.59, "learning_rate": 3.4228671328671327e-06, "loss": 0.413, "step": 8760 }, { "epoch": 7.6, "learning_rate": 3.422167832167832e-06, "loss": 0.4442, "step": 8770 }, { "epoch": 7.61, "learning_rate": 3.4214685314685313e-06, "loss": 0.4296, "step": 8780 }, { "epoch": 7.62, "learning_rate": 3.4207692307692308e-06, "loss": 0.3851, "step": 8790 }, { "epoch": 7.63, "learning_rate": 3.4200699300699303e-06, "loss": 0.4104, "step": 8800 }, { "epoch": 7.63, "learning_rate": 3.419370629370629e-06, "loss": 0.4401, "step": 8810 }, { "epoch": 7.64, "learning_rate": 3.4186713286713284e-06, "loss": 0.4269, "step": 8820 }, { "epoch": 7.65, "learning_rate": 3.417972027972028e-06, "loss": 0.4383, "step": 8830 }, { "epoch": 7.66, "learning_rate": 3.4172727272727274e-06, "loss": 0.3926, "step": 8840 }, { "epoch": 7.67, "learning_rate": 3.4165734265734265e-06, "loss": 0.4193, "step": 8850 }, { "epoch": 7.68, "learning_rate": 3.4158741258741255e-06, "loss": 0.3959, "step": 8860 }, { "epoch": 7.69, "learning_rate": 3.415174825174825e-06, "loss": 0.4067, "step": 8870 }, { "epoch": 7.69, "learning_rate": 3.414475524475524e-06, "loss": 0.3681, "step": 8880 }, { "epoch": 7.7, "learning_rate": 3.4137762237762236e-06, "loss": 0.4089, "step": 8890 }, { "epoch": 7.71, "learning_rate": 3.413076923076923e-06, "loss": 0.4024, "step": 8900 }, { "epoch": 7.72, "learning_rate": 3.412377622377622e-06, "loss": 0.3742, "step": 8910 }, { "epoch": 7.73, "learning_rate": 3.4116783216783213e-06, "loss": 0.3803, "step": 8920 }, { "epoch": 7.74, "learning_rate": 3.4109790209790208e-06, "loss": 0.4946, "step": 8930 }, { "epoch": 7.75, "learning_rate": 3.4102797202797202e-06, "loss": 0.372, "step": 8940 }, { "epoch": 7.76, "learning_rate": 3.4095804195804197e-06, "loss": 0.4491, "step": 8950 }, { "epoch": 7.76, "learning_rate": 3.408881118881119e-06, "loss": 0.4298, "step": 8960 }, { "epoch": 7.77, "learning_rate": 3.408181818181818e-06, "loss": 0.411, "step": 8970 }, { "epoch": 7.78, "learning_rate": 3.4074825174825174e-06, "loss": 0.4381, "step": 8980 }, { "epoch": 7.79, "learning_rate": 3.4067832167832165e-06, "loss": 0.3929, "step": 8990 }, { "epoch": 7.8, "learning_rate": 3.406083916083916e-06, "loss": 0.3752, "step": 9000 }, { "epoch": 7.81, "learning_rate": 3.4053846153846155e-06, "loss": 0.4362, "step": 9010 }, { "epoch": 7.82, "learning_rate": 3.4046853146853145e-06, "loss": 0.4371, "step": 9020 }, { "epoch": 7.82, "learning_rate": 3.4039860139860136e-06, "loss": 0.4526, "step": 9030 }, { "epoch": 7.83, "learning_rate": 3.403286713286713e-06, "loss": 0.4018, "step": 9040 }, { "epoch": 7.84, "learning_rate": 3.4025874125874126e-06, "loss": 0.3963, "step": 9050 }, { "epoch": 7.85, "learning_rate": 3.4018881118881117e-06, "loss": 0.3984, "step": 9060 }, { "epoch": 7.86, "learning_rate": 3.401188811188811e-06, "loss": 0.4395, "step": 9070 }, { "epoch": 7.87, "learning_rate": 3.4004895104895102e-06, "loss": 0.4229, "step": 9080 }, { "epoch": 7.88, "learning_rate": 3.3997902097902097e-06, "loss": 0.4344, "step": 9090 }, { "epoch": 7.89, "learning_rate": 3.399090909090909e-06, "loss": 0.3741, "step": 9100 }, { "epoch": 7.89, "learning_rate": 3.3983916083916083e-06, "loss": 0.3811, "step": 9110 }, { "epoch": 7.9, "learning_rate": 3.397692307692308e-06, "loss": 0.3972, "step": 9120 }, { "epoch": 7.91, "learning_rate": 3.396993006993007e-06, "loss": 0.4293, "step": 9130 }, { "epoch": 7.92, "learning_rate": 3.396293706293706e-06, "loss": 0.4136, "step": 9140 }, { "epoch": 7.93, "learning_rate": 3.3955944055944054e-06, "loss": 0.3997, "step": 9150 }, { "epoch": 7.94, "learning_rate": 3.394895104895105e-06, "loss": 0.4106, "step": 9160 }, { "epoch": 7.95, "learning_rate": 3.394195804195804e-06, "loss": 0.4311, "step": 9170 }, { "epoch": 7.95, "learning_rate": 3.393496503496503e-06, "loss": 0.411, "step": 9180 }, { "epoch": 7.96, "learning_rate": 3.3927972027972026e-06, "loss": 0.4382, "step": 9190 }, { "epoch": 7.97, "learning_rate": 3.392097902097902e-06, "loss": 0.3804, "step": 9200 }, { "epoch": 7.98, "learning_rate": 3.391398601398601e-06, "loss": 0.4592, "step": 9210 }, { "epoch": 7.99, "learning_rate": 3.3906993006993007e-06, "loss": 0.4102, "step": 9220 }, { "epoch": 8.0, "learning_rate": 3.39e-06, "loss": 0.4234, "step": 9230 }, { "epoch": 8.0, "eval_loss": 0.5488837957382202, "eval_runtime": 134.1414, "eval_samples_per_second": 3.966, "eval_steps_per_second": 1.983, "eval_wer": 0.2652182297358103, "step": 9232 }, { "epoch": 8.01, "learning_rate": 3.389300699300699e-06, "loss": 0.3802, "step": 9240 }, { "epoch": 8.02, "learning_rate": 3.3886013986013983e-06, "loss": 0.4252, "step": 9250 }, { "epoch": 8.02, "learning_rate": 3.387902097902098e-06, "loss": 0.3946, "step": 9260 }, { "epoch": 8.03, "learning_rate": 3.3872027972027973e-06, "loss": 0.397, "step": 9270 }, { "epoch": 8.04, "learning_rate": 3.3865034965034964e-06, "loss": 0.5124, "step": 9280 }, { "epoch": 8.05, "learning_rate": 3.3858041958041954e-06, "loss": 0.3946, "step": 9290 }, { "epoch": 8.06, "learning_rate": 3.385104895104895e-06, "loss": 0.4221, "step": 9300 }, { "epoch": 8.07, "learning_rate": 3.384405594405594e-06, "loss": 0.4058, "step": 9310 }, { "epoch": 8.08, "learning_rate": 3.3837062937062935e-06, "loss": 0.4154, "step": 9320 }, { "epoch": 8.08, "learning_rate": 3.383006993006993e-06, "loss": 0.4059, "step": 9330 }, { "epoch": 8.09, "learning_rate": 3.3823076923076925e-06, "loss": 0.4428, "step": 9340 }, { "epoch": 8.1, "learning_rate": 3.381608391608391e-06, "loss": 0.4559, "step": 9350 }, { "epoch": 8.11, "learning_rate": 3.3809090909090906e-06, "loss": 0.4143, "step": 9360 }, { "epoch": 8.12, "learning_rate": 3.38020979020979e-06, "loss": 0.3998, "step": 9370 }, { "epoch": 8.13, "learning_rate": 3.3795104895104896e-06, "loss": 0.4962, "step": 9380 }, { "epoch": 8.14, "learning_rate": 3.3788111888111887e-06, "loss": 0.4313, "step": 9390 }, { "epoch": 8.15, "learning_rate": 3.378111888111888e-06, "loss": 0.4054, "step": 9400 }, { "epoch": 8.15, "learning_rate": 3.3774125874125873e-06, "loss": 0.4037, "step": 9410 }, { "epoch": 8.16, "learning_rate": 3.3767132867132864e-06, "loss": 0.3747, "step": 9420 }, { "epoch": 8.17, "learning_rate": 3.376013986013986e-06, "loss": 0.3761, "step": 9430 }, { "epoch": 8.18, "learning_rate": 3.3753146853146854e-06, "loss": 0.4675, "step": 9440 }, { "epoch": 8.19, "learning_rate": 3.374615384615385e-06, "loss": 0.4281, "step": 9450 }, { "epoch": 8.2, "learning_rate": 3.3739160839160835e-06, "loss": 0.3503, "step": 9460 }, { "epoch": 8.21, "learning_rate": 3.373216783216783e-06, "loss": 0.4173, "step": 9470 }, { "epoch": 8.21, "learning_rate": 3.3725174825174825e-06, "loss": 0.4234, "step": 9480 }, { "epoch": 8.22, "learning_rate": 3.3718181818181816e-06, "loss": 0.39, "step": 9490 }, { "epoch": 8.23, "learning_rate": 3.371118881118881e-06, "loss": 0.424, "step": 9500 }, { "epoch": 8.24, "learning_rate": 3.37041958041958e-06, "loss": 0.4464, "step": 9510 }, { "epoch": 8.25, "learning_rate": 3.3697202797202796e-06, "loss": 0.4552, "step": 9520 }, { "epoch": 8.26, "learning_rate": 3.3690209790209787e-06, "loss": 0.4114, "step": 9530 }, { "epoch": 8.27, "learning_rate": 3.368321678321678e-06, "loss": 0.423, "step": 9540 }, { "epoch": 8.28, "learning_rate": 3.3676223776223777e-06, "loss": 0.4322, "step": 9550 }, { "epoch": 8.28, "learning_rate": 3.3669230769230768e-06, "loss": 0.3917, "step": 9560 }, { "epoch": 8.29, "learning_rate": 3.366223776223776e-06, "loss": 0.4033, "step": 9570 }, { "epoch": 8.3, "learning_rate": 3.3655244755244753e-06, "loss": 0.4534, "step": 9580 }, { "epoch": 8.31, "learning_rate": 3.364825174825175e-06, "loss": 0.4289, "step": 9590 }, { "epoch": 8.32, "learning_rate": 3.364125874125874e-06, "loss": 0.4591, "step": 9600 }, { "epoch": 8.33, "learning_rate": 3.3634265734265734e-06, "loss": 0.398, "step": 9610 }, { "epoch": 8.34, "learning_rate": 3.3627272727272725e-06, "loss": 0.425, "step": 9620 }, { "epoch": 8.34, "learning_rate": 3.362027972027972e-06, "loss": 0.4334, "step": 9630 }, { "epoch": 8.35, "learning_rate": 3.361328671328671e-06, "loss": 0.3715, "step": 9640 }, { "epoch": 8.36, "learning_rate": 3.3606293706293706e-06, "loss": 0.4115, "step": 9650 }, { "epoch": 8.37, "learning_rate": 3.35993006993007e-06, "loss": 0.3408, "step": 9660 }, { "epoch": 8.38, "learning_rate": 3.3592307692307687e-06, "loss": 0.4309, "step": 9670 }, { "epoch": 8.39, "learning_rate": 3.358531468531468e-06, "loss": 0.4107, "step": 9680 }, { "epoch": 8.4, "learning_rate": 3.3578321678321677e-06, "loss": 0.3915, "step": 9690 }, { "epoch": 8.41, "learning_rate": 3.357132867132867e-06, "loss": 0.4034, "step": 9700 }, { "epoch": 8.41, "learning_rate": 3.3564335664335663e-06, "loss": 0.3847, "step": 9710 }, { "epoch": 8.42, "learning_rate": 3.3557342657342653e-06, "loss": 0.423, "step": 9720 }, { "epoch": 8.43, "learning_rate": 3.355034965034965e-06, "loss": 0.4304, "step": 9730 }, { "epoch": 8.44, "learning_rate": 3.3543356643356643e-06, "loss": 0.4048, "step": 9740 }, { "epoch": 8.45, "learning_rate": 3.3536363636363634e-06, "loss": 0.3768, "step": 9750 }, { "epoch": 8.46, "learning_rate": 3.352937062937063e-06, "loss": 0.3473, "step": 9760 }, { "epoch": 8.47, "learning_rate": 3.3522377622377624e-06, "loss": 0.4231, "step": 9770 }, { "epoch": 8.47, "learning_rate": 3.351538461538461e-06, "loss": 0.3808, "step": 9780 }, { "epoch": 8.48, "learning_rate": 3.3508391608391605e-06, "loss": 0.3728, "step": 9790 }, { "epoch": 8.49, "learning_rate": 3.35013986013986e-06, "loss": 0.4372, "step": 9800 }, { "epoch": 8.5, "learning_rate": 3.3494405594405595e-06, "loss": 0.4418, "step": 9810 }, { "epoch": 8.51, "learning_rate": 3.3487412587412586e-06, "loss": 0.4072, "step": 9820 }, { "epoch": 8.52, "learning_rate": 3.3480419580419577e-06, "loss": 0.441, "step": 9830 }, { "epoch": 8.53, "learning_rate": 3.347342657342657e-06, "loss": 0.3316, "step": 9840 }, { "epoch": 8.54, "learning_rate": 3.3466433566433563e-06, "loss": 0.381, "step": 9850 }, { "epoch": 8.54, "learning_rate": 3.3459440559440558e-06, "loss": 0.401, "step": 9860 }, { "epoch": 8.55, "learning_rate": 3.3452447552447553e-06, "loss": 0.4355, "step": 9870 }, { "epoch": 8.56, "learning_rate": 3.3445454545454547e-06, "loss": 0.511, "step": 9880 }, { "epoch": 8.57, "learning_rate": 3.3438461538461534e-06, "loss": 0.413, "step": 9890 }, { "epoch": 8.58, "learning_rate": 3.343146853146853e-06, "loss": 0.422, "step": 9900 }, { "epoch": 8.59, "learning_rate": 3.3424475524475524e-06, "loss": 0.4066, "step": 9910 }, { "epoch": 8.6, "learning_rate": 3.341748251748252e-06, "loss": 0.3828, "step": 9920 }, { "epoch": 8.6, "learning_rate": 3.341048951048951e-06, "loss": 0.4135, "step": 9930 }, { "epoch": 8.61, "learning_rate": 3.34034965034965e-06, "loss": 0.4386, "step": 9940 }, { "epoch": 8.62, "learning_rate": 3.3396503496503495e-06, "loss": 0.3895, "step": 9950 }, { "epoch": 8.63, "learning_rate": 3.3389510489510486e-06, "loss": 0.3449, "step": 9960 }, { "epoch": 8.64, "learning_rate": 3.338251748251748e-06, "loss": 0.3914, "step": 9970 }, { "epoch": 8.65, "learning_rate": 3.3375524475524476e-06, "loss": 0.4172, "step": 9980 }, { "epoch": 8.66, "learning_rate": 3.336853146853147e-06, "loss": 0.3624, "step": 9990 }, { "epoch": 8.67, "learning_rate": 3.3361538461538457e-06, "loss": 0.3909, "step": 10000 }, { "epoch": 8.67, "learning_rate": 3.3354545454545452e-06, "loss": 0.4117, "step": 10010 }, { "epoch": 8.68, "learning_rate": 3.3347552447552447e-06, "loss": 0.3968, "step": 10020 }, { "epoch": 8.69, "learning_rate": 3.334055944055944e-06, "loss": 0.4085, "step": 10030 }, { "epoch": 8.7, "learning_rate": 3.3333566433566433e-06, "loss": 0.4649, "step": 10040 }, { "epoch": 8.71, "learning_rate": 3.3326573426573424e-06, "loss": 0.4003, "step": 10050 }, { "epoch": 8.72, "learning_rate": 3.331958041958042e-06, "loss": 0.3796, "step": 10060 }, { "epoch": 8.73, "learning_rate": 3.331258741258741e-06, "loss": 0.4687, "step": 10070 }, { "epoch": 8.73, "learning_rate": 3.3305594405594405e-06, "loss": 0.4325, "step": 10080 }, { "epoch": 8.74, "learning_rate": 3.32986013986014e-06, "loss": 0.4062, "step": 10090 }, { "epoch": 8.75, "learning_rate": 3.329160839160839e-06, "loss": 0.3887, "step": 10100 }, { "epoch": 8.76, "learning_rate": 3.328461538461538e-06, "loss": 0.3791, "step": 10110 }, { "epoch": 8.77, "learning_rate": 3.3277622377622376e-06, "loss": 0.4117, "step": 10120 }, { "epoch": 8.78, "learning_rate": 3.327062937062937e-06, "loss": 0.4206, "step": 10130 }, { "epoch": 8.79, "learning_rate": 3.326363636363636e-06, "loss": 0.4569, "step": 10140 }, { "epoch": 8.8, "learning_rate": 3.3256643356643357e-06, "loss": 0.3759, "step": 10150 }, { "epoch": 8.8, "learning_rate": 3.3249650349650347e-06, "loss": 0.414, "step": 10160 }, { "epoch": 8.81, "learning_rate": 3.3242657342657342e-06, "loss": 0.3948, "step": 10170 }, { "epoch": 8.82, "learning_rate": 3.3235664335664333e-06, "loss": 0.426, "step": 10180 }, { "epoch": 8.83, "learning_rate": 3.322867132867133e-06, "loss": 0.4246, "step": 10190 }, { "epoch": 8.84, "learning_rate": 3.3221678321678323e-06, "loss": 0.4605, "step": 10200 }, { "epoch": 8.85, "learning_rate": 3.321468531468531e-06, "loss": 0.4355, "step": 10210 }, { "epoch": 8.86, "learning_rate": 3.3207692307692304e-06, "loss": 0.4407, "step": 10220 }, { "epoch": 8.86, "learning_rate": 3.32006993006993e-06, "loss": 0.4483, "step": 10230 }, { "epoch": 8.87, "learning_rate": 3.3193706293706294e-06, "loss": 0.3864, "step": 10240 }, { "epoch": 8.88, "learning_rate": 3.3186713286713285e-06, "loss": 0.4614, "step": 10250 }, { "epoch": 8.89, "learning_rate": 3.317972027972028e-06, "loss": 0.3972, "step": 10260 }, { "epoch": 8.9, "learning_rate": 3.317272727272727e-06, "loss": 0.4305, "step": 10270 }, { "epoch": 8.91, "learning_rate": 3.316573426573426e-06, "loss": 0.3863, "step": 10280 }, { "epoch": 8.92, "learning_rate": 3.3158741258741257e-06, "loss": 0.4265, "step": 10290 }, { "epoch": 8.93, "learning_rate": 3.315174825174825e-06, "loss": 0.3841, "step": 10300 }, { "epoch": 8.93, "learning_rate": 3.3144755244755246e-06, "loss": 0.3922, "step": 10310 }, { "epoch": 8.94, "learning_rate": 3.3137762237762233e-06, "loss": 0.3994, "step": 10320 }, { "epoch": 8.95, "learning_rate": 3.313076923076923e-06, "loss": 0.4247, "step": 10330 }, { "epoch": 8.96, "learning_rate": 3.3123776223776223e-06, "loss": 0.4377, "step": 10340 }, { "epoch": 8.97, "learning_rate": 3.3116783216783218e-06, "loss": 0.3737, "step": 10350 }, { "epoch": 8.98, "learning_rate": 3.310979020979021e-06, "loss": 0.3754, "step": 10360 }, { "epoch": 8.99, "learning_rate": 3.31027972027972e-06, "loss": 0.4627, "step": 10370 }, { "epoch": 8.99, "learning_rate": 3.3095804195804194e-06, "loss": 0.3965, "step": 10380 }, { "epoch": 9.0, "eval_loss": 0.560581386089325, "eval_runtime": 133.9098, "eval_samples_per_second": 3.973, "eval_steps_per_second": 1.986, "eval_wer": 0.26014012984508583, "step": 10386 }, { "epoch": 9.0, "learning_rate": 3.3088811188811185e-06, "loss": 0.4449, "step": 10390 }, { "epoch": 9.01, "learning_rate": 3.308181818181818e-06, "loss": 0.4246, "step": 10400 }, { "epoch": 9.02, "learning_rate": 3.3074825174825175e-06, "loss": 0.4037, "step": 10410 }, { "epoch": 9.03, "learning_rate": 3.306783216783217e-06, "loss": 0.3731, "step": 10420 }, { "epoch": 9.04, "learning_rate": 3.3060839160839156e-06, "loss": 0.4149, "step": 10430 }, { "epoch": 9.05, "learning_rate": 3.305384615384615e-06, "loss": 0.4062, "step": 10440 }, { "epoch": 9.06, "learning_rate": 3.3046853146853146e-06, "loss": 0.4265, "step": 10450 }, { "epoch": 9.06, "learning_rate": 3.3039860139860137e-06, "loss": 0.3848, "step": 10460 }, { "epoch": 9.07, "learning_rate": 3.303286713286713e-06, "loss": 0.3891, "step": 10470 }, { "epoch": 9.08, "learning_rate": 3.3025874125874123e-06, "loss": 0.4249, "step": 10480 }, { "epoch": 9.09, "learning_rate": 3.3018881118881118e-06, "loss": 0.404, "step": 10490 }, { "epoch": 9.1, "learning_rate": 3.301188811188811e-06, "loss": 0.4211, "step": 10500 }, { "epoch": 9.11, "learning_rate": 3.3004895104895104e-06, "loss": 0.3693, "step": 10510 }, { "epoch": 9.12, "learning_rate": 3.29979020979021e-06, "loss": 0.4231, "step": 10520 }, { "epoch": 9.12, "learning_rate": 3.2990909090909093e-06, "loss": 0.379, "step": 10530 }, { "epoch": 9.13, "learning_rate": 3.298391608391608e-06, "loss": 0.3743, "step": 10540 }, { "epoch": 9.14, "learning_rate": 3.2976923076923075e-06, "loss": 0.3608, "step": 10550 }, { "epoch": 9.15, "learning_rate": 3.296993006993007e-06, "loss": 0.3752, "step": 10560 }, { "epoch": 9.16, "learning_rate": 3.296293706293706e-06, "loss": 0.4375, "step": 10570 }, { "epoch": 9.17, "learning_rate": 3.2955944055944056e-06, "loss": 0.4091, "step": 10580 }, { "epoch": 9.18, "learning_rate": 3.2948951048951046e-06, "loss": 0.4659, "step": 10590 }, { "epoch": 9.19, "learning_rate": 3.294195804195804e-06, "loss": 0.4305, "step": 10600 }, { "epoch": 9.19, "learning_rate": 3.293496503496503e-06, "loss": 0.3882, "step": 10610 }, { "epoch": 9.2, "learning_rate": 3.2927972027972027e-06, "loss": 0.3877, "step": 10620 }, { "epoch": 9.21, "learning_rate": 3.292097902097902e-06, "loss": 0.4133, "step": 10630 }, { "epoch": 9.22, "learning_rate": 3.291398601398601e-06, "loss": 0.4197, "step": 10640 }, { "epoch": 9.23, "learning_rate": 3.2906993006993003e-06, "loss": 0.3962, "step": 10650 }, { "epoch": 9.24, "learning_rate": 3.29e-06, "loss": 0.4339, "step": 10660 }, { "epoch": 9.25, "learning_rate": 3.2893006993006993e-06, "loss": 0.405, "step": 10670 }, { "epoch": 9.25, "learning_rate": 3.2886013986013984e-06, "loss": 0.411, "step": 10680 }, { "epoch": 9.26, "learning_rate": 3.287902097902098e-06, "loss": 0.4084, "step": 10690 }, { "epoch": 9.27, "learning_rate": 3.287202797202797e-06, "loss": 0.4886, "step": 10700 }, { "epoch": 9.28, "learning_rate": 3.2865034965034965e-06, "loss": 0.4184, "step": 10710 }, { "epoch": 9.29, "learning_rate": 3.2858041958041956e-06, "loss": 0.407, "step": 10720 }, { "epoch": 9.3, "learning_rate": 3.285104895104895e-06, "loss": 0.4283, "step": 10730 }, { "epoch": 9.31, "learning_rate": 3.2844055944055945e-06, "loss": 0.3711, "step": 10740 }, { "epoch": 9.32, "learning_rate": 3.283706293706293e-06, "loss": 0.4128, "step": 10750 }, { "epoch": 9.32, "learning_rate": 3.2830069930069927e-06, "loss": 0.3888, "step": 10760 }, { "epoch": 9.33, "learning_rate": 3.282307692307692e-06, "loss": 0.4046, "step": 10770 }, { "epoch": 9.34, "learning_rate": 3.2816083916083917e-06, "loss": 0.4792, "step": 10780 }, { "epoch": 9.35, "learning_rate": 3.2809090909090908e-06, "loss": 0.3611, "step": 10790 }, { "epoch": 9.36, "learning_rate": 3.2802097902097903e-06, "loss": 0.4009, "step": 10800 }, { "epoch": 9.37, "learning_rate": 3.2795104895104893e-06, "loss": 0.3805, "step": 10810 }, { "epoch": 9.38, "learning_rate": 3.2788111888111884e-06, "loss": 0.3642, "step": 10820 }, { "epoch": 9.38, "learning_rate": 3.278111888111888e-06, "loss": 0.3998, "step": 10830 }, { "epoch": 9.39, "learning_rate": 3.2774125874125874e-06, "loss": 0.4431, "step": 10840 }, { "epoch": 9.4, "learning_rate": 3.276713286713287e-06, "loss": 0.4207, "step": 10850 }, { "epoch": 9.41, "learning_rate": 3.2760139860139855e-06, "loss": 0.392, "step": 10860 }, { "epoch": 9.42, "learning_rate": 3.275314685314685e-06, "loss": 0.3769, "step": 10870 }, { "epoch": 9.43, "learning_rate": 3.2746153846153845e-06, "loss": 0.4146, "step": 10880 }, { "epoch": 9.44, "learning_rate": 3.273916083916084e-06, "loss": 0.4471, "step": 10890 }, { "epoch": 9.45, "learning_rate": 3.273216783216783e-06, "loss": 0.4716, "step": 10900 }, { "epoch": 9.45, "learning_rate": 3.272517482517482e-06, "loss": 0.3586, "step": 10910 }, { "epoch": 9.46, "learning_rate": 3.2718181818181817e-06, "loss": 0.4394, "step": 10920 }, { "epoch": 9.47, "learning_rate": 3.2711188811188808e-06, "loss": 0.4323, "step": 10930 }, { "epoch": 9.48, "learning_rate": 3.2704195804195802e-06, "loss": 0.4524, "step": 10940 }, { "epoch": 9.49, "learning_rate": 3.2697202797202797e-06, "loss": 0.512, "step": 10950 }, { "epoch": 9.5, "learning_rate": 3.2690209790209792e-06, "loss": 0.3513, "step": 10960 }, { "epoch": 9.51, "learning_rate": 3.268321678321678e-06, "loss": 0.4046, "step": 10970 }, { "epoch": 9.51, "learning_rate": 3.2676223776223774e-06, "loss": 0.3967, "step": 10980 }, { "epoch": 9.52, "learning_rate": 3.266923076923077e-06, "loss": 0.4133, "step": 10990 }, { "epoch": 9.53, "learning_rate": 3.266223776223776e-06, "loss": 0.4759, "step": 11000 }, { "epoch": 9.54, "learning_rate": 3.2655244755244755e-06, "loss": 0.3668, "step": 11010 }, { "epoch": 9.55, "learning_rate": 3.2648251748251745e-06, "loss": 0.4029, "step": 11020 }, { "epoch": 9.56, "learning_rate": 3.264125874125874e-06, "loss": 0.4852, "step": 11030 }, { "epoch": 9.57, "learning_rate": 3.263426573426573e-06, "loss": 0.4197, "step": 11040 }, { "epoch": 9.58, "learning_rate": 3.2627272727272726e-06, "loss": 0.4511, "step": 11050 }, { "epoch": 9.58, "learning_rate": 3.262027972027972e-06, "loss": 0.4441, "step": 11060 }, { "epoch": 9.59, "learning_rate": 3.2613286713286716e-06, "loss": 0.4381, "step": 11070 }, { "epoch": 9.6, "learning_rate": 3.2606293706293702e-06, "loss": 0.3922, "step": 11080 }, { "epoch": 9.61, "learning_rate": 3.2599300699300697e-06, "loss": 0.4215, "step": 11090 }, { "epoch": 9.62, "learning_rate": 3.2592307692307692e-06, "loss": 0.3579, "step": 11100 }, { "epoch": 9.63, "learning_rate": 3.2585314685314683e-06, "loss": 0.4254, "step": 11110 }, { "epoch": 9.64, "learning_rate": 3.257832167832168e-06, "loss": 0.3891, "step": 11120 }, { "epoch": 9.64, "learning_rate": 3.257132867132867e-06, "loss": 0.404, "step": 11130 }, { "epoch": 9.65, "learning_rate": 3.2564335664335664e-06, "loss": 0.4374, "step": 11140 }, { "epoch": 9.66, "learning_rate": 3.2557342657342654e-06, "loss": 0.3818, "step": 11150 }, { "epoch": 9.67, "learning_rate": 3.255034965034965e-06, "loss": 0.3742, "step": 11160 }, { "epoch": 9.68, "learning_rate": 3.2543356643356644e-06, "loss": 0.43, "step": 11170 }, { "epoch": 9.69, "learning_rate": 3.253636363636363e-06, "loss": 0.4267, "step": 11180 }, { "epoch": 9.7, "learning_rate": 3.2529370629370626e-06, "loss": 0.4361, "step": 11190 }, { "epoch": 9.71, "learning_rate": 3.252237762237762e-06, "loss": 0.4058, "step": 11200 }, { "epoch": 9.71, "learning_rate": 3.2515384615384616e-06, "loss": 0.3672, "step": 11210 }, { "epoch": 9.72, "learning_rate": 3.2508391608391607e-06, "loss": 0.3858, "step": 11220 }, { "epoch": 9.73, "learning_rate": 3.25013986013986e-06, "loss": 0.3885, "step": 11230 }, { "epoch": 9.74, "learning_rate": 3.2494405594405592e-06, "loss": 0.3776, "step": 11240 }, { "epoch": 9.75, "learning_rate": 3.2487412587412583e-06, "loss": 0.4401, "step": 11250 }, { "epoch": 9.76, "learning_rate": 3.248041958041958e-06, "loss": 0.4318, "step": 11260 }, { "epoch": 9.77, "learning_rate": 3.2473426573426573e-06, "loss": 0.4234, "step": 11270 }, { "epoch": 9.77, "learning_rate": 3.246643356643357e-06, "loss": 0.436, "step": 11280 }, { "epoch": 9.78, "learning_rate": 3.2459440559440554e-06, "loss": 0.4338, "step": 11290 }, { "epoch": 9.79, "learning_rate": 3.245244755244755e-06, "loss": 0.4059, "step": 11300 }, { "epoch": 9.8, "learning_rate": 3.2445454545454544e-06, "loss": 0.4006, "step": 11310 }, { "epoch": 9.81, "learning_rate": 3.243916083916084e-06, "loss": 0.417, "step": 11320 }, { "epoch": 9.82, "learning_rate": 3.243216783216783e-06, "loss": 0.4349, "step": 11330 }, { "epoch": 9.83, "learning_rate": 3.2425174825174825e-06, "loss": 0.4421, "step": 11340 }, { "epoch": 9.83, "learning_rate": 3.2418181818181815e-06, "loss": 0.4203, "step": 11350 }, { "epoch": 9.84, "learning_rate": 3.241118881118881e-06, "loss": 0.3779, "step": 11360 }, { "epoch": 9.85, "learning_rate": 3.2404195804195805e-06, "loss": 0.4028, "step": 11370 }, { "epoch": 9.86, "learning_rate": 3.239720279720279e-06, "loss": 0.3965, "step": 11380 }, { "epoch": 9.87, "learning_rate": 3.2390209790209787e-06, "loss": 0.3674, "step": 11390 }, { "epoch": 9.88, "learning_rate": 3.238321678321678e-06, "loss": 0.3918, "step": 11400 }, { "epoch": 9.89, "learning_rate": 3.2376223776223777e-06, "loss": 0.4187, "step": 11410 }, { "epoch": 9.9, "learning_rate": 3.2369230769230768e-06, "loss": 0.3845, "step": 11420 }, { "epoch": 9.9, "learning_rate": 3.2362237762237762e-06, "loss": 0.4286, "step": 11430 }, { "epoch": 9.91, "learning_rate": 3.2355244755244753e-06, "loss": 0.448, "step": 11440 }, { "epoch": 9.92, "learning_rate": 3.2348251748251744e-06, "loss": 0.4251, "step": 11450 }, { "epoch": 9.93, "learning_rate": 3.234125874125874e-06, "loss": 0.4281, "step": 11460 }, { "epoch": 9.94, "learning_rate": 3.2334265734265734e-06, "loss": 0.4495, "step": 11470 }, { "epoch": 9.95, "learning_rate": 3.232727272727273e-06, "loss": 0.3919, "step": 11480 }, { "epoch": 9.96, "learning_rate": 3.2320279720279715e-06, "loss": 0.4116, "step": 11490 }, { "epoch": 9.96, "learning_rate": 3.231328671328671e-06, "loss": 0.3788, "step": 11500 }, { "epoch": 9.97, "learning_rate": 3.2306293706293705e-06, "loss": 0.3904, "step": 11510 }, { "epoch": 9.98, "learning_rate": 3.22993006993007e-06, "loss": 0.412, "step": 11520 }, { "epoch": 9.99, "learning_rate": 3.229230769230769e-06, "loss": 0.3909, "step": 11530 }, { "epoch": 10.0, "learning_rate": 3.2285314685314686e-06, "loss": 0.4383, "step": 11540 }, { "epoch": 10.0, "eval_loss": 0.5629733204841614, "eval_runtime": 133.284, "eval_samples_per_second": 3.991, "eval_steps_per_second": 1.996, "eval_wer": 0.2606543678087035, "step": 11540 }, { "epoch": 10.01, "learning_rate": 3.2278321678321677e-06, "loss": 0.422, "step": 11550 }, { "epoch": 10.02, "learning_rate": 3.2271328671328667e-06, "loss": 0.4198, "step": 11560 }, { "epoch": 10.03, "learning_rate": 3.2264335664335662e-06, "loss": 0.3768, "step": 11570 }, { "epoch": 10.03, "learning_rate": 3.2257342657342657e-06, "loss": 0.4059, "step": 11580 }, { "epoch": 10.04, "learning_rate": 3.2250349650349652e-06, "loss": 0.4248, "step": 11590 }, { "epoch": 10.05, "learning_rate": 3.224335664335664e-06, "loss": 0.3902, "step": 11600 }, { "epoch": 10.06, "learning_rate": 3.2236363636363634e-06, "loss": 0.383, "step": 11610 }, { "epoch": 10.07, "learning_rate": 3.222937062937063e-06, "loss": 0.3833, "step": 11620 }, { "epoch": 10.08, "learning_rate": 3.222237762237762e-06, "loss": 0.4813, "step": 11630 }, { "epoch": 10.09, "learning_rate": 3.2215384615384614e-06, "loss": 0.3924, "step": 11640 }, { "epoch": 10.1, "learning_rate": 3.220839160839161e-06, "loss": 0.3906, "step": 11650 }, { "epoch": 10.1, "learning_rate": 3.22013986013986e-06, "loss": 0.3665, "step": 11660 }, { "epoch": 10.11, "learning_rate": 3.219440559440559e-06, "loss": 0.3477, "step": 11670 }, { "epoch": 10.12, "learning_rate": 3.2187412587412586e-06, "loss": 0.4091, "step": 11680 }, { "epoch": 10.13, "learning_rate": 3.218041958041958e-06, "loss": 0.3921, "step": 11690 }, { "epoch": 10.14, "learning_rate": 3.2173426573426576e-06, "loss": 0.3875, "step": 11700 }, { "epoch": 10.15, "learning_rate": 3.2166433566433562e-06, "loss": 0.4104, "step": 11710 }, { "epoch": 10.16, "learning_rate": 3.2159440559440557e-06, "loss": 0.3885, "step": 11720 }, { "epoch": 10.16, "learning_rate": 3.2152447552447552e-06, "loss": 0.3613, "step": 11730 }, { "epoch": 10.17, "learning_rate": 3.2145454545454543e-06, "loss": 0.471, "step": 11740 }, { "epoch": 10.18, "learning_rate": 3.213846153846154e-06, "loss": 0.4413, "step": 11750 }, { "epoch": 10.19, "learning_rate": 3.213146853146853e-06, "loss": 0.3643, "step": 11760 }, { "epoch": 10.2, "learning_rate": 3.2124475524475524e-06, "loss": 0.3322, "step": 11770 }, { "epoch": 10.21, "learning_rate": 3.2117482517482514e-06, "loss": 0.3777, "step": 11780 }, { "epoch": 10.22, "learning_rate": 3.211048951048951e-06, "loss": 0.4579, "step": 11790 }, { "epoch": 10.23, "learning_rate": 3.2103496503496504e-06, "loss": 0.3609, "step": 11800 }, { "epoch": 10.23, "learning_rate": 3.2096503496503495e-06, "loss": 0.4145, "step": 11810 }, { "epoch": 10.24, "learning_rate": 3.2089510489510486e-06, "loss": 0.4498, "step": 11820 }, { "epoch": 10.25, "learning_rate": 3.208251748251748e-06, "loss": 0.4212, "step": 11830 }, { "epoch": 10.26, "learning_rate": 3.2075524475524476e-06, "loss": 0.4339, "step": 11840 }, { "epoch": 10.27, "learning_rate": 3.2068531468531466e-06, "loss": 0.4033, "step": 11850 }, { "epoch": 10.28, "learning_rate": 3.206153846153846e-06, "loss": 0.3386, "step": 11860 }, { "epoch": 10.29, "learning_rate": 3.2054545454545452e-06, "loss": 0.3892, "step": 11870 }, { "epoch": 10.29, "learning_rate": 3.2047552447552443e-06, "loss": 0.3798, "step": 11880 }, { "epoch": 10.3, "learning_rate": 3.204055944055944e-06, "loss": 0.4161, "step": 11890 }, { "epoch": 10.31, "learning_rate": 3.2033566433566433e-06, "loss": 0.3388, "step": 11900 }, { "epoch": 10.32, "learning_rate": 3.2026573426573428e-06, "loss": 0.3871, "step": 11910 }, { "epoch": 10.33, "learning_rate": 3.2019580419580414e-06, "loss": 0.4393, "step": 11920 }, { "epoch": 10.34, "learning_rate": 3.201258741258741e-06, "loss": 0.4055, "step": 11930 }, { "epoch": 10.35, "learning_rate": 3.2005594405594404e-06, "loss": 0.434, "step": 11940 }, { "epoch": 10.36, "learning_rate": 3.19986013986014e-06, "loss": 0.4293, "step": 11950 }, { "epoch": 10.36, "learning_rate": 3.199160839160839e-06, "loss": 0.3783, "step": 11960 }, { "epoch": 10.37, "learning_rate": 3.1984615384615385e-06, "loss": 0.4578, "step": 11970 }, { "epoch": 10.38, "learning_rate": 3.1977622377622376e-06, "loss": 0.3943, "step": 11980 }, { "epoch": 10.39, "learning_rate": 3.1970629370629366e-06, "loss": 0.4987, "step": 11990 }, { "epoch": 10.4, "learning_rate": 3.196363636363636e-06, "loss": 0.4265, "step": 12000 }, { "epoch": 10.41, "learning_rate": 3.1956643356643356e-06, "loss": 0.3909, "step": 12010 }, { "epoch": 10.42, "learning_rate": 3.194965034965035e-06, "loss": 0.3212, "step": 12020 }, { "epoch": 10.42, "learning_rate": 3.1942657342657338e-06, "loss": 0.5361, "step": 12030 }, { "epoch": 10.43, "learning_rate": 3.1935664335664333e-06, "loss": 0.374, "step": 12040 }, { "epoch": 10.44, "learning_rate": 3.1928671328671328e-06, "loss": 0.4897, "step": 12050 }, { "epoch": 10.45, "learning_rate": 3.192167832167832e-06, "loss": 0.4381, "step": 12060 }, { "epoch": 10.46, "learning_rate": 3.1914685314685313e-06, "loss": 0.4138, "step": 12070 }, { "epoch": 10.47, "learning_rate": 3.190769230769231e-06, "loss": 0.4278, "step": 12080 }, { "epoch": 10.48, "learning_rate": 3.19006993006993e-06, "loss": 0.4777, "step": 12090 }, { "epoch": 10.49, "learning_rate": 3.189370629370629e-06, "loss": 0.3806, "step": 12100 }, { "epoch": 10.49, "learning_rate": 3.1886713286713285e-06, "loss": 0.4316, "step": 12110 }, { "epoch": 10.5, "learning_rate": 3.187972027972028e-06, "loss": 0.359, "step": 12120 }, { "epoch": 10.51, "learning_rate": 3.1872727272727275e-06, "loss": 0.4141, "step": 12130 }, { "epoch": 10.52, "learning_rate": 3.186573426573426e-06, "loss": 0.4678, "step": 12140 }, { "epoch": 10.53, "learning_rate": 3.1858741258741256e-06, "loss": 0.5613, "step": 12150 }, { "epoch": 10.54, "learning_rate": 3.185174825174825e-06, "loss": 0.4073, "step": 12160 }, { "epoch": 10.55, "learning_rate": 3.184475524475524e-06, "loss": 0.3658, "step": 12170 }, { "epoch": 10.55, "learning_rate": 3.1837762237762237e-06, "loss": 0.4292, "step": 12180 }, { "epoch": 10.56, "learning_rate": 3.183076923076923e-06, "loss": 0.3994, "step": 12190 }, { "epoch": 10.57, "learning_rate": 3.1823776223776223e-06, "loss": 0.3395, "step": 12200 }, { "epoch": 10.58, "learning_rate": 3.1816783216783213e-06, "loss": 0.3992, "step": 12210 }, { "epoch": 10.59, "learning_rate": 3.180979020979021e-06, "loss": 0.382, "step": 12220 }, { "epoch": 10.6, "learning_rate": 3.1802797202797203e-06, "loss": 0.4397, "step": 12230 }, { "epoch": 10.61, "learning_rate": 3.1795804195804194e-06, "loss": 0.4188, "step": 12240 }, { "epoch": 10.61, "learning_rate": 3.1788811188811185e-06, "loss": 0.3643, "step": 12250 }, { "epoch": 10.62, "learning_rate": 3.178181818181818e-06, "loss": 0.4586, "step": 12260 }, { "epoch": 10.63, "learning_rate": 3.1774825174825175e-06, "loss": 0.3905, "step": 12270 }, { "epoch": 10.64, "learning_rate": 3.1767832167832165e-06, "loss": 0.4422, "step": 12280 }, { "epoch": 10.65, "learning_rate": 3.176083916083916e-06, "loss": 0.3952, "step": 12290 }, { "epoch": 10.66, "learning_rate": 3.175384615384615e-06, "loss": 0.4059, "step": 12300 }, { "epoch": 10.67, "learning_rate": 3.1746853146853146e-06, "loss": 0.4235, "step": 12310 }, { "epoch": 10.68, "learning_rate": 3.1739860139860137e-06, "loss": 0.408, "step": 12320 }, { "epoch": 10.68, "learning_rate": 3.173286713286713e-06, "loss": 0.3726, "step": 12330 }, { "epoch": 10.69, "learning_rate": 3.1725874125874127e-06, "loss": 0.4191, "step": 12340 }, { "epoch": 10.7, "learning_rate": 3.1718881118881118e-06, "loss": 0.3919, "step": 12350 }, { "epoch": 10.71, "learning_rate": 3.171188811188811e-06, "loss": 0.4135, "step": 12360 }, { "epoch": 10.72, "learning_rate": 3.1704895104895103e-06, "loss": 0.449, "step": 12370 }, { "epoch": 10.73, "learning_rate": 3.16979020979021e-06, "loss": 0.4839, "step": 12380 }, { "epoch": 10.74, "learning_rate": 3.169090909090909e-06, "loss": 0.3793, "step": 12390 }, { "epoch": 10.74, "learning_rate": 3.1683916083916084e-06, "loss": 0.4173, "step": 12400 }, { "epoch": 10.75, "learning_rate": 3.1676923076923075e-06, "loss": 0.3964, "step": 12410 }, { "epoch": 10.76, "learning_rate": 3.1669930069930065e-06, "loss": 0.4478, "step": 12420 }, { "epoch": 10.77, "learning_rate": 3.166293706293706e-06, "loss": 0.4247, "step": 12430 }, { "epoch": 10.78, "learning_rate": 3.1655944055944055e-06, "loss": 0.4806, "step": 12440 }, { "epoch": 10.79, "learning_rate": 3.164895104895105e-06, "loss": 0.4104, "step": 12450 }, { "epoch": 10.8, "learning_rate": 3.164195804195804e-06, "loss": 0.4602, "step": 12460 }, { "epoch": 10.81, "learning_rate": 3.163496503496503e-06, "loss": 0.3707, "step": 12470 }, { "epoch": 10.81, "learning_rate": 3.1627972027972027e-06, "loss": 0.3626, "step": 12480 }, { "epoch": 10.82, "learning_rate": 3.162097902097902e-06, "loss": 0.4234, "step": 12490 }, { "epoch": 10.83, "learning_rate": 3.1613986013986012e-06, "loss": 0.37, "step": 12500 }, { "epoch": 10.84, "learning_rate": 3.1606993006993007e-06, "loss": 0.3754, "step": 12510 }, { "epoch": 10.85, "learning_rate": 3.16e-06, "loss": 0.4232, "step": 12520 }, { "epoch": 10.86, "learning_rate": 3.159300699300699e-06, "loss": 0.4205, "step": 12530 }, { "epoch": 10.87, "learning_rate": 3.1586013986013984e-06, "loss": 0.3652, "step": 12540 }, { "epoch": 10.87, "learning_rate": 3.157902097902098e-06, "loss": 0.4103, "step": 12550 }, { "epoch": 10.88, "learning_rate": 3.1572027972027974e-06, "loss": 0.4234, "step": 12560 }, { "epoch": 10.89, "learning_rate": 3.156503496503496e-06, "loss": 0.356, "step": 12570 }, { "epoch": 10.9, "learning_rate": 3.1558041958041955e-06, "loss": 0.4116, "step": 12580 }, { "epoch": 10.91, "learning_rate": 3.155104895104895e-06, "loss": 0.4963, "step": 12590 }, { "epoch": 10.92, "learning_rate": 3.154405594405594e-06, "loss": 0.4658, "step": 12600 }, { "epoch": 10.93, "learning_rate": 3.1537062937062936e-06, "loss": 0.4356, "step": 12610 }, { "epoch": 10.94, "learning_rate": 3.153006993006993e-06, "loss": 0.4288, "step": 12620 }, { "epoch": 10.94, "learning_rate": 3.152307692307692e-06, "loss": 0.3944, "step": 12630 }, { "epoch": 10.95, "learning_rate": 3.1516083916083912e-06, "loss": 0.4145, "step": 12640 }, { "epoch": 10.96, "learning_rate": 3.1509090909090907e-06, "loss": 0.4038, "step": 12650 }, { "epoch": 10.97, "learning_rate": 3.1502097902097902e-06, "loss": 0.4021, "step": 12660 }, { "epoch": 10.98, "learning_rate": 3.1495104895104897e-06, "loss": 0.377, "step": 12670 }, { "epoch": 10.99, "learning_rate": 3.1488111888111884e-06, "loss": 0.3921, "step": 12680 }, { "epoch": 11.0, "learning_rate": 3.148111888111888e-06, "loss": 0.4245, "step": 12690 }, { "epoch": 11.0, "eval_loss": 0.5647190809249878, "eval_runtime": 134.3558, "eval_samples_per_second": 3.96, "eval_steps_per_second": 1.98, "eval_wer": 0.2560905058815967, "step": 12694 }, { "epoch": 11.01, "learning_rate": 3.1474125874125874e-06, "loss": 0.3689, "step": 12700 }, { "epoch": 11.01, "learning_rate": 3.1467132867132864e-06, "loss": 0.3827, "step": 12710 }, { "epoch": 11.02, "learning_rate": 3.146013986013986e-06, "loss": 0.3676, "step": 12720 }, { "epoch": 11.03, "learning_rate": 3.1453146853146854e-06, "loss": 0.4533, "step": 12730 }, { "epoch": 11.04, "learning_rate": 3.1446153846153845e-06, "loss": 0.4324, "step": 12740 }, { "epoch": 11.05, "learning_rate": 3.1439160839160836e-06, "loss": 0.442, "step": 12750 }, { "epoch": 11.06, "learning_rate": 3.143216783216783e-06, "loss": 0.3553, "step": 12760 }, { "epoch": 11.07, "learning_rate": 3.1425174825174826e-06, "loss": 0.4051, "step": 12770 }, { "epoch": 11.07, "learning_rate": 3.1418181818181817e-06, "loss": 0.4422, "step": 12780 }, { "epoch": 11.08, "learning_rate": 3.1411188811188807e-06, "loss": 0.4083, "step": 12790 }, { "epoch": 11.09, "learning_rate": 3.1404195804195802e-06, "loss": 0.3878, "step": 12800 }, { "epoch": 11.1, "learning_rate": 3.1397202797202797e-06, "loss": 0.4111, "step": 12810 }, { "epoch": 11.11, "learning_rate": 3.139020979020979e-06, "loss": 0.4363, "step": 12820 }, { "epoch": 11.12, "learning_rate": 3.1383216783216783e-06, "loss": 0.4326, "step": 12830 }, { "epoch": 11.13, "learning_rate": 3.1376223776223778e-06, "loss": 0.393, "step": 12840 }, { "epoch": 11.14, "learning_rate": 3.1369230769230764e-06, "loss": 0.4463, "step": 12850 }, { "epoch": 11.14, "learning_rate": 3.136223776223776e-06, "loss": 0.4079, "step": 12860 }, { "epoch": 11.15, "learning_rate": 3.1355244755244754e-06, "loss": 0.4008, "step": 12870 }, { "epoch": 11.16, "learning_rate": 3.134825174825175e-06, "loss": 0.4737, "step": 12880 }, { "epoch": 11.17, "learning_rate": 3.134125874125874e-06, "loss": 0.4459, "step": 12890 }, { "epoch": 11.18, "learning_rate": 3.133426573426573e-06, "loss": 0.4121, "step": 12900 }, { "epoch": 11.19, "learning_rate": 3.1327272727272726e-06, "loss": 0.4312, "step": 12910 }, { "epoch": 11.2, "learning_rate": 3.132027972027972e-06, "loss": 0.3916, "step": 12920 }, { "epoch": 11.2, "learning_rate": 3.131328671328671e-06, "loss": 0.3627, "step": 12930 }, { "epoch": 11.21, "learning_rate": 3.1306293706293706e-06, "loss": 0.4057, "step": 12940 }, { "epoch": 11.22, "learning_rate": 3.1299300699300697e-06, "loss": 0.3761, "step": 12950 }, { "epoch": 11.23, "learning_rate": 3.1292307692307688e-06, "loss": 0.4694, "step": 12960 }, { "epoch": 11.24, "learning_rate": 3.1285314685314683e-06, "loss": 0.3899, "step": 12970 }, { "epoch": 11.25, "learning_rate": 3.1278321678321678e-06, "loss": 0.3499, "step": 12980 }, { "epoch": 11.26, "learning_rate": 3.1271328671328673e-06, "loss": 0.4372, "step": 12990 }, { "epoch": 11.27, "learning_rate": 3.1264335664335664e-06, "loss": 0.4522, "step": 13000 }, { "epoch": 11.27, "learning_rate": 3.1257342657342654e-06, "loss": 0.3943, "step": 13010 }, { "epoch": 11.28, "learning_rate": 3.125034965034965e-06, "loss": 0.3741, "step": 13020 }, { "epoch": 11.29, "learning_rate": 3.124335664335664e-06, "loss": 0.3595, "step": 13030 }, { "epoch": 11.3, "learning_rate": 3.1236363636363635e-06, "loss": 0.4889, "step": 13040 }, { "epoch": 11.31, "learning_rate": 3.122937062937063e-06, "loss": 0.3744, "step": 13050 }, { "epoch": 11.32, "learning_rate": 3.122237762237762e-06, "loss": 0.4061, "step": 13060 }, { "epoch": 11.33, "learning_rate": 3.121538461538461e-06, "loss": 0.4333, "step": 13070 }, { "epoch": 11.33, "learning_rate": 3.1208391608391606e-06, "loss": 0.3838, "step": 13080 }, { "epoch": 11.34, "learning_rate": 3.12013986013986e-06, "loss": 0.4064, "step": 13090 }, { "epoch": 11.35, "learning_rate": 3.1194405594405596e-06, "loss": 0.4572, "step": 13100 }, { "epoch": 11.36, "learning_rate": 3.1187412587412583e-06, "loss": 0.3864, "step": 13110 }, { "epoch": 11.37, "learning_rate": 3.1180419580419578e-06, "loss": 0.4353, "step": 13120 }, { "epoch": 11.38, "learning_rate": 3.1173426573426573e-06, "loss": 0.4305, "step": 13130 }, { "epoch": 11.39, "learning_rate": 3.1166433566433563e-06, "loss": 0.4294, "step": 13140 }, { "epoch": 11.39, "learning_rate": 3.115944055944056e-06, "loss": 0.3242, "step": 13150 }, { "epoch": 11.4, "learning_rate": 3.1152447552447553e-06, "loss": 0.3815, "step": 13160 }, { "epoch": 11.41, "learning_rate": 3.1145454545454544e-06, "loss": 0.3437, "step": 13170 }, { "epoch": 11.42, "learning_rate": 3.1138461538461535e-06, "loss": 0.4029, "step": 13180 }, { "epoch": 11.43, "learning_rate": 3.113146853146853e-06, "loss": 0.4357, "step": 13190 }, { "epoch": 11.44, "learning_rate": 3.1124475524475525e-06, "loss": 0.4073, "step": 13200 }, { "epoch": 11.45, "learning_rate": 3.1117482517482516e-06, "loss": 0.3962, "step": 13210 }, { "epoch": 11.46, "learning_rate": 3.1110489510489506e-06, "loss": 0.3896, "step": 13220 }, { "epoch": 11.46, "learning_rate": 3.11034965034965e-06, "loss": 0.422, "step": 13230 }, { "epoch": 11.47, "learning_rate": 3.1096503496503496e-06, "loss": 0.3918, "step": 13240 }, { "epoch": 11.48, "learning_rate": 3.1089510489510487e-06, "loss": 0.3884, "step": 13250 }, { "epoch": 11.49, "learning_rate": 3.108251748251748e-06, "loss": 0.4256, "step": 13260 }, { "epoch": 11.5, "learning_rate": 3.1075524475524477e-06, "loss": 0.4003, "step": 13270 }, { "epoch": 11.51, "learning_rate": 3.1068531468531468e-06, "loss": 0.3744, "step": 13280 }, { "epoch": 11.52, "learning_rate": 3.106153846153846e-06, "loss": 0.4673, "step": 13290 }, { "epoch": 11.52, "learning_rate": 3.1054545454545453e-06, "loss": 0.473, "step": 13300 }, { "epoch": 11.53, "learning_rate": 3.104755244755245e-06, "loss": 0.3683, "step": 13310 }, { "epoch": 11.54, "learning_rate": 3.104055944055944e-06, "loss": 0.3906, "step": 13320 }, { "epoch": 11.55, "learning_rate": 3.103356643356643e-06, "loss": 0.4705, "step": 13330 }, { "epoch": 11.56, "learning_rate": 3.1026573426573425e-06, "loss": 0.4346, "step": 13340 }, { "epoch": 11.57, "learning_rate": 3.101958041958042e-06, "loss": 0.3415, "step": 13350 }, { "epoch": 11.58, "learning_rate": 3.101258741258741e-06, "loss": 0.3599, "step": 13360 }, { "epoch": 11.59, "learning_rate": 3.1005594405594405e-06, "loss": 0.3877, "step": 13370 }, { "epoch": 11.59, "learning_rate": 3.09986013986014e-06, "loss": 0.4167, "step": 13380 }, { "epoch": 11.6, "learning_rate": 3.0991608391608387e-06, "loss": 0.4292, "step": 13390 }, { "epoch": 11.61, "learning_rate": 3.098461538461538e-06, "loss": 0.4469, "step": 13400 }, { "epoch": 11.62, "learning_rate": 3.0977622377622377e-06, "loss": 0.4273, "step": 13410 }, { "epoch": 11.63, "learning_rate": 3.097062937062937e-06, "loss": 0.3338, "step": 13420 }, { "epoch": 11.64, "learning_rate": 3.0963636363636362e-06, "loss": 0.422, "step": 13430 }, { "epoch": 11.65, "learning_rate": 3.0956643356643353e-06, "loss": 0.4025, "step": 13440 }, { "epoch": 11.65, "learning_rate": 3.094965034965035e-06, "loss": 0.4044, "step": 13450 }, { "epoch": 11.66, "learning_rate": 3.0942657342657343e-06, "loss": 0.4187, "step": 13460 }, { "epoch": 11.67, "learning_rate": 3.0935664335664334e-06, "loss": 0.3947, "step": 13470 }, { "epoch": 11.68, "learning_rate": 3.092867132867133e-06, "loss": 0.3553, "step": 13480 }, { "epoch": 11.69, "learning_rate": 3.092167832167832e-06, "loss": 0.4187, "step": 13490 }, { "epoch": 11.7, "learning_rate": 3.091468531468531e-06, "loss": 0.4666, "step": 13500 }, { "epoch": 11.71, "learning_rate": 3.0907692307692305e-06, "loss": 0.4248, "step": 13510 }, { "epoch": 11.72, "learning_rate": 3.09006993006993e-06, "loss": 0.362, "step": 13520 }, { "epoch": 11.72, "learning_rate": 3.0893706293706295e-06, "loss": 0.4296, "step": 13530 }, { "epoch": 11.73, "learning_rate": 3.0886713286713286e-06, "loss": 0.3882, "step": 13540 }, { "epoch": 11.74, "learning_rate": 3.0879720279720277e-06, "loss": 0.3709, "step": 13550 }, { "epoch": 11.75, "learning_rate": 3.087272727272727e-06, "loss": 0.3679, "step": 13560 }, { "epoch": 11.76, "learning_rate": 3.0865734265734262e-06, "loss": 0.4126, "step": 13570 }, { "epoch": 11.77, "learning_rate": 3.0858741258741257e-06, "loss": 0.4288, "step": 13580 }, { "epoch": 11.78, "learning_rate": 3.0851748251748252e-06, "loss": 0.3786, "step": 13590 }, { "epoch": 11.78, "learning_rate": 3.0844755244755243e-06, "loss": 0.381, "step": 13600 }, { "epoch": 11.79, "learning_rate": 3.0837762237762234e-06, "loss": 0.4091, "step": 13610 }, { "epoch": 11.8, "learning_rate": 3.083076923076923e-06, "loss": 0.3875, "step": 13620 }, { "epoch": 11.81, "learning_rate": 3.0823776223776224e-06, "loss": 0.3907, "step": 13630 }, { "epoch": 11.82, "learning_rate": 3.081678321678322e-06, "loss": 0.3664, "step": 13640 }, { "epoch": 11.83, "learning_rate": 3.080979020979021e-06, "loss": 0.3494, "step": 13650 }, { "epoch": 11.84, "learning_rate": 3.08027972027972e-06, "loss": 0.3899, "step": 13660 }, { "epoch": 11.85, "learning_rate": 3.0795804195804195e-06, "loss": 0.4002, "step": 13670 }, { "epoch": 11.85, "learning_rate": 3.0788811188811186e-06, "loss": 0.5063, "step": 13680 }, { "epoch": 11.86, "learning_rate": 3.078181818181818e-06, "loss": 0.4773, "step": 13690 }, { "epoch": 11.87, "learning_rate": 3.0774825174825176e-06, "loss": 0.3547, "step": 13700 }, { "epoch": 11.88, "learning_rate": 3.0767832167832167e-06, "loss": 0.3995, "step": 13710 }, { "epoch": 11.89, "learning_rate": 3.0760839160839157e-06, "loss": 0.4126, "step": 13720 }, { "epoch": 11.9, "learning_rate": 3.0753846153846152e-06, "loss": 0.3785, "step": 13730 }, { "epoch": 11.91, "learning_rate": 3.0746853146853147e-06, "loss": 0.4024, "step": 13740 }, { "epoch": 11.91, "learning_rate": 3.073986013986014e-06, "loss": 0.3838, "step": 13750 }, { "epoch": 11.92, "learning_rate": 3.073286713286713e-06, "loss": 0.4221, "step": 13760 }, { "epoch": 11.93, "learning_rate": 3.0725874125874124e-06, "loss": 0.4061, "step": 13770 }, { "epoch": 11.94, "learning_rate": 3.071888111888112e-06, "loss": 0.4233, "step": 13780 }, { "epoch": 11.95, "learning_rate": 3.071188811188811e-06, "loss": 0.3744, "step": 13790 }, { "epoch": 11.96, "learning_rate": 3.0704895104895104e-06, "loss": 0.409, "step": 13800 }, { "epoch": 11.97, "learning_rate": 3.06979020979021e-06, "loss": 0.4319, "step": 13810 }, { "epoch": 11.98, "learning_rate": 3.0690909090909086e-06, "loss": 0.4032, "step": 13820 }, { "epoch": 11.98, "learning_rate": 3.068391608391608e-06, "loss": 0.4338, "step": 13830 }, { "epoch": 11.99, "learning_rate": 3.0676923076923076e-06, "loss": 0.3946, "step": 13840 }, { "epoch": 12.0, "eval_loss": 0.5525963306427002, "eval_runtime": 133.5393, "eval_samples_per_second": 3.984, "eval_steps_per_second": 1.992, "eval_wer": 0.26348267660860064, "step": 13848 }, { "epoch": 12.0, "learning_rate": 3.066993006993007e-06, "loss": 0.3896, "step": 13850 }, { "epoch": 12.01, "learning_rate": 3.066293706293706e-06, "loss": 0.4106, "step": 13860 }, { "epoch": 12.02, "learning_rate": 3.0655944055944052e-06, "loss": 0.4001, "step": 13870 }, { "epoch": 12.03, "learning_rate": 3.0648951048951047e-06, "loss": 0.3334, "step": 13880 }, { "epoch": 12.04, "learning_rate": 3.0641958041958042e-06, "loss": 0.3551, "step": 13890 }, { "epoch": 12.05, "learning_rate": 3.0634965034965033e-06, "loss": 0.4169, "step": 13900 }, { "epoch": 12.05, "learning_rate": 3.0627972027972028e-06, "loss": 0.3991, "step": 13910 }, { "epoch": 12.06, "learning_rate": 3.0620979020979023e-06, "loss": 0.4, "step": 13920 }, { "epoch": 12.07, "learning_rate": 3.061398601398601e-06, "loss": 0.4013, "step": 13930 }, { "epoch": 12.08, "learning_rate": 3.0606993006993004e-06, "loss": 0.3758, "step": 13940 }, { "epoch": 12.09, "learning_rate": 3.06e-06, "loss": 0.4109, "step": 13950 }, { "epoch": 12.1, "learning_rate": 3.0593006993006994e-06, "loss": 0.4589, "step": 13960 }, { "epoch": 12.11, "learning_rate": 3.0586713286713285e-06, "loss": 0.4093, "step": 13970 }, { "epoch": 12.11, "learning_rate": 3.057972027972028e-06, "loss": 0.422, "step": 13980 }, { "epoch": 12.12, "learning_rate": 3.057272727272727e-06, "loss": 0.4142, "step": 13990 }, { "epoch": 12.13, "learning_rate": 3.0565734265734265e-06, "loss": 0.394, "step": 14000 }, { "epoch": 12.14, "learning_rate": 3.055874125874126e-06, "loss": 0.4007, "step": 14010 }, { "epoch": 12.15, "learning_rate": 3.0551748251748247e-06, "loss": 0.3457, "step": 14020 }, { "epoch": 12.16, "learning_rate": 3.054475524475524e-06, "loss": 0.3427, "step": 14030 }, { "epoch": 12.17, "learning_rate": 3.0537762237762237e-06, "loss": 0.4197, "step": 14040 }, { "epoch": 12.17, "learning_rate": 3.053076923076923e-06, "loss": 0.3985, "step": 14050 }, { "epoch": 12.18, "learning_rate": 3.0523776223776222e-06, "loss": 0.3557, "step": 14060 }, { "epoch": 12.19, "learning_rate": 3.0516783216783213e-06, "loss": 0.389, "step": 14070 }, { "epoch": 12.2, "learning_rate": 3.050979020979021e-06, "loss": 0.4019, "step": 14080 }, { "epoch": 12.21, "learning_rate": 3.0502797202797203e-06, "loss": 0.3896, "step": 14090 }, { "epoch": 12.22, "learning_rate": 3.0495804195804194e-06, "loss": 0.3969, "step": 14100 }, { "epoch": 12.23, "learning_rate": 3.048881118881119e-06, "loss": 0.3983, "step": 14110 }, { "epoch": 12.24, "learning_rate": 3.0481818181818184e-06, "loss": 0.3853, "step": 14120 }, { "epoch": 12.24, "learning_rate": 3.047482517482517e-06, "loss": 0.405, "step": 14130 }, { "epoch": 12.25, "learning_rate": 3.0467832167832165e-06, "loss": 0.4416, "step": 14140 }, { "epoch": 12.26, "learning_rate": 3.046083916083916e-06, "loss": 0.4443, "step": 14150 }, { "epoch": 12.27, "learning_rate": 3.0453846153846155e-06, "loss": 0.4276, "step": 14160 }, { "epoch": 12.28, "learning_rate": 3.0446853146853146e-06, "loss": 0.3815, "step": 14170 }, { "epoch": 12.29, "learning_rate": 3.0439860139860137e-06, "loss": 0.3975, "step": 14180 }, { "epoch": 12.3, "learning_rate": 3.043286713286713e-06, "loss": 0.4268, "step": 14190 }, { "epoch": 12.3, "learning_rate": 3.0425874125874122e-06, "loss": 0.3851, "step": 14200 }, { "epoch": 12.31, "learning_rate": 3.0418881118881117e-06, "loss": 0.4057, "step": 14210 }, { "epoch": 12.32, "learning_rate": 3.0411888111888112e-06, "loss": 0.407, "step": 14220 }, { "epoch": 12.33, "learning_rate": 3.0404895104895107e-06, "loss": 0.4224, "step": 14230 }, { "epoch": 12.34, "learning_rate": 3.0397902097902094e-06, "loss": 0.4311, "step": 14240 }, { "epoch": 12.35, "learning_rate": 3.039090909090909e-06, "loss": 0.4162, "step": 14250 }, { "epoch": 12.36, "learning_rate": 3.0383916083916084e-06, "loss": 0.4437, "step": 14260 }, { "epoch": 12.37, "learning_rate": 3.037692307692308e-06, "loss": 0.4052, "step": 14270 }, { "epoch": 12.37, "learning_rate": 3.036993006993007e-06, "loss": 0.3864, "step": 14280 }, { "epoch": 12.38, "learning_rate": 3.036293706293706e-06, "loss": 0.4052, "step": 14290 }, { "epoch": 12.39, "learning_rate": 3.0355944055944055e-06, "loss": 0.3948, "step": 14300 }, { "epoch": 12.4, "learning_rate": 3.0348951048951046e-06, "loss": 0.4039, "step": 14310 }, { "epoch": 12.41, "learning_rate": 3.034195804195804e-06, "loss": 0.3865, "step": 14320 }, { "epoch": 12.42, "learning_rate": 3.0334965034965036e-06, "loss": 0.3794, "step": 14330 }, { "epoch": 12.43, "learning_rate": 3.0327972027972026e-06, "loss": 0.4173, "step": 14340 }, { "epoch": 12.43, "learning_rate": 3.0320979020979017e-06, "loss": 0.4037, "step": 14350 }, { "epoch": 12.44, "learning_rate": 3.0313986013986012e-06, "loss": 0.4497, "step": 14360 }, { "epoch": 12.45, "learning_rate": 3.0306993006993007e-06, "loss": 0.4244, "step": 14370 }, { "epoch": 12.46, "learning_rate": 3.03e-06, "loss": 0.3988, "step": 14380 }, { "epoch": 12.47, "learning_rate": 3.0293006993006993e-06, "loss": 0.4545, "step": 14390 }, { "epoch": 12.48, "learning_rate": 3.0286013986013984e-06, "loss": 0.5355, "step": 14400 }, { "epoch": 12.49, "learning_rate": 3.027902097902098e-06, "loss": 0.3757, "step": 14410 }, { "epoch": 12.5, "learning_rate": 3.027202797202797e-06, "loss": 0.3856, "step": 14420 }, { "epoch": 12.5, "learning_rate": 3.0265034965034964e-06, "loss": 0.4305, "step": 14430 }, { "epoch": 12.51, "learning_rate": 3.025804195804196e-06, "loss": 0.4123, "step": 14440 }, { "epoch": 12.52, "learning_rate": 3.0251048951048946e-06, "loss": 0.3745, "step": 14450 }, { "epoch": 12.53, "learning_rate": 3.024405594405594e-06, "loss": 0.357, "step": 14460 }, { "epoch": 12.54, "learning_rate": 3.0237062937062936e-06, "loss": 0.3626, "step": 14470 }, { "epoch": 12.55, "learning_rate": 3.023006993006993e-06, "loss": 0.3647, "step": 14480 }, { "epoch": 12.56, "learning_rate": 3.022307692307692e-06, "loss": 0.3769, "step": 14490 }, { "epoch": 12.56, "learning_rate": 3.0216083916083916e-06, "loss": 0.4741, "step": 14500 }, { "epoch": 12.57, "learning_rate": 3.0209090909090907e-06, "loss": 0.3898, "step": 14510 }, { "epoch": 12.58, "learning_rate": 3.02020979020979e-06, "loss": 0.3792, "step": 14520 }, { "epoch": 12.59, "learning_rate": 3.0195104895104893e-06, "loss": 0.3776, "step": 14530 }, { "epoch": 12.6, "learning_rate": 3.0188111888111888e-06, "loss": 0.4141, "step": 14540 }, { "epoch": 12.61, "learning_rate": 3.0181118881118883e-06, "loss": 0.3948, "step": 14550 }, { "epoch": 12.62, "learning_rate": 3.017412587412587e-06, "loss": 0.3601, "step": 14560 }, { "epoch": 12.63, "learning_rate": 3.0167132867132864e-06, "loss": 0.4267, "step": 14570 }, { "epoch": 12.63, "learning_rate": 3.016013986013986e-06, "loss": 0.4611, "step": 14580 }, { "epoch": 12.64, "learning_rate": 3.0153146853146854e-06, "loss": 0.4253, "step": 14590 }, { "epoch": 12.65, "learning_rate": 3.0146153846153845e-06, "loss": 0.4089, "step": 14600 }, { "epoch": 12.66, "learning_rate": 3.0139160839160836e-06, "loss": 0.3613, "step": 14610 }, { "epoch": 12.67, "learning_rate": 3.013216783216783e-06, "loss": 0.3582, "step": 14620 }, { "epoch": 12.68, "learning_rate": 3.012517482517482e-06, "loss": 0.3913, "step": 14630 }, { "epoch": 12.69, "learning_rate": 3.0118181818181816e-06, "loss": 0.4095, "step": 14640 }, { "epoch": 12.69, "learning_rate": 3.011118881118881e-06, "loss": 0.3807, "step": 14650 }, { "epoch": 12.7, "learning_rate": 3.0104195804195806e-06, "loss": 0.4255, "step": 14660 }, { "epoch": 12.71, "learning_rate": 3.0097202797202793e-06, "loss": 0.385, "step": 14670 }, { "epoch": 12.72, "learning_rate": 3.0090209790209788e-06, "loss": 0.3581, "step": 14680 }, { "epoch": 12.73, "learning_rate": 3.0083216783216783e-06, "loss": 0.407, "step": 14690 }, { "epoch": 12.74, "learning_rate": 3.0076223776223778e-06, "loss": 0.4068, "step": 14700 }, { "epoch": 12.75, "learning_rate": 3.006923076923077e-06, "loss": 0.4436, "step": 14710 }, { "epoch": 12.76, "learning_rate": 3.006223776223776e-06, "loss": 0.3818, "step": 14720 }, { "epoch": 12.76, "learning_rate": 3.0055244755244754e-06, "loss": 0.3307, "step": 14730 }, { "epoch": 12.77, "learning_rate": 3.0048251748251745e-06, "loss": 0.4024, "step": 14740 }, { "epoch": 12.78, "learning_rate": 3.004125874125874e-06, "loss": 0.4657, "step": 14750 }, { "epoch": 12.79, "learning_rate": 3.0034265734265735e-06, "loss": 0.4503, "step": 14760 }, { "epoch": 12.8, "learning_rate": 3.002727272727273e-06, "loss": 0.3551, "step": 14770 }, { "epoch": 12.81, "learning_rate": 3.0020279720279716e-06, "loss": 0.4221, "step": 14780 }, { "epoch": 12.82, "learning_rate": 3.001328671328671e-06, "loss": 0.3889, "step": 14790 }, { "epoch": 12.82, "learning_rate": 3.0006293706293706e-06, "loss": 0.3709, "step": 14800 }, { "epoch": 12.83, "learning_rate": 2.9999300699300697e-06, "loss": 0.4108, "step": 14810 }, { "epoch": 12.84, "learning_rate": 2.999230769230769e-06, "loss": 0.402, "step": 14820 }, { "epoch": 12.85, "learning_rate": 2.9985314685314683e-06, "loss": 0.3713, "step": 14830 }, { "epoch": 12.86, "learning_rate": 2.9978321678321678e-06, "loss": 0.4058, "step": 14840 }, { "epoch": 12.87, "learning_rate": 2.997132867132867e-06, "loss": 0.3828, "step": 14850 }, { "epoch": 12.88, "learning_rate": 2.9964335664335663e-06, "loss": 0.3566, "step": 14860 }, { "epoch": 12.89, "learning_rate": 2.995734265734266e-06, "loss": 0.3908, "step": 14870 }, { "epoch": 12.89, "learning_rate": 2.9950349650349653e-06, "loss": 0.4369, "step": 14880 }, { "epoch": 12.9, "learning_rate": 2.994335664335664e-06, "loss": 0.4022, "step": 14890 }, { "epoch": 12.91, "learning_rate": 2.9936363636363635e-06, "loss": 0.4866, "step": 14900 }, { "epoch": 12.92, "learning_rate": 2.992937062937063e-06, "loss": 0.4089, "step": 14910 }, { "epoch": 12.93, "learning_rate": 2.992237762237762e-06, "loss": 0.3921, "step": 14920 }, { "epoch": 12.94, "learning_rate": 2.9915384615384615e-06, "loss": 0.4111, "step": 14930 }, { "epoch": 12.95, "learning_rate": 2.9908391608391606e-06, "loss": 0.3707, "step": 14940 }, { "epoch": 12.95, "learning_rate": 2.99013986013986e-06, "loss": 0.5013, "step": 14950 }, { "epoch": 12.96, "learning_rate": 2.989440559440559e-06, "loss": 0.4334, "step": 14960 }, { "epoch": 12.97, "learning_rate": 2.9887412587412587e-06, "loss": 0.4315, "step": 14970 }, { "epoch": 12.98, "learning_rate": 2.988041958041958e-06, "loss": 0.382, "step": 14980 }, { "epoch": 12.99, "learning_rate": 2.987342657342657e-06, "loss": 0.3887, "step": 14990 }, { "epoch": 13.0, "learning_rate": 2.9866433566433563e-06, "loss": 0.3722, "step": 15000 }, { "epoch": 13.0, "eval_loss": 0.5786426663398743, "eval_runtime": 133.9404, "eval_samples_per_second": 3.972, "eval_steps_per_second": 1.986, "eval_wer": 0.25654046409976217, "step": 15002 }, { "epoch": 13.01, "learning_rate": 2.985944055944056e-06, "loss": 0.3685, "step": 15010 }, { "epoch": 13.02, "learning_rate": 2.9852447552447553e-06, "loss": 0.3702, "step": 15020 }, { "epoch": 13.02, "learning_rate": 2.9845454545454544e-06, "loss": 0.3794, "step": 15030 }, { "epoch": 13.03, "learning_rate": 2.983846153846154e-06, "loss": 0.3762, "step": 15040 }, { "epoch": 13.04, "learning_rate": 2.983146853146853e-06, "loss": 0.4761, "step": 15050 }, { "epoch": 13.05, "learning_rate": 2.9824475524475525e-06, "loss": 0.401, "step": 15060 }, { "epoch": 13.06, "learning_rate": 2.9817482517482515e-06, "loss": 0.4142, "step": 15070 }, { "epoch": 13.07, "learning_rate": 2.981048951048951e-06, "loss": 0.3326, "step": 15080 }, { "epoch": 13.08, "learning_rate": 2.9803496503496505e-06, "loss": 0.3793, "step": 15090 }, { "epoch": 13.08, "learning_rate": 2.979650349650349e-06, "loss": 0.3986, "step": 15100 }, { "epoch": 13.09, "learning_rate": 2.9789510489510487e-06, "loss": 0.3771, "step": 15110 }, { "epoch": 13.1, "learning_rate": 2.978251748251748e-06, "loss": 0.3902, "step": 15120 }, { "epoch": 13.11, "learning_rate": 2.9775524475524477e-06, "loss": 0.3795, "step": 15130 }, { "epoch": 13.12, "learning_rate": 2.9768531468531467e-06, "loss": 0.4201, "step": 15140 }, { "epoch": 13.13, "learning_rate": 2.976153846153846e-06, "loss": 0.409, "step": 15150 }, { "epoch": 13.14, "learning_rate": 2.9754545454545453e-06, "loss": 0.4454, "step": 15160 }, { "epoch": 13.15, "learning_rate": 2.9747552447552444e-06, "loss": 0.44, "step": 15170 }, { "epoch": 13.15, "learning_rate": 2.974055944055944e-06, "loss": 0.413, "step": 15180 }, { "epoch": 13.16, "learning_rate": 2.9733566433566434e-06, "loss": 0.3937, "step": 15190 }, { "epoch": 13.17, "learning_rate": 2.972657342657343e-06, "loss": 0.3827, "step": 15200 }, { "epoch": 13.18, "learning_rate": 2.9719580419580415e-06, "loss": 0.3791, "step": 15210 }, { "epoch": 13.19, "learning_rate": 2.971258741258741e-06, "loss": 0.3759, "step": 15220 }, { "epoch": 13.2, "learning_rate": 2.9705594405594405e-06, "loss": 0.3828, "step": 15230 }, { "epoch": 13.21, "learning_rate": 2.96986013986014e-06, "loss": 0.3988, "step": 15240 }, { "epoch": 13.21, "learning_rate": 2.969160839160839e-06, "loss": 0.4248, "step": 15250 }, { "epoch": 13.22, "learning_rate": 2.968461538461538e-06, "loss": 0.472, "step": 15260 }, { "epoch": 13.23, "learning_rate": 2.9677622377622377e-06, "loss": 0.3754, "step": 15270 }, { "epoch": 13.24, "learning_rate": 2.9670629370629367e-06, "loss": 0.3814, "step": 15280 }, { "epoch": 13.25, "learning_rate": 2.9663636363636362e-06, "loss": 0.4308, "step": 15290 }, { "epoch": 13.26, "learning_rate": 2.9656643356643357e-06, "loss": 0.3784, "step": 15300 }, { "epoch": 13.27, "learning_rate": 2.9649650349650352e-06, "loss": 0.435, "step": 15310 }, { "epoch": 13.28, "learning_rate": 2.964265734265734e-06, "loss": 0.4053, "step": 15320 }, { "epoch": 13.28, "learning_rate": 2.9635664335664334e-06, "loss": 0.4048, "step": 15330 }, { "epoch": 13.29, "learning_rate": 2.962867132867133e-06, "loss": 0.4112, "step": 15340 }, { "epoch": 13.3, "learning_rate": 2.962167832167832e-06, "loss": 0.3558, "step": 15350 }, { "epoch": 13.31, "learning_rate": 2.9614685314685314e-06, "loss": 0.4515, "step": 15360 }, { "epoch": 13.32, "learning_rate": 2.9607692307692305e-06, "loss": 0.3856, "step": 15370 }, { "epoch": 13.33, "learning_rate": 2.96006993006993e-06, "loss": 0.3782, "step": 15380 }, { "epoch": 13.34, "learning_rate": 2.959370629370629e-06, "loss": 0.4126, "step": 15390 }, { "epoch": 13.34, "learning_rate": 2.9586713286713286e-06, "loss": 0.3945, "step": 15400 }, { "epoch": 13.35, "learning_rate": 2.957972027972028e-06, "loss": 0.4101, "step": 15410 }, { "epoch": 13.36, "learning_rate": 2.9572727272727267e-06, "loss": 0.4763, "step": 15420 }, { "epoch": 13.37, "learning_rate": 2.9565734265734262e-06, "loss": 0.3442, "step": 15430 }, { "epoch": 13.38, "learning_rate": 2.9558741258741257e-06, "loss": 0.3997, "step": 15440 }, { "epoch": 13.39, "learning_rate": 2.955174825174825e-06, "loss": 0.4133, "step": 15450 }, { "epoch": 13.4, "learning_rate": 2.9544755244755243e-06, "loss": 0.4239, "step": 15460 }, { "epoch": 13.41, "learning_rate": 2.9537762237762238e-06, "loss": 0.4066, "step": 15470 }, { "epoch": 13.41, "learning_rate": 2.953076923076923e-06, "loss": 0.3706, "step": 15480 }, { "epoch": 13.42, "learning_rate": 2.9523776223776223e-06, "loss": 0.3928, "step": 15490 }, { "epoch": 13.43, "learning_rate": 2.9516783216783214e-06, "loss": 0.4208, "step": 15500 }, { "epoch": 13.44, "learning_rate": 2.950979020979021e-06, "loss": 0.4563, "step": 15510 }, { "epoch": 13.45, "learning_rate": 2.9502797202797204e-06, "loss": 0.4204, "step": 15520 }, { "epoch": 13.46, "learning_rate": 2.949580419580419e-06, "loss": 0.3688, "step": 15530 }, { "epoch": 13.47, "learning_rate": 2.9488811188811186e-06, "loss": 0.478, "step": 15540 }, { "epoch": 13.47, "learning_rate": 2.948181818181818e-06, "loss": 0.4186, "step": 15550 }, { "epoch": 13.48, "learning_rate": 2.9474825174825176e-06, "loss": 0.3855, "step": 15560 }, { "epoch": 13.49, "learning_rate": 2.9467832167832166e-06, "loss": 0.4161, "step": 15570 }, { "epoch": 13.5, "learning_rate": 2.946083916083916e-06, "loss": 0.3894, "step": 15580 }, { "epoch": 13.51, "learning_rate": 2.945384615384615e-06, "loss": 0.4233, "step": 15590 }, { "epoch": 13.52, "learning_rate": 2.9446853146853143e-06, "loss": 0.504, "step": 15600 }, { "epoch": 13.53, "learning_rate": 2.9439860139860138e-06, "loss": 0.4012, "step": 15610 }, { "epoch": 13.54, "learning_rate": 2.9432867132867133e-06, "loss": 0.3991, "step": 15620 }, { "epoch": 13.54, "learning_rate": 2.9425874125874128e-06, "loss": 0.4202, "step": 15630 }, { "epoch": 13.55, "learning_rate": 2.9418881118881114e-06, "loss": 0.4122, "step": 15640 }, { "epoch": 13.56, "learning_rate": 2.941188811188811e-06, "loss": 0.4015, "step": 15650 }, { "epoch": 13.57, "learning_rate": 2.9404895104895104e-06, "loss": 0.4611, "step": 15660 }, { "epoch": 13.58, "learning_rate": 2.93979020979021e-06, "loss": 0.3858, "step": 15670 }, { "epoch": 13.59, "learning_rate": 2.939090909090909e-06, "loss": 0.3611, "step": 15680 }, { "epoch": 13.6, "learning_rate": 2.9383916083916085e-06, "loss": 0.4195, "step": 15690 }, { "epoch": 13.6, "learning_rate": 2.9376923076923076e-06, "loss": 0.4241, "step": 15700 }, { "epoch": 13.61, "learning_rate": 2.9369930069930066e-06, "loss": 0.3334, "step": 15710 }, { "epoch": 13.62, "learning_rate": 2.936293706293706e-06, "loss": 0.3701, "step": 15720 }, { "epoch": 13.63, "learning_rate": 2.9355944055944056e-06, "loss": 0.4322, "step": 15730 }, { "epoch": 13.64, "learning_rate": 2.934895104895105e-06, "loss": 0.4141, "step": 15740 }, { "epoch": 13.65, "learning_rate": 2.9341958041958038e-06, "loss": 0.3971, "step": 15750 }, { "epoch": 13.66, "learning_rate": 2.9334965034965033e-06, "loss": 0.368, "step": 15760 }, { "epoch": 13.67, "learning_rate": 2.9327972027972028e-06, "loss": 0.328, "step": 15770 }, { "epoch": 13.67, "learning_rate": 2.932097902097902e-06, "loss": 0.3849, "step": 15780 }, { "epoch": 13.68, "learning_rate": 2.9313986013986013e-06, "loss": 0.4378, "step": 15790 }, { "epoch": 13.69, "learning_rate": 2.9306993006993004e-06, "loss": 0.3931, "step": 15800 }, { "epoch": 13.7, "learning_rate": 2.93e-06, "loss": 0.3739, "step": 15810 }, { "epoch": 13.71, "learning_rate": 2.929300699300699e-06, "loss": 0.3899, "step": 15820 }, { "epoch": 13.72, "learning_rate": 2.9286013986013985e-06, "loss": 0.4047, "step": 15830 }, { "epoch": 13.73, "learning_rate": 2.927902097902098e-06, "loss": 0.4169, "step": 15840 }, { "epoch": 13.73, "learning_rate": 2.9272027972027975e-06, "loss": 0.4546, "step": 15850 }, { "epoch": 13.74, "learning_rate": 2.926503496503496e-06, "loss": 0.3633, "step": 15860 }, { "epoch": 13.75, "learning_rate": 2.9258041958041956e-06, "loss": 0.4205, "step": 15870 }, { "epoch": 13.76, "learning_rate": 2.925104895104895e-06, "loss": 0.4143, "step": 15880 }, { "epoch": 13.77, "learning_rate": 2.924405594405594e-06, "loss": 0.3766, "step": 15890 }, { "epoch": 13.78, "learning_rate": 2.9237062937062937e-06, "loss": 0.4132, "step": 15900 }, { "epoch": 13.79, "learning_rate": 2.9230069930069928e-06, "loss": 0.4101, "step": 15910 }, { "epoch": 13.8, "learning_rate": 2.9223076923076922e-06, "loss": 0.4221, "step": 15920 }, { "epoch": 13.8, "learning_rate": 2.9216083916083913e-06, "loss": 0.3648, "step": 15930 }, { "epoch": 13.81, "learning_rate": 2.920909090909091e-06, "loss": 0.4157, "step": 15940 }, { "epoch": 13.82, "learning_rate": 2.9202097902097903e-06, "loss": 0.4349, "step": 15950 }, { "epoch": 13.83, "learning_rate": 2.919510489510489e-06, "loss": 0.4585, "step": 15960 }, { "epoch": 13.84, "learning_rate": 2.9188111888111885e-06, "loss": 0.4467, "step": 15970 }, { "epoch": 13.85, "learning_rate": 2.918111888111888e-06, "loss": 0.3707, "step": 15980 }, { "epoch": 13.86, "learning_rate": 2.9174125874125875e-06, "loss": 0.4144, "step": 15990 }, { "epoch": 13.86, "learning_rate": 2.9167132867132865e-06, "loss": 0.4674, "step": 16000 }, { "epoch": 13.87, "learning_rate": 2.916013986013986e-06, "loss": 0.4244, "step": 16010 }, { "epoch": 13.88, "learning_rate": 2.915314685314685e-06, "loss": 0.3754, "step": 16020 }, { "epoch": 13.89, "learning_rate": 2.9146153846153846e-06, "loss": 0.3857, "step": 16030 }, { "epoch": 13.9, "learning_rate": 2.9139160839160837e-06, "loss": 0.3695, "step": 16040 }, { "epoch": 13.91, "learning_rate": 2.913216783216783e-06, "loss": 0.4657, "step": 16050 }, { "epoch": 13.92, "learning_rate": 2.9125174825174827e-06, "loss": 0.4059, "step": 16060 }, { "epoch": 13.93, "learning_rate": 2.9118181818181813e-06, "loss": 0.442, "step": 16070 }, { "epoch": 13.93, "learning_rate": 2.911118881118881e-06, "loss": 0.3858, "step": 16080 }, { "epoch": 13.94, "learning_rate": 2.9104195804195803e-06, "loss": 0.4101, "step": 16090 }, { "epoch": 13.95, "learning_rate": 2.90972027972028e-06, "loss": 0.4026, "step": 16100 }, { "epoch": 13.96, "learning_rate": 2.909020979020979e-06, "loss": 0.3701, "step": 16110 }, { "epoch": 13.97, "learning_rate": 2.9083216783216784e-06, "loss": 0.4064, "step": 16120 }, { "epoch": 13.98, "learning_rate": 2.9076223776223774e-06, "loss": 0.4078, "step": 16130 }, { "epoch": 13.99, "learning_rate": 2.9069230769230765e-06, "loss": 0.3893, "step": 16140 }, { "epoch": 13.99, "learning_rate": 2.906223776223776e-06, "loss": 0.3558, "step": 16150 }, { "epoch": 14.0, "eval_loss": 0.5589486360549927, "eval_runtime": 132.8357, "eval_samples_per_second": 4.005, "eval_steps_per_second": 2.002, "eval_wer": 0.26380407533586164, "step": 16156 }, { "epoch": 14.0, "learning_rate": 2.9055244755244755e-06, "loss": 0.4281, "step": 16160 }, { "epoch": 14.01, "learning_rate": 2.904825174825175e-06, "loss": 0.4123, "step": 16170 }, { "epoch": 14.02, "learning_rate": 2.9041258741258737e-06, "loss": 0.3568, "step": 16180 }, { "epoch": 14.03, "learning_rate": 2.903426573426573e-06, "loss": 0.3891, "step": 16190 }, { "epoch": 14.04, "learning_rate": 2.9027272727272727e-06, "loss": 0.4301, "step": 16200 }, { "epoch": 14.05, "learning_rate": 2.902027972027972e-06, "loss": 0.4633, "step": 16210 }, { "epoch": 14.06, "learning_rate": 2.9013286713286712e-06, "loss": 0.3918, "step": 16220 }, { "epoch": 14.06, "learning_rate": 2.9006293706293707e-06, "loss": 0.3432, "step": 16230 }, { "epoch": 14.07, "learning_rate": 2.89993006993007e-06, "loss": 0.4055, "step": 16240 }, { "epoch": 14.08, "learning_rate": 2.899230769230769e-06, "loss": 0.3804, "step": 16250 }, { "epoch": 14.09, "learning_rate": 2.8985314685314684e-06, "loss": 0.4274, "step": 16260 }, { "epoch": 14.1, "learning_rate": 2.897832167832168e-06, "loss": 0.4067, "step": 16270 }, { "epoch": 14.11, "learning_rate": 2.8971328671328674e-06, "loss": 0.3626, "step": 16280 }, { "epoch": 14.12, "learning_rate": 2.896433566433566e-06, "loss": 0.3951, "step": 16290 }, { "epoch": 14.12, "learning_rate": 2.8957342657342655e-06, "loss": 0.401, "step": 16300 }, { "epoch": 14.13, "learning_rate": 2.895034965034965e-06, "loss": 0.4691, "step": 16310 }, { "epoch": 14.14, "learning_rate": 2.894335664335664e-06, "loss": 0.3822, "step": 16320 }, { "epoch": 14.15, "learning_rate": 2.8936363636363636e-06, "loss": 0.4677, "step": 16330 }, { "epoch": 14.16, "learning_rate": 2.8929370629370626e-06, "loss": 0.3749, "step": 16340 }, { "epoch": 14.17, "learning_rate": 2.892237762237762e-06, "loss": 0.3705, "step": 16350 }, { "epoch": 14.18, "learning_rate": 2.8915384615384612e-06, "loss": 0.4783, "step": 16360 }, { "epoch": 14.19, "learning_rate": 2.8908391608391607e-06, "loss": 0.4133, "step": 16370 }, { "epoch": 14.19, "learning_rate": 2.8901398601398602e-06, "loss": 0.4054, "step": 16380 }, { "epoch": 14.2, "learning_rate": 2.8894405594405593e-06, "loss": 0.4013, "step": 16390 }, { "epoch": 14.21, "learning_rate": 2.8887412587412584e-06, "loss": 0.4116, "step": 16400 }, { "epoch": 14.22, "learning_rate": 2.888041958041958e-06, "loss": 0.3836, "step": 16410 }, { "epoch": 14.23, "learning_rate": 2.8873426573426574e-06, "loss": 0.372, "step": 16420 }, { "epoch": 14.24, "learning_rate": 2.8866433566433564e-06, "loss": 0.3784, "step": 16430 }, { "epoch": 14.25, "learning_rate": 2.885944055944056e-06, "loss": 0.36, "step": 16440 }, { "epoch": 14.25, "learning_rate": 2.885244755244755e-06, "loss": 0.3712, "step": 16450 }, { "epoch": 14.26, "learning_rate": 2.8845454545454545e-06, "loss": 0.4185, "step": 16460 }, { "epoch": 14.27, "learning_rate": 2.8838461538461536e-06, "loss": 0.4046, "step": 16470 }, { "epoch": 14.28, "learning_rate": 2.883146853146853e-06, "loss": 0.3876, "step": 16480 }, { "epoch": 14.29, "learning_rate": 2.8824475524475526e-06, "loss": 0.4056, "step": 16490 }, { "epoch": 14.3, "learning_rate": 2.8817482517482516e-06, "loss": 0.3989, "step": 16500 }, { "epoch": 14.31, "learning_rate": 2.8810489510489507e-06, "loss": 0.3513, "step": 16510 }, { "epoch": 14.32, "learning_rate": 2.88034965034965e-06, "loss": 0.3871, "step": 16520 }, { "epoch": 14.32, "learning_rate": 2.8796503496503497e-06, "loss": 0.4363, "step": 16530 }, { "epoch": 14.33, "learning_rate": 2.8789510489510488e-06, "loss": 0.4149, "step": 16540 }, { "epoch": 14.34, "learning_rate": 2.8782517482517483e-06, "loss": 0.3772, "step": 16550 }, { "epoch": 14.35, "learning_rate": 2.8775524475524473e-06, "loss": 0.4088, "step": 16560 }, { "epoch": 14.36, "learning_rate": 2.8768531468531464e-06, "loss": 0.3692, "step": 16570 }, { "epoch": 14.37, "learning_rate": 2.876153846153846e-06, "loss": 0.4181, "step": 16580 }, { "epoch": 14.38, "learning_rate": 2.8754545454545454e-06, "loss": 0.4705, "step": 16590 }, { "epoch": 14.38, "learning_rate": 2.874755244755245e-06, "loss": 0.3912, "step": 16600 }, { "epoch": 14.39, "learning_rate": 2.8740559440559436e-06, "loss": 0.3983, "step": 16610 }, { "epoch": 14.4, "learning_rate": 2.873356643356643e-06, "loss": 0.4027, "step": 16620 }, { "epoch": 14.41, "learning_rate": 2.8726573426573426e-06, "loss": 0.3157, "step": 16630 }, { "epoch": 14.42, "learning_rate": 2.871958041958042e-06, "loss": 0.4119, "step": 16640 }, { "epoch": 14.43, "learning_rate": 2.871258741258741e-06, "loss": 0.3853, "step": 16650 }, { "epoch": 14.44, "learning_rate": 2.8705594405594406e-06, "loss": 0.3858, "step": 16660 }, { "epoch": 14.45, "learning_rate": 2.8698601398601397e-06, "loss": 0.3623, "step": 16670 }, { "epoch": 14.45, "learning_rate": 2.8691608391608388e-06, "loss": 0.3513, "step": 16680 }, { "epoch": 14.46, "learning_rate": 2.8684615384615383e-06, "loss": 0.3665, "step": 16690 }, { "epoch": 14.47, "learning_rate": 2.8677622377622378e-06, "loss": 0.3952, "step": 16700 }, { "epoch": 14.48, "learning_rate": 2.8670629370629373e-06, "loss": 0.4067, "step": 16710 }, { "epoch": 14.49, "learning_rate": 2.866363636363636e-06, "loss": 0.4177, "step": 16720 }, { "epoch": 14.5, "learning_rate": 2.8656643356643354e-06, "loss": 0.3951, "step": 16730 }, { "epoch": 14.51, "learning_rate": 2.864965034965035e-06, "loss": 0.4074, "step": 16740 }, { "epoch": 14.51, "learning_rate": 2.864265734265734e-06, "loss": 0.4256, "step": 16750 }, { "epoch": 14.52, "learning_rate": 2.8635664335664335e-06, "loss": 0.3896, "step": 16760 }, { "epoch": 14.53, "learning_rate": 2.862867132867133e-06, "loss": 0.4105, "step": 16770 }, { "epoch": 14.54, "learning_rate": 2.862167832167832e-06, "loss": 0.3995, "step": 16780 }, { "epoch": 14.55, "learning_rate": 2.861468531468531e-06, "loss": 0.4183, "step": 16790 }, { "epoch": 14.56, "learning_rate": 2.8607692307692306e-06, "loss": 0.4463, "step": 16800 }, { "epoch": 14.57, "learning_rate": 2.86006993006993e-06, "loss": 0.4485, "step": 16810 }, { "epoch": 14.58, "learning_rate": 2.8593706293706296e-06, "loss": 0.4317, "step": 16820 }, { "epoch": 14.58, "learning_rate": 2.8586713286713283e-06, "loss": 0.3431, "step": 16830 }, { "epoch": 14.59, "learning_rate": 2.8579720279720278e-06, "loss": 0.4122, "step": 16840 }, { "epoch": 14.6, "learning_rate": 2.8572727272727273e-06, "loss": 0.4, "step": 16850 }, { "epoch": 14.61, "learning_rate": 2.8565734265734263e-06, "loss": 0.3648, "step": 16860 }, { "epoch": 14.62, "learning_rate": 2.855874125874126e-06, "loss": 0.4101, "step": 16870 }, { "epoch": 14.63, "learning_rate": 2.8551748251748253e-06, "loss": 0.3953, "step": 16880 }, { "epoch": 14.64, "learning_rate": 2.8544755244755244e-06, "loss": 0.3571, "step": 16890 }, { "epoch": 14.64, "learning_rate": 2.8537762237762235e-06, "loss": 0.4135, "step": 16900 }, { "epoch": 14.65, "learning_rate": 2.853076923076923e-06, "loss": 0.3993, "step": 16910 }, { "epoch": 14.66, "learning_rate": 2.8523776223776225e-06, "loss": 0.4097, "step": 16920 }, { "epoch": 14.67, "learning_rate": 2.8516783216783215e-06, "loss": 0.4438, "step": 16930 }, { "epoch": 14.68, "learning_rate": 2.8509790209790206e-06, "loss": 0.4313, "step": 16940 }, { "epoch": 14.69, "learning_rate": 2.85027972027972e-06, "loss": 0.4028, "step": 16950 }, { "epoch": 14.7, "learning_rate": 2.8495804195804196e-06, "loss": 0.441, "step": 16960 }, { "epoch": 14.71, "learning_rate": 2.8488811188811187e-06, "loss": 0.4112, "step": 16970 }, { "epoch": 14.71, "learning_rate": 2.848181818181818e-06, "loss": 0.399, "step": 16980 }, { "epoch": 14.72, "learning_rate": 2.8474825174825172e-06, "loss": 0.3647, "step": 16990 }, { "epoch": 14.73, "learning_rate": 2.8467832167832167e-06, "loss": 0.3807, "step": 17000 }, { "epoch": 14.74, "learning_rate": 2.846083916083916e-06, "loss": 0.4839, "step": 17010 }, { "epoch": 14.75, "learning_rate": 2.8453846153846153e-06, "loss": 0.4013, "step": 17020 }, { "epoch": 14.76, "learning_rate": 2.844685314685315e-06, "loss": 0.3263, "step": 17030 }, { "epoch": 14.77, "learning_rate": 2.843986013986014e-06, "loss": 0.3927, "step": 17040 }, { "epoch": 14.77, "learning_rate": 2.843286713286713e-06, "loss": 0.3766, "step": 17050 }, { "epoch": 14.78, "learning_rate": 2.8425874125874125e-06, "loss": 0.4393, "step": 17060 }, { "epoch": 14.79, "learning_rate": 2.841888111888112e-06, "loss": 0.409, "step": 17070 }, { "epoch": 14.8, "learning_rate": 2.841188811188811e-06, "loss": 0.3585, "step": 17080 }, { "epoch": 14.81, "learning_rate": 2.8404895104895105e-06, "loss": 0.392, "step": 17090 }, { "epoch": 14.82, "learning_rate": 2.8397902097902096e-06, "loss": 0.417, "step": 17100 }, { "epoch": 14.83, "learning_rate": 2.8390909090909087e-06, "loss": 0.4063, "step": 17110 }, { "epoch": 14.83, "learning_rate": 2.838391608391608e-06, "loss": 0.3751, "step": 17120 }, { "epoch": 14.84, "learning_rate": 2.8376923076923077e-06, "loss": 0.3907, "step": 17130 }, { "epoch": 14.85, "learning_rate": 2.836993006993007e-06, "loss": 0.4433, "step": 17140 }, { "epoch": 14.86, "learning_rate": 2.836293706293706e-06, "loss": 0.4271, "step": 17150 }, { "epoch": 14.87, "learning_rate": 2.8355944055944053e-06, "loss": 0.4155, "step": 17160 }, { "epoch": 14.88, "learning_rate": 2.834895104895105e-06, "loss": 0.3911, "step": 17170 }, { "epoch": 14.89, "learning_rate": 2.8341958041958043e-06, "loss": 0.3268, "step": 17180 }, { "epoch": 14.9, "learning_rate": 2.8334965034965034e-06, "loss": 0.3477, "step": 17190 }, { "epoch": 14.9, "learning_rate": 2.832797202797203e-06, "loss": 0.4478, "step": 17200 }, { "epoch": 14.91, "learning_rate": 2.832097902097902e-06, "loss": 0.4441, "step": 17210 }, { "epoch": 14.92, "learning_rate": 2.831398601398601e-06, "loss": 0.4519, "step": 17220 }, { "epoch": 14.93, "learning_rate": 2.8306993006993005e-06, "loss": 0.4354, "step": 17230 }, { "epoch": 14.94, "learning_rate": 2.83e-06, "loss": 0.3698, "step": 17240 }, { "epoch": 14.95, "learning_rate": 2.8293006993006995e-06, "loss": 0.4287, "step": 17250 }, { "epoch": 14.96, "learning_rate": 2.828601398601398e-06, "loss": 0.4025, "step": 17260 }, { "epoch": 14.96, "learning_rate": 2.8279020979020977e-06, "loss": 0.4039, "step": 17270 }, { "epoch": 14.97, "learning_rate": 2.827202797202797e-06, "loss": 0.3422, "step": 17280 }, { "epoch": 14.98, "learning_rate": 2.8265034965034962e-06, "loss": 0.3912, "step": 17290 }, { "epoch": 14.99, "learning_rate": 2.8258041958041957e-06, "loss": 0.4358, "step": 17300 }, { "epoch": 15.0, "learning_rate": 2.8251048951048952e-06, "loss": 0.392, "step": 17310 }, { "epoch": 15.0, "eval_loss": 0.5580989122390747, "eval_runtime": 134.5878, "eval_samples_per_second": 3.953, "eval_steps_per_second": 1.976, "eval_wer": 0.2593044931542071, "step": 17310 }, { "epoch": 15.01, "learning_rate": 2.8244055944055943e-06, "loss": 0.4794, "step": 17320 }, { "epoch": 15.02, "learning_rate": 2.8237062937062934e-06, "loss": 0.3538, "step": 17330 }, { "epoch": 15.03, "learning_rate": 2.823006993006993e-06, "loss": 0.432, "step": 17340 }, { "epoch": 15.03, "learning_rate": 2.8223076923076924e-06, "loss": 0.3713, "step": 17350 }, { "epoch": 15.04, "learning_rate": 2.821608391608392e-06, "loss": 0.4383, "step": 17360 }, { "epoch": 15.05, "learning_rate": 2.8209090909090905e-06, "loss": 0.4064, "step": 17370 }, { "epoch": 15.06, "learning_rate": 2.82020979020979e-06, "loss": 0.4444, "step": 17380 }, { "epoch": 15.07, "learning_rate": 2.8195104895104895e-06, "loss": 0.383, "step": 17390 }, { "epoch": 15.08, "learning_rate": 2.8188111888111886e-06, "loss": 0.413, "step": 17400 }, { "epoch": 15.09, "learning_rate": 2.818111888111888e-06, "loss": 0.4161, "step": 17410 }, { "epoch": 15.1, "learning_rate": 2.8174125874125876e-06, "loss": 0.3648, "step": 17420 }, { "epoch": 15.1, "learning_rate": 2.8167132867132866e-06, "loss": 0.3707, "step": 17430 }, { "epoch": 15.11, "learning_rate": 2.8160139860139857e-06, "loss": 0.3794, "step": 17440 }, { "epoch": 15.12, "learning_rate": 2.815314685314685e-06, "loss": 0.4292, "step": 17450 }, { "epoch": 15.13, "learning_rate": 2.8146153846153847e-06, "loss": 0.468, "step": 17460 }, { "epoch": 15.14, "learning_rate": 2.8139160839160838e-06, "loss": 0.3645, "step": 17470 }, { "epoch": 15.15, "learning_rate": 2.813216783216783e-06, "loss": 0.4114, "step": 17480 }, { "epoch": 15.16, "learning_rate": 2.8125174825174824e-06, "loss": 0.4202, "step": 17490 }, { "epoch": 15.16, "learning_rate": 2.811818181818182e-06, "loss": 0.4196, "step": 17500 }, { "epoch": 15.17, "learning_rate": 2.811118881118881e-06, "loss": 0.3847, "step": 17510 }, { "epoch": 15.18, "learning_rate": 2.8104195804195804e-06, "loss": 0.4578, "step": 17520 }, { "epoch": 15.19, "learning_rate": 2.8097202797202795e-06, "loss": 0.3375, "step": 17530 }, { "epoch": 15.2, "learning_rate": 2.8090209790209786e-06, "loss": 0.3479, "step": 17540 }, { "epoch": 15.21, "learning_rate": 2.808321678321678e-06, "loss": 0.3807, "step": 17550 }, { "epoch": 15.22, "learning_rate": 2.8076223776223776e-06, "loss": 0.4187, "step": 17560 }, { "epoch": 15.23, "learning_rate": 2.806923076923077e-06, "loss": 0.3555, "step": 17570 }, { "epoch": 15.23, "learning_rate": 2.806223776223776e-06, "loss": 0.403, "step": 17580 }, { "epoch": 15.24, "learning_rate": 2.805524475524475e-06, "loss": 0.3263, "step": 17590 }, { "epoch": 15.25, "learning_rate": 2.8048251748251747e-06, "loss": 0.3526, "step": 17600 }, { "epoch": 15.26, "learning_rate": 2.804125874125874e-06, "loss": 0.3838, "step": 17610 }, { "epoch": 15.27, "learning_rate": 2.8034265734265733e-06, "loss": 0.4049, "step": 17620 }, { "epoch": 15.28, "learning_rate": 2.8027272727272728e-06, "loss": 0.4254, "step": 17630 }, { "epoch": 15.29, "learning_rate": 2.802027972027972e-06, "loss": 0.3857, "step": 17640 }, { "epoch": 15.29, "learning_rate": 2.801328671328671e-06, "loss": 0.3738, "step": 17650 }, { "epoch": 15.3, "learning_rate": 2.8006293706293704e-06, "loss": 0.389, "step": 17660 }, { "epoch": 15.31, "learning_rate": 2.79993006993007e-06, "loss": 0.4428, "step": 17670 }, { "epoch": 15.32, "learning_rate": 2.7992307692307694e-06, "loss": 0.36, "step": 17680 }, { "epoch": 15.33, "learning_rate": 2.798531468531468e-06, "loss": 0.3858, "step": 17690 }, { "epoch": 15.34, "learning_rate": 2.7978321678321676e-06, "loss": 0.4003, "step": 17700 }, { "epoch": 15.35, "learning_rate": 2.797132867132867e-06, "loss": 0.4563, "step": 17710 }, { "epoch": 15.36, "learning_rate": 2.796433566433566e-06, "loss": 0.3905, "step": 17720 }, { "epoch": 15.36, "learning_rate": 2.7957342657342656e-06, "loss": 0.3633, "step": 17730 }, { "epoch": 15.37, "learning_rate": 2.795034965034965e-06, "loss": 0.3883, "step": 17740 }, { "epoch": 15.38, "learning_rate": 2.794335664335664e-06, "loss": 0.3688, "step": 17750 }, { "epoch": 15.39, "learning_rate": 2.7936363636363633e-06, "loss": 0.4025, "step": 17760 }, { "epoch": 15.4, "learning_rate": 2.7929370629370628e-06, "loss": 0.3778, "step": 17770 }, { "epoch": 15.41, "learning_rate": 2.7922377622377623e-06, "loss": 0.4241, "step": 17780 }, { "epoch": 15.42, "learning_rate": 2.7915384615384618e-06, "loss": 0.3872, "step": 17790 }, { "epoch": 15.42, "learning_rate": 2.7908391608391604e-06, "loss": 0.3909, "step": 17800 }, { "epoch": 15.43, "learning_rate": 2.79013986013986e-06, "loss": 0.3407, "step": 17810 }, { "epoch": 15.44, "learning_rate": 2.7894405594405594e-06, "loss": 0.3655, "step": 17820 }, { "epoch": 15.45, "learning_rate": 2.7887412587412585e-06, "loss": 0.3589, "step": 17830 }, { "epoch": 15.46, "learning_rate": 2.788041958041958e-06, "loss": 0.4076, "step": 17840 }, { "epoch": 15.47, "learning_rate": 2.7873426573426575e-06, "loss": 0.4224, "step": 17850 }, { "epoch": 15.48, "learning_rate": 2.7866433566433565e-06, "loss": 0.3787, "step": 17860 }, { "epoch": 15.49, "learning_rate": 2.7859440559440556e-06, "loss": 0.4452, "step": 17870 }, { "epoch": 15.49, "learning_rate": 2.785244755244755e-06, "loss": 0.37, "step": 17880 }, { "epoch": 15.5, "learning_rate": 2.7845454545454546e-06, "loss": 0.3824, "step": 17890 }, { "epoch": 15.51, "learning_rate": 2.7838461538461537e-06, "loss": 0.3833, "step": 17900 }, { "epoch": 15.52, "learning_rate": 2.7831468531468528e-06, "loss": 0.4135, "step": 17910 }, { "epoch": 15.53, "learning_rate": 2.7824475524475522e-06, "loss": 0.4404, "step": 17920 }, { "epoch": 15.54, "learning_rate": 2.7817482517482517e-06, "loss": 0.362, "step": 17930 }, { "epoch": 15.55, "learning_rate": 2.781048951048951e-06, "loss": 0.421, "step": 17940 }, { "epoch": 15.55, "learning_rate": 2.7803496503496503e-06, "loss": 0.4144, "step": 17950 }, { "epoch": 15.56, "learning_rate": 2.77965034965035e-06, "loss": 0.4041, "step": 17960 }, { "epoch": 15.57, "learning_rate": 2.778951048951049e-06, "loss": 0.3806, "step": 17970 }, { "epoch": 15.58, "learning_rate": 2.778251748251748e-06, "loss": 0.4288, "step": 17980 }, { "epoch": 15.59, "learning_rate": 2.7775524475524475e-06, "loss": 0.3813, "step": 17990 }, { "epoch": 15.6, "learning_rate": 2.776853146853147e-06, "loss": 0.3247, "step": 18000 }, { "epoch": 15.61, "learning_rate": 2.776153846153846e-06, "loss": 0.3454, "step": 18010 }, { "epoch": 15.61, "learning_rate": 2.775454545454545e-06, "loss": 0.3573, "step": 18020 }, { "epoch": 15.62, "learning_rate": 2.7747552447552446e-06, "loss": 0.4104, "step": 18030 }, { "epoch": 15.63, "learning_rate": 2.774055944055944e-06, "loss": 0.36, "step": 18040 }, { "epoch": 15.64, "learning_rate": 2.773356643356643e-06, "loss": 0.3871, "step": 18050 }, { "epoch": 15.65, "learning_rate": 2.7726573426573427e-06, "loss": 0.3662, "step": 18060 }, { "epoch": 15.66, "learning_rate": 2.7719580419580417e-06, "loss": 0.3593, "step": 18070 }, { "epoch": 15.67, "learning_rate": 2.771258741258741e-06, "loss": 0.3884, "step": 18080 }, { "epoch": 15.68, "learning_rate": 2.7705594405594403e-06, "loss": 0.3671, "step": 18090 }, { "epoch": 15.68, "learning_rate": 2.76986013986014e-06, "loss": 0.3949, "step": 18100 }, { "epoch": 15.69, "learning_rate": 2.7691608391608393e-06, "loss": 0.3839, "step": 18110 }, { "epoch": 15.7, "learning_rate": 2.7684615384615384e-06, "loss": 0.4158, "step": 18120 }, { "epoch": 15.71, "learning_rate": 2.7677622377622374e-06, "loss": 0.3239, "step": 18130 }, { "epoch": 15.72, "learning_rate": 2.767062937062937e-06, "loss": 0.3464, "step": 18140 }, { "epoch": 15.73, "learning_rate": 2.7663636363636364e-06, "loss": 0.3884, "step": 18150 }, { "epoch": 15.74, "learning_rate": 2.7656643356643355e-06, "loss": 0.4807, "step": 18160 }, { "epoch": 15.74, "learning_rate": 2.764965034965035e-06, "loss": 0.3784, "step": 18170 }, { "epoch": 15.75, "learning_rate": 2.764265734265734e-06, "loss": 0.3405, "step": 18180 }, { "epoch": 15.76, "learning_rate": 2.763566433566433e-06, "loss": 0.4299, "step": 18190 }, { "epoch": 15.77, "learning_rate": 2.7628671328671327e-06, "loss": 0.4014, "step": 18200 }, { "epoch": 15.78, "learning_rate": 2.762167832167832e-06, "loss": 0.4313, "step": 18210 }, { "epoch": 15.79, "learning_rate": 2.7614685314685317e-06, "loss": 0.4522, "step": 18220 }, { "epoch": 15.8, "learning_rate": 2.7607692307692307e-06, "loss": 0.4019, "step": 18230 }, { "epoch": 15.81, "learning_rate": 2.76006993006993e-06, "loss": 0.4175, "step": 18240 }, { "epoch": 15.81, "learning_rate": 2.7593706293706293e-06, "loss": 0.3939, "step": 18250 }, { "epoch": 15.82, "learning_rate": 2.7586713286713284e-06, "loss": 0.4423, "step": 18260 }, { "epoch": 15.83, "learning_rate": 2.757972027972028e-06, "loss": 0.414, "step": 18270 }, { "epoch": 15.84, "learning_rate": 2.7572727272727274e-06, "loss": 0.3687, "step": 18280 }, { "epoch": 15.85, "learning_rate": 2.7565734265734264e-06, "loss": 0.3526, "step": 18290 }, { "epoch": 15.86, "learning_rate": 2.7558741258741255e-06, "loss": 0.389, "step": 18300 }, { "epoch": 15.87, "learning_rate": 2.755174825174825e-06, "loss": 0.4634, "step": 18310 }, { "epoch": 15.87, "learning_rate": 2.7544755244755245e-06, "loss": 0.3854, "step": 18320 }, { "epoch": 15.88, "learning_rate": 2.7538461538461535e-06, "loss": 0.4101, "step": 18330 }, { "epoch": 15.89, "learning_rate": 2.753146853146853e-06, "loss": 0.4215, "step": 18340 }, { "epoch": 15.9, "learning_rate": 2.752447552447552e-06, "loss": 0.4324, "step": 18350 }, { "epoch": 15.91, "learning_rate": 2.7517482517482516e-06, "loss": 0.3848, "step": 18360 }, { "epoch": 15.92, "learning_rate": 2.751048951048951e-06, "loss": 0.3643, "step": 18370 }, { "epoch": 15.93, "learning_rate": 2.75034965034965e-06, "loss": 0.4236, "step": 18380 }, { "epoch": 15.94, "learning_rate": 2.7496503496503493e-06, "loss": 0.3534, "step": 18390 }, { "epoch": 15.94, "learning_rate": 2.7489510489510488e-06, "loss": 0.4274, "step": 18400 }, { "epoch": 15.95, "learning_rate": 2.7482517482517482e-06, "loss": 0.4021, "step": 18410 }, { "epoch": 15.96, "learning_rate": 2.7476223776223773e-06, "loss": 0.3989, "step": 18420 }, { "epoch": 15.97, "learning_rate": 2.7469230769230768e-06, "loss": 0.3813, "step": 18430 }, { "epoch": 15.98, "learning_rate": 2.746223776223776e-06, "loss": 0.382, "step": 18440 }, { "epoch": 15.99, "learning_rate": 2.7455244755244754e-06, "loss": 0.4029, "step": 18450 }, { "epoch": 16.0, "learning_rate": 2.744825174825175e-06, "loss": 0.401, "step": 18460 }, { "epoch": 16.0, "eval_loss": 0.5527588725090027, "eval_runtime": 134.4619, "eval_samples_per_second": 3.957, "eval_steps_per_second": 1.978, "eval_wer": 0.25660474384521437, "step": 18464 }, { "epoch": 16.01, "learning_rate": 2.7441258741258743e-06, "loss": 0.3866, "step": 18470 }, { "epoch": 16.01, "learning_rate": 2.743426573426573e-06, "loss": 0.408, "step": 18480 }, { "epoch": 16.02, "learning_rate": 2.7427272727272725e-06, "loss": 0.3622, "step": 18490 }, { "epoch": 16.03, "learning_rate": 2.742027972027972e-06, "loss": 0.3686, "step": 18500 }, { "epoch": 16.04, "learning_rate": 2.7413286713286715e-06, "loss": 0.451, "step": 18510 }, { "epoch": 16.05, "learning_rate": 2.7406293706293706e-06, "loss": 0.3892, "step": 18520 }, { "epoch": 16.06, "learning_rate": 2.7399300699300696e-06, "loss": 0.3524, "step": 18530 }, { "epoch": 16.07, "learning_rate": 2.739230769230769e-06, "loss": 0.4344, "step": 18540 }, { "epoch": 16.07, "learning_rate": 2.738531468531468e-06, "loss": 0.3783, "step": 18550 }, { "epoch": 16.08, "learning_rate": 2.7378321678321677e-06, "loss": 0.3873, "step": 18560 }, { "epoch": 16.09, "learning_rate": 2.737132867132867e-06, "loss": 0.3959, "step": 18570 }, { "epoch": 16.1, "learning_rate": 2.7364335664335667e-06, "loss": 0.4067, "step": 18580 }, { "epoch": 16.11, "learning_rate": 2.7357342657342653e-06, "loss": 0.3906, "step": 18590 }, { "epoch": 16.12, "learning_rate": 2.735034965034965e-06, "loss": 0.4194, "step": 18600 }, { "epoch": 16.13, "learning_rate": 2.7343356643356643e-06, "loss": 0.4019, "step": 18610 }, { "epoch": 16.14, "learning_rate": 2.7336363636363634e-06, "loss": 0.4133, "step": 18620 }, { "epoch": 16.14, "learning_rate": 2.732937062937063e-06, "loss": 0.3734, "step": 18630 }, { "epoch": 16.15, "learning_rate": 2.732237762237762e-06, "loss": 0.3443, "step": 18640 }, { "epoch": 16.16, "learning_rate": 2.7315384615384615e-06, "loss": 0.4262, "step": 18650 }, { "epoch": 16.17, "learning_rate": 2.7308391608391606e-06, "loss": 0.4021, "step": 18660 }, { "epoch": 16.18, "learning_rate": 2.73013986013986e-06, "loss": 0.3941, "step": 18670 }, { "epoch": 16.19, "learning_rate": 2.7294405594405595e-06, "loss": 0.4043, "step": 18680 }, { "epoch": 16.2, "learning_rate": 2.7287412587412586e-06, "loss": 0.3946, "step": 18690 }, { "epoch": 16.2, "learning_rate": 2.7280419580419577e-06, "loss": 0.3554, "step": 18700 }, { "epoch": 16.21, "learning_rate": 2.727342657342657e-06, "loss": 0.3961, "step": 18710 }, { "epoch": 16.22, "learning_rate": 2.7266433566433567e-06, "loss": 0.4002, "step": 18720 }, { "epoch": 16.23, "learning_rate": 2.7259440559440558e-06, "loss": 0.3996, "step": 18730 }, { "epoch": 16.24, "learning_rate": 2.7252447552447553e-06, "loss": 0.3419, "step": 18740 }, { "epoch": 16.25, "learning_rate": 2.7245454545454543e-06, "loss": 0.3855, "step": 18750 }, { "epoch": 16.26, "learning_rate": 2.723846153846154e-06, "loss": 0.454, "step": 18760 }, { "epoch": 16.27, "learning_rate": 2.723146853146853e-06, "loss": 0.3747, "step": 18770 }, { "epoch": 16.27, "learning_rate": 2.7224475524475524e-06, "loss": 0.366, "step": 18780 }, { "epoch": 16.28, "learning_rate": 2.721748251748252e-06, "loss": 0.4218, "step": 18790 }, { "epoch": 16.29, "learning_rate": 2.7210489510489505e-06, "loss": 0.3791, "step": 18800 }, { "epoch": 16.3, "learning_rate": 2.72034965034965e-06, "loss": 0.4636, "step": 18810 }, { "epoch": 16.31, "learning_rate": 2.7196503496503495e-06, "loss": 0.3836, "step": 18820 }, { "epoch": 16.32, "learning_rate": 2.718951048951049e-06, "loss": 0.4457, "step": 18830 }, { "epoch": 16.33, "learning_rate": 2.718251748251748e-06, "loss": 0.3602, "step": 18840 }, { "epoch": 16.33, "learning_rate": 2.717552447552447e-06, "loss": 0.4125, "step": 18850 }, { "epoch": 16.34, "learning_rate": 2.7168531468531467e-06, "loss": 0.4183, "step": 18860 }, { "epoch": 16.35, "learning_rate": 2.716153846153846e-06, "loss": 0.3852, "step": 18870 }, { "epoch": 16.36, "learning_rate": 2.7154545454545453e-06, "loss": 0.427, "step": 18880 }, { "epoch": 16.37, "learning_rate": 2.7147552447552447e-06, "loss": 0.3541, "step": 18890 }, { "epoch": 16.38, "learning_rate": 2.7140559440559442e-06, "loss": 0.3876, "step": 18900 }, { "epoch": 16.39, "learning_rate": 2.713356643356643e-06, "loss": 0.4169, "step": 18910 }, { "epoch": 16.39, "learning_rate": 2.7126573426573424e-06, "loss": 0.3701, "step": 18920 }, { "epoch": 16.4, "learning_rate": 2.711958041958042e-06, "loss": 0.418, "step": 18930 }, { "epoch": 16.41, "learning_rate": 2.7112587412587414e-06, "loss": 0.3641, "step": 18940 }, { "epoch": 16.42, "learning_rate": 2.7105594405594405e-06, "loss": 0.3692, "step": 18950 }, { "epoch": 16.43, "learning_rate": 2.7098601398601395e-06, "loss": 0.4281, "step": 18960 }, { "epoch": 16.44, "learning_rate": 2.709160839160839e-06, "loss": 0.3755, "step": 18970 }, { "epoch": 16.45, "learning_rate": 2.708461538461538e-06, "loss": 0.3857, "step": 18980 }, { "epoch": 16.46, "learning_rate": 2.7077622377622376e-06, "loss": 0.4253, "step": 18990 }, { "epoch": 16.46, "learning_rate": 2.707062937062937e-06, "loss": 0.3912, "step": 19000 }, { "epoch": 16.47, "learning_rate": 2.7063636363636366e-06, "loss": 0.429, "step": 19010 }, { "epoch": 16.48, "learning_rate": 2.7056643356643352e-06, "loss": 0.4558, "step": 19020 }, { "epoch": 16.49, "learning_rate": 2.7049650349650347e-06, "loss": 0.4172, "step": 19030 }, { "epoch": 16.5, "learning_rate": 2.7042657342657342e-06, "loss": 0.4004, "step": 19040 }, { "epoch": 16.51, "learning_rate": 2.7035664335664337e-06, "loss": 0.4207, "step": 19050 }, { "epoch": 16.52, "learning_rate": 2.702867132867133e-06, "loss": 0.4373, "step": 19060 }, { "epoch": 16.52, "learning_rate": 2.702167832167832e-06, "loss": 0.4508, "step": 19070 }, { "epoch": 16.53, "learning_rate": 2.7014685314685314e-06, "loss": 0.4109, "step": 19080 }, { "epoch": 16.54, "learning_rate": 2.7007692307692305e-06, "loss": 0.4186, "step": 19090 }, { "epoch": 16.55, "learning_rate": 2.70006993006993e-06, "loss": 0.3652, "step": 19100 }, { "epoch": 16.56, "learning_rate": 2.6993706293706294e-06, "loss": 0.4016, "step": 19110 }, { "epoch": 16.57, "learning_rate": 2.698671328671329e-06, "loss": 0.4264, "step": 19120 }, { "epoch": 16.58, "learning_rate": 2.6979720279720276e-06, "loss": 0.3732, "step": 19130 }, { "epoch": 16.59, "learning_rate": 2.697272727272727e-06, "loss": 0.3571, "step": 19140 }, { "epoch": 16.59, "learning_rate": 2.6965734265734266e-06, "loss": 0.4206, "step": 19150 }, { "epoch": 16.6, "learning_rate": 2.6958741258741257e-06, "loss": 0.3823, "step": 19160 }, { "epoch": 16.61, "learning_rate": 2.695174825174825e-06, "loss": 0.3829, "step": 19170 }, { "epoch": 16.62, "learning_rate": 2.6944755244755242e-06, "loss": 0.392, "step": 19180 }, { "epoch": 16.63, "learning_rate": 2.6937762237762237e-06, "loss": 0.3682, "step": 19190 }, { "epoch": 16.64, "learning_rate": 2.693076923076923e-06, "loss": 0.4124, "step": 19200 }, { "epoch": 16.65, "learning_rate": 2.6923776223776223e-06, "loss": 0.3521, "step": 19210 }, { "epoch": 16.65, "learning_rate": 2.691678321678322e-06, "loss": 0.3398, "step": 19220 }, { "epoch": 16.66, "learning_rate": 2.690979020979021e-06, "loss": 0.3953, "step": 19230 }, { "epoch": 16.67, "learning_rate": 2.69027972027972e-06, "loss": 0.3081, "step": 19240 }, { "epoch": 16.68, "learning_rate": 2.6895804195804194e-06, "loss": 0.3745, "step": 19250 }, { "epoch": 16.69, "learning_rate": 2.688881118881119e-06, "loss": 0.3325, "step": 19260 }, { "epoch": 16.7, "learning_rate": 2.688181818181818e-06, "loss": 0.3733, "step": 19270 }, { "epoch": 16.71, "learning_rate": 2.6874825174825175e-06, "loss": 0.5077, "step": 19280 }, { "epoch": 16.72, "learning_rate": 2.6867832167832166e-06, "loss": 0.384, "step": 19290 }, { "epoch": 16.72, "learning_rate": 2.686083916083916e-06, "loss": 0.3758, "step": 19300 }, { "epoch": 16.73, "learning_rate": 2.685384615384615e-06, "loss": 0.359, "step": 19310 }, { "epoch": 16.74, "learning_rate": 2.6846853146853146e-06, "loss": 0.4364, "step": 19320 }, { "epoch": 16.75, "learning_rate": 2.683986013986014e-06, "loss": 0.4155, "step": 19330 }, { "epoch": 16.76, "learning_rate": 2.683286713286713e-06, "loss": 0.3362, "step": 19340 }, { "epoch": 16.77, "learning_rate": 2.6825874125874123e-06, "loss": 0.3266, "step": 19350 }, { "epoch": 16.78, "learning_rate": 2.6818881118881118e-06, "loss": 0.396, "step": 19360 }, { "epoch": 16.78, "learning_rate": 2.6811888111888113e-06, "loss": 0.4046, "step": 19370 }, { "epoch": 16.79, "learning_rate": 2.6804895104895104e-06, "loss": 0.3826, "step": 19380 }, { "epoch": 16.8, "learning_rate": 2.67979020979021e-06, "loss": 0.4214, "step": 19390 }, { "epoch": 16.81, "learning_rate": 2.679090909090909e-06, "loss": 0.4371, "step": 19400 }, { "epoch": 16.82, "learning_rate": 2.678391608391608e-06, "loss": 0.4201, "step": 19410 }, { "epoch": 16.83, "learning_rate": 2.6776923076923075e-06, "loss": 0.4438, "step": 19420 }, { "epoch": 16.84, "learning_rate": 2.676993006993007e-06, "loss": 0.404, "step": 19430 }, { "epoch": 16.85, "learning_rate": 2.6762937062937065e-06, "loss": 0.3562, "step": 19440 }, { "epoch": 16.85, "learning_rate": 2.675594405594405e-06, "loss": 0.4756, "step": 19450 }, { "epoch": 16.86, "learning_rate": 2.6748951048951046e-06, "loss": 0.407, "step": 19460 }, { "epoch": 16.87, "learning_rate": 2.674195804195804e-06, "loss": 0.4391, "step": 19470 }, { "epoch": 16.88, "learning_rate": 2.6734965034965036e-06, "loss": 0.3603, "step": 19480 }, { "epoch": 16.89, "learning_rate": 2.6727972027972027e-06, "loss": 0.3468, "step": 19490 }, { "epoch": 16.9, "learning_rate": 2.6720979020979018e-06, "loss": 0.3874, "step": 19500 }, { "epoch": 16.91, "learning_rate": 2.6713986013986013e-06, "loss": 0.4372, "step": 19510 }, { "epoch": 16.91, "learning_rate": 2.6706993006993004e-06, "loss": 0.3371, "step": 19520 }, { "epoch": 16.92, "learning_rate": 2.67e-06, "loss": 0.351, "step": 19530 }, { "epoch": 16.93, "learning_rate": 2.6693006993006993e-06, "loss": 0.3351, "step": 19540 }, { "epoch": 16.94, "learning_rate": 2.668601398601399e-06, "loss": 0.3939, "step": 19550 }, { "epoch": 16.95, "learning_rate": 2.6679020979020975e-06, "loss": 0.3767, "step": 19560 }, { "epoch": 16.96, "learning_rate": 2.667202797202797e-06, "loss": 0.4356, "step": 19570 }, { "epoch": 16.97, "learning_rate": 2.6665034965034965e-06, "loss": 0.4077, "step": 19580 }, { "epoch": 16.98, "learning_rate": 2.6658041958041956e-06, "loss": 0.3415, "step": 19590 }, { "epoch": 16.98, "learning_rate": 2.665104895104895e-06, "loss": 0.3812, "step": 19600 }, { "epoch": 16.99, "learning_rate": 2.664405594405594e-06, "loss": 0.4391, "step": 19610 }, { "epoch": 17.0, "eval_loss": 0.5583595633506775, "eval_runtime": 135.8775, "eval_samples_per_second": 3.915, "eval_steps_per_second": 1.958, "eval_wer": 0.25544770842707465, "step": 19618 }, { "epoch": 17.0, "learning_rate": 2.6637062937062936e-06, "loss": 0.4462, "step": 19620 }, { "epoch": 17.01, "learning_rate": 2.6630069930069927e-06, "loss": 0.4311, "step": 19630 }, { "epoch": 17.02, "learning_rate": 2.662307692307692e-06, "loss": 0.3632, "step": 19640 }, { "epoch": 17.03, "learning_rate": 2.6616083916083917e-06, "loss": 0.3747, "step": 19650 }, { "epoch": 17.04, "learning_rate": 2.660909090909091e-06, "loss": 0.3097, "step": 19660 }, { "epoch": 17.05, "learning_rate": 2.66020979020979e-06, "loss": 0.4059, "step": 19670 }, { "epoch": 17.05, "learning_rate": 2.6595104895104893e-06, "loss": 0.3929, "step": 19680 }, { "epoch": 17.06, "learning_rate": 2.658811188811189e-06, "loss": 0.4335, "step": 19690 }, { "epoch": 17.07, "learning_rate": 2.658111888111888e-06, "loss": 0.3721, "step": 19700 }, { "epoch": 17.08, "learning_rate": 2.6574125874125874e-06, "loss": 0.3538, "step": 19710 }, { "epoch": 17.09, "learning_rate": 2.6567132867132865e-06, "loss": 0.3729, "step": 19720 }, { "epoch": 17.1, "learning_rate": 2.656013986013986e-06, "loss": 0.413, "step": 19730 }, { "epoch": 17.11, "learning_rate": 2.655314685314685e-06, "loss": 0.3944, "step": 19740 }, { "epoch": 17.11, "learning_rate": 2.6546153846153845e-06, "loss": 0.3932, "step": 19750 }, { "epoch": 17.12, "learning_rate": 2.653916083916084e-06, "loss": 0.3938, "step": 19760 }, { "epoch": 17.13, "learning_rate": 2.6532167832167827e-06, "loss": 0.3072, "step": 19770 }, { "epoch": 17.14, "learning_rate": 2.652517482517482e-06, "loss": 0.3738, "step": 19780 }, { "epoch": 17.15, "learning_rate": 2.6518181818181817e-06, "loss": 0.3518, "step": 19790 }, { "epoch": 17.16, "learning_rate": 2.651118881118881e-06, "loss": 0.3591, "step": 19800 }, { "epoch": 17.17, "learning_rate": 2.6504195804195803e-06, "loss": 0.4291, "step": 19810 }, { "epoch": 17.17, "learning_rate": 2.6497202797202798e-06, "loss": 0.4052, "step": 19820 }, { "epoch": 17.18, "learning_rate": 2.649020979020979e-06, "loss": 0.3796, "step": 19830 }, { "epoch": 17.19, "learning_rate": 2.6483216783216783e-06, "loss": 0.3255, "step": 19840 }, { "epoch": 17.2, "learning_rate": 2.6476223776223774e-06, "loss": 0.3811, "step": 19850 }, { "epoch": 17.21, "learning_rate": 2.646923076923077e-06, "loss": 0.4578, "step": 19860 }, { "epoch": 17.22, "learning_rate": 2.6462237762237764e-06, "loss": 0.4539, "step": 19870 }, { "epoch": 17.23, "learning_rate": 2.645524475524475e-06, "loss": 0.3946, "step": 19880 }, { "epoch": 17.24, "learning_rate": 2.6448251748251745e-06, "loss": 0.4328, "step": 19890 }, { "epoch": 17.24, "learning_rate": 2.644125874125874e-06, "loss": 0.4009, "step": 19900 }, { "epoch": 17.25, "learning_rate": 2.6434265734265735e-06, "loss": 0.373, "step": 19910 }, { "epoch": 17.26, "learning_rate": 2.6427272727272726e-06, "loss": 0.3561, "step": 19920 }, { "epoch": 17.27, "learning_rate": 2.642027972027972e-06, "loss": 0.3972, "step": 19930 }, { "epoch": 17.28, "learning_rate": 2.641328671328671e-06, "loss": 0.3716, "step": 19940 }, { "epoch": 17.29, "learning_rate": 2.6406293706293702e-06, "loss": 0.3482, "step": 19950 }, { "epoch": 17.3, "learning_rate": 2.6399300699300697e-06, "loss": 0.3972, "step": 19960 }, { "epoch": 17.3, "learning_rate": 2.6392307692307692e-06, "loss": 0.4394, "step": 19970 }, { "epoch": 17.31, "learning_rate": 2.6385314685314687e-06, "loss": 0.4083, "step": 19980 }, { "epoch": 17.32, "learning_rate": 2.6378321678321674e-06, "loss": 0.3908, "step": 19990 }, { "epoch": 17.33, "learning_rate": 2.637132867132867e-06, "loss": 0.4101, "step": 20000 }, { "epoch": 17.34, "learning_rate": 2.6364335664335664e-06, "loss": 0.3879, "step": 20010 }, { "epoch": 17.35, "learning_rate": 2.635734265734266e-06, "loss": 0.4163, "step": 20020 }, { "epoch": 17.36, "learning_rate": 2.635034965034965e-06, "loss": 0.3777, "step": 20030 }, { "epoch": 17.37, "learning_rate": 2.634335664335664e-06, "loss": 0.3931, "step": 20040 }, { "epoch": 17.37, "learning_rate": 2.6336363636363635e-06, "loss": 0.374, "step": 20050 }, { "epoch": 17.38, "learning_rate": 2.6329370629370626e-06, "loss": 0.4067, "step": 20060 }, { "epoch": 17.39, "learning_rate": 2.632237762237762e-06, "loss": 0.3838, "step": 20070 }, { "epoch": 17.4, "learning_rate": 2.6315384615384616e-06, "loss": 0.4246, "step": 20080 }, { "epoch": 17.41, "learning_rate": 2.630839160839161e-06, "loss": 0.395, "step": 20090 }, { "epoch": 17.42, "learning_rate": 2.6301398601398597e-06, "loss": 0.3462, "step": 20100 }, { "epoch": 17.43, "learning_rate": 2.6294405594405592e-06, "loss": 0.4599, "step": 20110 }, { "epoch": 17.43, "learning_rate": 2.6287412587412587e-06, "loss": 0.3861, "step": 20120 }, { "epoch": 17.44, "learning_rate": 2.628041958041958e-06, "loss": 0.3687, "step": 20130 }, { "epoch": 17.45, "learning_rate": 2.6273426573426573e-06, "loss": 0.4269, "step": 20140 }, { "epoch": 17.46, "learning_rate": 2.6266433566433564e-06, "loss": 0.4417, "step": 20150 }, { "epoch": 17.47, "learning_rate": 2.625944055944056e-06, "loss": 0.4375, "step": 20160 }, { "epoch": 17.48, "learning_rate": 2.625244755244755e-06, "loss": 0.3211, "step": 20170 }, { "epoch": 17.49, "learning_rate": 2.6245454545454544e-06, "loss": 0.3927, "step": 20180 }, { "epoch": 17.5, "learning_rate": 2.623846153846154e-06, "loss": 0.3841, "step": 20190 }, { "epoch": 17.5, "learning_rate": 2.6231468531468534e-06, "loss": 0.3553, "step": 20200 }, { "epoch": 17.51, "learning_rate": 2.622447552447552e-06, "loss": 0.4109, "step": 20210 }, { "epoch": 17.52, "learning_rate": 2.6217482517482516e-06, "loss": 0.4795, "step": 20220 }, { "epoch": 17.53, "learning_rate": 2.621048951048951e-06, "loss": 0.3969, "step": 20230 }, { "epoch": 17.54, "learning_rate": 2.62034965034965e-06, "loss": 0.3544, "step": 20240 }, { "epoch": 17.55, "learning_rate": 2.6196503496503497e-06, "loss": 0.4274, "step": 20250 }, { "epoch": 17.56, "learning_rate": 2.6189510489510487e-06, "loss": 0.4053, "step": 20260 }, { "epoch": 17.56, "learning_rate": 2.6182517482517482e-06, "loss": 0.4198, "step": 20270 }, { "epoch": 17.57, "learning_rate": 2.6175524475524473e-06, "loss": 0.4458, "step": 20280 }, { "epoch": 17.58, "learning_rate": 2.616853146853147e-06, "loss": 0.3737, "step": 20290 }, { "epoch": 17.59, "learning_rate": 2.6161538461538463e-06, "loss": 0.385, "step": 20300 }, { "epoch": 17.6, "learning_rate": 2.615454545454545e-06, "loss": 0.3633, "step": 20310 }, { "epoch": 17.61, "learning_rate": 2.6147552447552444e-06, "loss": 0.3667, "step": 20320 }, { "epoch": 17.62, "learning_rate": 2.614055944055944e-06, "loss": 0.3878, "step": 20330 }, { "epoch": 17.63, "learning_rate": 2.6133566433566434e-06, "loss": 0.3853, "step": 20340 }, { "epoch": 17.63, "learning_rate": 2.6126573426573425e-06, "loss": 0.3476, "step": 20350 }, { "epoch": 17.64, "learning_rate": 2.611958041958042e-06, "loss": 0.3953, "step": 20360 }, { "epoch": 17.65, "learning_rate": 2.611258741258741e-06, "loss": 0.4068, "step": 20370 }, { "epoch": 17.66, "learning_rate": 2.6105594405594406e-06, "loss": 0.4064, "step": 20380 }, { "epoch": 17.67, "learning_rate": 2.6098601398601396e-06, "loss": 0.3617, "step": 20390 }, { "epoch": 17.68, "learning_rate": 2.609160839160839e-06, "loss": 0.376, "step": 20400 }, { "epoch": 17.69, "learning_rate": 2.6084615384615386e-06, "loss": 0.4201, "step": 20410 }, { "epoch": 17.69, "learning_rate": 2.6077622377622373e-06, "loss": 0.4321, "step": 20420 }, { "epoch": 17.7, "learning_rate": 2.6070629370629368e-06, "loss": 0.3209, "step": 20430 }, { "epoch": 17.71, "learning_rate": 2.6063636363636363e-06, "loss": 0.3947, "step": 20440 }, { "epoch": 17.72, "learning_rate": 2.6056643356643358e-06, "loss": 0.4086, "step": 20450 }, { "epoch": 17.73, "learning_rate": 2.604965034965035e-06, "loss": 0.4005, "step": 20460 }, { "epoch": 17.74, "learning_rate": 2.6042657342657343e-06, "loss": 0.4692, "step": 20470 }, { "epoch": 17.75, "learning_rate": 2.6035664335664334e-06, "loss": 0.3993, "step": 20480 }, { "epoch": 17.76, "learning_rate": 2.6028671328671325e-06, "loss": 0.3955, "step": 20490 }, { "epoch": 17.76, "learning_rate": 2.602167832167832e-06, "loss": 0.3767, "step": 20500 }, { "epoch": 17.77, "learning_rate": 2.6014685314685315e-06, "loss": 0.3714, "step": 20510 }, { "epoch": 17.78, "learning_rate": 2.600769230769231e-06, "loss": 0.4252, "step": 20520 }, { "epoch": 17.79, "learning_rate": 2.6000699300699296e-06, "loss": 0.3484, "step": 20530 }, { "epoch": 17.8, "learning_rate": 2.599370629370629e-06, "loss": 0.4087, "step": 20540 }, { "epoch": 17.81, "learning_rate": 2.5986713286713286e-06, "loss": 0.4252, "step": 20550 }, { "epoch": 17.82, "learning_rate": 2.5979720279720277e-06, "loss": 0.427, "step": 20560 }, { "epoch": 17.82, "learning_rate": 2.597272727272727e-06, "loss": 0.3832, "step": 20570 }, { "epoch": 17.83, "learning_rate": 2.5965734265734263e-06, "loss": 0.4301, "step": 20580 }, { "epoch": 17.84, "learning_rate": 2.5958741258741258e-06, "loss": 0.4196, "step": 20590 }, { "epoch": 17.85, "learning_rate": 2.595174825174825e-06, "loss": 0.3853, "step": 20600 }, { "epoch": 17.86, "learning_rate": 2.5944755244755243e-06, "loss": 0.4572, "step": 20610 }, { "epoch": 17.87, "learning_rate": 2.593776223776224e-06, "loss": 0.4236, "step": 20620 }, { "epoch": 17.88, "learning_rate": 2.5930769230769233e-06, "loss": 0.3852, "step": 20630 }, { "epoch": 17.89, "learning_rate": 2.592377622377622e-06, "loss": 0.3795, "step": 20640 }, { "epoch": 17.89, "learning_rate": 2.5916783216783215e-06, "loss": 0.4265, "step": 20650 }, { "epoch": 17.9, "learning_rate": 2.590979020979021e-06, "loss": 0.4455, "step": 20660 }, { "epoch": 17.91, "learning_rate": 2.59027972027972e-06, "loss": 0.4368, "step": 20670 }, { "epoch": 17.92, "learning_rate": 2.5895804195804195e-06, "loss": 0.4364, "step": 20680 }, { "epoch": 17.93, "learning_rate": 2.5888811188811186e-06, "loss": 0.4531, "step": 20690 }, { "epoch": 17.94, "learning_rate": 2.588181818181818e-06, "loss": 0.39, "step": 20700 }, { "epoch": 17.95, "learning_rate": 2.587482517482517e-06, "loss": 0.3788, "step": 20710 }, { "epoch": 17.95, "learning_rate": 2.5867832167832167e-06, "loss": 0.3861, "step": 20720 }, { "epoch": 17.96, "learning_rate": 2.586083916083916e-06, "loss": 0.385, "step": 20730 }, { "epoch": 17.97, "learning_rate": 2.5853846153846153e-06, "loss": 0.369, "step": 20740 }, { "epoch": 17.98, "learning_rate": 2.5846853146853143e-06, "loss": 0.4202, "step": 20750 }, { "epoch": 17.99, "learning_rate": 2.583986013986014e-06, "loss": 0.3634, "step": 20760 }, { "epoch": 18.0, "learning_rate": 2.5832867132867133e-06, "loss": 0.4082, "step": 20770 }, { "epoch": 18.0, "eval_loss": 0.560993492603302, "eval_runtime": 134.8261, "eval_samples_per_second": 3.946, "eval_steps_per_second": 1.973, "eval_wer": 0.2528122388635341, "step": 20772 }, { "epoch": 18.01, "learning_rate": 2.5825874125874124e-06, "loss": 0.427, "step": 20780 }, { "epoch": 18.02, "learning_rate": 2.581888111888112e-06, "loss": 0.3963, "step": 20790 }, { "epoch": 18.02, "learning_rate": 2.581188811188811e-06, "loss": 0.3682, "step": 20800 }, { "epoch": 18.03, "learning_rate": 2.5804895104895105e-06, "loss": 0.4136, "step": 20810 }, { "epoch": 18.04, "learning_rate": 2.5797902097902095e-06, "loss": 0.4609, "step": 20820 }, { "epoch": 18.05, "learning_rate": 2.579090909090909e-06, "loss": 0.3814, "step": 20830 }, { "epoch": 18.06, "learning_rate": 2.5783916083916085e-06, "loss": 0.3502, "step": 20840 }, { "epoch": 18.07, "learning_rate": 2.577692307692307e-06, "loss": 0.4283, "step": 20850 }, { "epoch": 18.08, "learning_rate": 2.5769930069930067e-06, "loss": 0.3669, "step": 20860 }, { "epoch": 18.08, "learning_rate": 2.576293706293706e-06, "loss": 0.4066, "step": 20870 }, { "epoch": 18.09, "learning_rate": 2.5755944055944057e-06, "loss": 0.4107, "step": 20880 }, { "epoch": 18.1, "learning_rate": 2.5748951048951047e-06, "loss": 0.3645, "step": 20890 }, { "epoch": 18.11, "learning_rate": 2.5741958041958042e-06, "loss": 0.3502, "step": 20900 }, { "epoch": 18.12, "learning_rate": 2.5734965034965033e-06, "loss": 0.4241, "step": 20910 }, { "epoch": 18.13, "learning_rate": 2.5727972027972024e-06, "loss": 0.3582, "step": 20920 }, { "epoch": 18.14, "learning_rate": 2.572097902097902e-06, "loss": 0.3864, "step": 20930 }, { "epoch": 18.15, "learning_rate": 2.5713986013986014e-06, "loss": 0.3675, "step": 20940 }, { "epoch": 18.15, "learning_rate": 2.570699300699301e-06, "loss": 0.3774, "step": 20950 }, { "epoch": 18.16, "learning_rate": 2.5699999999999995e-06, "loss": 0.4393, "step": 20960 }, { "epoch": 18.17, "learning_rate": 2.569300699300699e-06, "loss": 0.4115, "step": 20970 }, { "epoch": 18.18, "learning_rate": 2.5686013986013985e-06, "loss": 0.3484, "step": 20980 }, { "epoch": 18.19, "learning_rate": 2.567902097902098e-06, "loss": 0.3803, "step": 20990 }, { "epoch": 18.2, "learning_rate": 2.567202797202797e-06, "loss": 0.3447, "step": 21000 }, { "epoch": 18.21, "learning_rate": 2.5665034965034966e-06, "loss": 0.4175, "step": 21010 }, { "epoch": 18.21, "learning_rate": 2.5658041958041957e-06, "loss": 0.4695, "step": 21020 }, { "epoch": 18.22, "learning_rate": 2.5651048951048947e-06, "loss": 0.4124, "step": 21030 }, { "epoch": 18.23, "learning_rate": 2.5644055944055942e-06, "loss": 0.3712, "step": 21040 }, { "epoch": 18.24, "learning_rate": 2.5637062937062937e-06, "loss": 0.5031, "step": 21050 }, { "epoch": 18.25, "learning_rate": 2.5630069930069932e-06, "loss": 0.3665, "step": 21060 }, { "epoch": 18.26, "learning_rate": 2.562307692307692e-06, "loss": 0.3783, "step": 21070 }, { "epoch": 18.27, "learning_rate": 2.5616083916083914e-06, "loss": 0.4238, "step": 21080 }, { "epoch": 18.28, "learning_rate": 2.560909090909091e-06, "loss": 0.3632, "step": 21090 }, { "epoch": 18.28, "learning_rate": 2.56020979020979e-06, "loss": 0.4002, "step": 21100 }, { "epoch": 18.29, "learning_rate": 2.5595104895104894e-06, "loss": 0.3893, "step": 21110 }, { "epoch": 18.3, "learning_rate": 2.558811188811189e-06, "loss": 0.4453, "step": 21120 }, { "epoch": 18.31, "learning_rate": 2.558111888111888e-06, "loss": 0.3853, "step": 21130 }, { "epoch": 18.32, "learning_rate": 2.557412587412587e-06, "loss": 0.4136, "step": 21140 }, { "epoch": 18.33, "learning_rate": 2.5567132867132866e-06, "loss": 0.3396, "step": 21150 }, { "epoch": 18.34, "learning_rate": 2.556013986013986e-06, "loss": 0.373, "step": 21160 }, { "epoch": 18.34, "learning_rate": 2.5553146853146856e-06, "loss": 0.4376, "step": 21170 }, { "epoch": 18.35, "learning_rate": 2.5546153846153842e-06, "loss": 0.3995, "step": 21180 }, { "epoch": 18.36, "learning_rate": 2.5539160839160837e-06, "loss": 0.3925, "step": 21190 }, { "epoch": 18.37, "learning_rate": 2.5532167832167832e-06, "loss": 0.3515, "step": 21200 }, { "epoch": 18.38, "learning_rate": 2.5525174825174823e-06, "loss": 0.4145, "step": 21210 }, { "epoch": 18.39, "learning_rate": 2.551818181818182e-06, "loss": 0.3953, "step": 21220 }, { "epoch": 18.4, "learning_rate": 2.551118881118881e-06, "loss": 0.4111, "step": 21230 }, { "epoch": 18.41, "learning_rate": 2.5504195804195804e-06, "loss": 0.3434, "step": 21240 }, { "epoch": 18.41, "learning_rate": 2.5497202797202794e-06, "loss": 0.4359, "step": 21250 }, { "epoch": 18.42, "learning_rate": 2.549020979020979e-06, "loss": 0.3937, "step": 21260 }, { "epoch": 18.43, "learning_rate": 2.5483216783216784e-06, "loss": 0.3623, "step": 21270 }, { "epoch": 18.44, "learning_rate": 2.5476223776223775e-06, "loss": 0.3874, "step": 21280 }, { "epoch": 18.45, "learning_rate": 2.5469230769230766e-06, "loss": 0.4689, "step": 21290 }, { "epoch": 18.46, "learning_rate": 2.546223776223776e-06, "loss": 0.3915, "step": 21300 }, { "epoch": 18.47, "learning_rate": 2.5455244755244756e-06, "loss": 0.411, "step": 21310 }, { "epoch": 18.47, "learning_rate": 2.5448251748251746e-06, "loss": 0.4007, "step": 21320 }, { "epoch": 18.48, "learning_rate": 2.544125874125874e-06, "loss": 0.362, "step": 21330 }, { "epoch": 18.49, "learning_rate": 2.5434265734265732e-06, "loss": 0.4242, "step": 21340 }, { "epoch": 18.5, "learning_rate": 2.5427272727272727e-06, "loss": 0.3352, "step": 21350 }, { "epoch": 18.51, "learning_rate": 2.542027972027972e-06, "loss": 0.3417, "step": 21360 }, { "epoch": 18.52, "learning_rate": 2.5413286713286713e-06, "loss": 0.3786, "step": 21370 }, { "epoch": 18.53, "learning_rate": 2.5406293706293708e-06, "loss": 0.3854, "step": 21380 }, { "epoch": 18.54, "learning_rate": 2.5399300699300694e-06, "loss": 0.4607, "step": 21390 }, { "epoch": 18.54, "learning_rate": 2.539230769230769e-06, "loss": 0.345, "step": 21400 }, { "epoch": 18.55, "learning_rate": 2.5385314685314684e-06, "loss": 0.3871, "step": 21410 }, { "epoch": 18.56, "learning_rate": 2.537832167832168e-06, "loss": 0.4067, "step": 21420 }, { "epoch": 18.57, "learning_rate": 2.537132867132867e-06, "loss": 0.3858, "step": 21430 }, { "epoch": 18.58, "learning_rate": 2.5364335664335665e-06, "loss": 0.4136, "step": 21440 }, { "epoch": 18.59, "learning_rate": 2.5357342657342656e-06, "loss": 0.3779, "step": 21450 }, { "epoch": 18.6, "learning_rate": 2.5350349650349646e-06, "loss": 0.3737, "step": 21460 }, { "epoch": 18.6, "learning_rate": 2.534335664335664e-06, "loss": 0.4113, "step": 21470 }, { "epoch": 18.61, "learning_rate": 2.5336363636363636e-06, "loss": 0.354, "step": 21480 }, { "epoch": 18.62, "learning_rate": 2.532937062937063e-06, "loss": 0.383, "step": 21490 }, { "epoch": 18.63, "learning_rate": 2.5322377622377618e-06, "loss": 0.3859, "step": 21500 }, { "epoch": 18.64, "learning_rate": 2.5315384615384613e-06, "loss": 0.3904, "step": 21510 }, { "epoch": 18.65, "learning_rate": 2.5308391608391608e-06, "loss": 0.381, "step": 21520 }, { "epoch": 18.66, "learning_rate": 2.53013986013986e-06, "loss": 0.4758, "step": 21530 }, { "epoch": 18.67, "learning_rate": 2.5294405594405593e-06, "loss": 0.4253, "step": 21540 }, { "epoch": 18.67, "learning_rate": 2.528741258741259e-06, "loss": 0.3751, "step": 21550 }, { "epoch": 18.68, "learning_rate": 2.528041958041958e-06, "loss": 0.3658, "step": 21560 }, { "epoch": 18.69, "learning_rate": 2.527342657342657e-06, "loss": 0.4032, "step": 21570 }, { "epoch": 18.7, "learning_rate": 2.5266433566433565e-06, "loss": 0.3402, "step": 21580 }, { "epoch": 18.71, "learning_rate": 2.525944055944056e-06, "loss": 0.364, "step": 21590 }, { "epoch": 18.72, "learning_rate": 2.5252447552447555e-06, "loss": 0.3297, "step": 21600 }, { "epoch": 18.73, "learning_rate": 2.524545454545454e-06, "loss": 0.456, "step": 21610 }, { "epoch": 18.73, "learning_rate": 2.5238461538461536e-06, "loss": 0.4218, "step": 21620 }, { "epoch": 18.74, "learning_rate": 2.523146853146853e-06, "loss": 0.3752, "step": 21630 }, { "epoch": 18.75, "learning_rate": 2.522447552447552e-06, "loss": 0.3573, "step": 21640 }, { "epoch": 18.76, "learning_rate": 2.5217482517482517e-06, "loss": 0.3968, "step": 21650 }, { "epoch": 18.77, "learning_rate": 2.521048951048951e-06, "loss": 0.3725, "step": 21660 }, { "epoch": 18.78, "learning_rate": 2.5203496503496503e-06, "loss": 0.3844, "step": 21670 }, { "epoch": 18.79, "learning_rate": 2.5196503496503493e-06, "loss": 0.4076, "step": 21680 }, { "epoch": 18.8, "learning_rate": 2.518951048951049e-06, "loss": 0.4098, "step": 21690 }, { "epoch": 18.8, "learning_rate": 2.5182517482517483e-06, "loss": 0.3585, "step": 21700 }, { "epoch": 18.81, "learning_rate": 2.5175524475524474e-06, "loss": 0.4506, "step": 21710 }, { "epoch": 18.82, "learning_rate": 2.5168531468531465e-06, "loss": 0.4148, "step": 21720 }, { "epoch": 18.83, "learning_rate": 2.516153846153846e-06, "loss": 0.3211, "step": 21730 }, { "epoch": 18.84, "learning_rate": 2.5154545454545455e-06, "loss": 0.3571, "step": 21740 }, { "epoch": 18.85, "learning_rate": 2.5147552447552445e-06, "loss": 0.378, "step": 21750 }, { "epoch": 18.86, "learning_rate": 2.514055944055944e-06, "loss": 0.4275, "step": 21760 }, { "epoch": 18.86, "learning_rate": 2.513356643356643e-06, "loss": 0.4126, "step": 21770 }, { "epoch": 18.87, "learning_rate": 2.5126573426573426e-06, "loss": 0.4135, "step": 21780 }, { "epoch": 18.88, "learning_rate": 2.5119580419580417e-06, "loss": 0.3731, "step": 21790 }, { "epoch": 18.89, "learning_rate": 2.511258741258741e-06, "loss": 0.3684, "step": 21800 }, { "epoch": 18.9, "learning_rate": 2.5105594405594407e-06, "loss": 0.346, "step": 21810 }, { "epoch": 18.91, "learning_rate": 2.5098601398601398e-06, "loss": 0.3587, "step": 21820 }, { "epoch": 18.92, "learning_rate": 2.509160839160839e-06, "loss": 0.4568, "step": 21830 }, { "epoch": 18.93, "learning_rate": 2.5084615384615383e-06, "loss": 0.4482, "step": 21840 }, { "epoch": 18.93, "learning_rate": 2.507762237762238e-06, "loss": 0.3697, "step": 21850 }, { "epoch": 18.94, "learning_rate": 2.507062937062937e-06, "loss": 0.3989, "step": 21860 }, { "epoch": 18.95, "learning_rate": 2.5063636363636364e-06, "loss": 0.4218, "step": 21870 }, { "epoch": 18.96, "learning_rate": 2.5056643356643355e-06, "loss": 0.3684, "step": 21880 }, { "epoch": 18.97, "learning_rate": 2.5049650349650345e-06, "loss": 0.4327, "step": 21890 }, { "epoch": 18.98, "learning_rate": 2.504265734265734e-06, "loss": 0.4212, "step": 21900 }, { "epoch": 18.99, "learning_rate": 2.5035664335664335e-06, "loss": 0.3928, "step": 21910 }, { "epoch": 18.99, "learning_rate": 2.502867132867133e-06, "loss": 0.4316, "step": 21920 }, { "epoch": 19.0, "eval_loss": 0.5407825112342834, "eval_runtime": 135.3965, "eval_samples_per_second": 3.929, "eval_steps_per_second": 1.965, "eval_wer": 0.2506910072636112, "step": 21926 }, { "epoch": 19.0, "learning_rate": 2.502167832167832e-06, "loss": 0.389, "step": 21930 }, { "epoch": 19.01, "learning_rate": 2.501468531468531e-06, "loss": 0.3784, "step": 21940 }, { "epoch": 19.02, "learning_rate": 2.5007692307692307e-06, "loss": 0.3543, "step": 21950 }, { "epoch": 19.03, "learning_rate": 2.50006993006993e-06, "loss": 0.4176, "step": 21960 }, { "epoch": 19.04, "learning_rate": 2.4993706293706292e-06, "loss": 0.4456, "step": 21970 }, { "epoch": 19.05, "learning_rate": 2.4986713286713287e-06, "loss": 0.432, "step": 21980 }, { "epoch": 19.06, "learning_rate": 2.497972027972028e-06, "loss": 0.4524, "step": 21990 }, { "epoch": 19.06, "learning_rate": 2.497272727272727e-06, "loss": 0.3371, "step": 22000 }, { "epoch": 19.07, "learning_rate": 2.4965734265734264e-06, "loss": 0.3873, "step": 22010 }, { "epoch": 19.08, "learning_rate": 2.495874125874126e-06, "loss": 0.3631, "step": 22020 }, { "epoch": 19.09, "learning_rate": 2.4951748251748254e-06, "loss": 0.3886, "step": 22030 }, { "epoch": 19.1, "learning_rate": 2.494475524475524e-06, "loss": 0.3754, "step": 22040 }, { "epoch": 19.11, "learning_rate": 2.4937762237762235e-06, "loss": 0.425, "step": 22050 }, { "epoch": 19.12, "learning_rate": 2.493076923076923e-06, "loss": 0.3737, "step": 22060 }, { "epoch": 19.12, "learning_rate": 2.492377622377622e-06, "loss": 0.4261, "step": 22070 }, { "epoch": 19.13, "learning_rate": 2.4916783216783216e-06, "loss": 0.3958, "step": 22080 }, { "epoch": 19.14, "learning_rate": 2.490979020979021e-06, "loss": 0.3736, "step": 22090 }, { "epoch": 19.15, "learning_rate": 2.49027972027972e-06, "loss": 0.3276, "step": 22100 }, { "epoch": 19.16, "learning_rate": 2.4895804195804192e-06, "loss": 0.3589, "step": 22110 }, { "epoch": 19.17, "learning_rate": 2.4888811188811187e-06, "loss": 0.4129, "step": 22120 }, { "epoch": 19.18, "learning_rate": 2.4881818181818182e-06, "loss": 0.3523, "step": 22130 }, { "epoch": 19.19, "learning_rate": 2.4874825174825177e-06, "loss": 0.4183, "step": 22140 }, { "epoch": 19.19, "learning_rate": 2.4867832167832164e-06, "loss": 0.3582, "step": 22150 }, { "epoch": 19.2, "learning_rate": 2.486083916083916e-06, "loss": 0.387, "step": 22160 }, { "epoch": 19.21, "learning_rate": 2.4853846153846154e-06, "loss": 0.412, "step": 22170 }, { "epoch": 19.22, "learning_rate": 2.4846853146853144e-06, "loss": 0.3966, "step": 22180 }, { "epoch": 19.23, "learning_rate": 2.483986013986014e-06, "loss": 0.4483, "step": 22190 }, { "epoch": 19.24, "learning_rate": 2.4832867132867134e-06, "loss": 0.3605, "step": 22200 }, { "epoch": 19.25, "learning_rate": 2.4825874125874125e-06, "loss": 0.4112, "step": 22210 }, { "epoch": 19.25, "learning_rate": 2.4818881118881116e-06, "loss": 0.3792, "step": 22220 }, { "epoch": 19.26, "learning_rate": 2.481188811188811e-06, "loss": 0.3607, "step": 22230 }, { "epoch": 19.27, "learning_rate": 2.4804895104895106e-06, "loss": 0.4215, "step": 22240 }, { "epoch": 19.28, "learning_rate": 2.4797902097902097e-06, "loss": 0.4503, "step": 22250 }, { "epoch": 19.29, "learning_rate": 2.4790909090909087e-06, "loss": 0.4321, "step": 22260 }, { "epoch": 19.3, "learning_rate": 2.4783916083916082e-06, "loss": 0.367, "step": 22270 }, { "epoch": 19.31, "learning_rate": 2.4776923076923077e-06, "loss": 0.3698, "step": 22280 }, { "epoch": 19.32, "learning_rate": 2.476993006993007e-06, "loss": 0.3944, "step": 22290 }, { "epoch": 19.32, "learning_rate": 2.4762937062937063e-06, "loss": 0.3623, "step": 22300 }, { "epoch": 19.33, "learning_rate": 2.4755944055944058e-06, "loss": 0.408, "step": 22310 }, { "epoch": 19.34, "learning_rate": 2.474895104895105e-06, "loss": 0.4196, "step": 22320 }, { "epoch": 19.35, "learning_rate": 2.474195804195804e-06, "loss": 0.367, "step": 22330 }, { "epoch": 19.36, "learning_rate": 2.4734965034965034e-06, "loss": 0.3914, "step": 22340 }, { "epoch": 19.37, "learning_rate": 2.472797202797203e-06, "loss": 0.4052, "step": 22350 }, { "epoch": 19.38, "learning_rate": 2.472097902097902e-06, "loss": 0.3447, "step": 22360 }, { "epoch": 19.38, "learning_rate": 2.471398601398601e-06, "loss": 0.4061, "step": 22370 }, { "epoch": 19.39, "learning_rate": 2.4706993006993006e-06, "loss": 0.4787, "step": 22380 }, { "epoch": 19.4, "learning_rate": 2.47e-06, "loss": 0.4053, "step": 22390 }, { "epoch": 19.41, "learning_rate": 2.469300699300699e-06, "loss": 0.3524, "step": 22400 }, { "epoch": 19.42, "learning_rate": 2.4686013986013986e-06, "loss": 0.4586, "step": 22410 }, { "epoch": 19.43, "learning_rate": 2.4679020979020977e-06, "loss": 0.3858, "step": 22420 }, { "epoch": 19.44, "learning_rate": 2.4672027972027968e-06, "loss": 0.3866, "step": 22430 }, { "epoch": 19.45, "learning_rate": 2.4665034965034963e-06, "loss": 0.354, "step": 22440 }, { "epoch": 19.45, "learning_rate": 2.4658041958041958e-06, "loss": 0.3874, "step": 22450 }, { "epoch": 19.46, "learning_rate": 2.4651048951048953e-06, "loss": 0.4058, "step": 22460 }, { "epoch": 19.47, "learning_rate": 2.4644055944055943e-06, "loss": 0.4326, "step": 22470 }, { "epoch": 19.48, "learning_rate": 2.4637062937062934e-06, "loss": 0.3791, "step": 22480 }, { "epoch": 19.49, "learning_rate": 2.463006993006993e-06, "loss": 0.4037, "step": 22490 }, { "epoch": 19.5, "learning_rate": 2.462307692307692e-06, "loss": 0.391, "step": 22500 }, { "epoch": 19.51, "learning_rate": 2.4616083916083915e-06, "loss": 0.403, "step": 22510 }, { "epoch": 19.51, "learning_rate": 2.460909090909091e-06, "loss": 0.3796, "step": 22520 }, { "epoch": 19.52, "learning_rate": 2.46020979020979e-06, "loss": 0.4075, "step": 22530 }, { "epoch": 19.53, "learning_rate": 2.459510489510489e-06, "loss": 0.442, "step": 22540 }, { "epoch": 19.54, "learning_rate": 2.4588111888111886e-06, "loss": 0.3926, "step": 22550 }, { "epoch": 19.55, "learning_rate": 2.458111888111888e-06, "loss": 0.3807, "step": 22560 }, { "epoch": 19.56, "learning_rate": 2.4574125874125876e-06, "loss": 0.4076, "step": 22570 }, { "epoch": 19.57, "learning_rate": 2.4567132867132863e-06, "loss": 0.4484, "step": 22580 }, { "epoch": 19.58, "learning_rate": 2.4560139860139858e-06, "loss": 0.3222, "step": 22590 }, { "epoch": 19.58, "learning_rate": 2.4553146853146853e-06, "loss": 0.4182, "step": 22600 }, { "epoch": 19.59, "learning_rate": 2.4546153846153843e-06, "loss": 0.3973, "step": 22610 }, { "epoch": 19.6, "learning_rate": 2.453916083916084e-06, "loss": 0.4256, "step": 22620 }, { "epoch": 19.61, "learning_rate": 2.4532167832167833e-06, "loss": 0.4119, "step": 22630 }, { "epoch": 19.62, "learning_rate": 2.4525174825174824e-06, "loss": 0.3956, "step": 22640 }, { "epoch": 19.63, "learning_rate": 2.4518181818181815e-06, "loss": 0.3509, "step": 22650 }, { "epoch": 19.64, "learning_rate": 2.451118881118881e-06, "loss": 0.3464, "step": 22660 }, { "epoch": 19.64, "learning_rate": 2.4504195804195805e-06, "loss": 0.4038, "step": 22670 }, { "epoch": 19.65, "learning_rate": 2.4497202797202796e-06, "loss": 0.3272, "step": 22680 }, { "epoch": 19.66, "learning_rate": 2.4490209790209786e-06, "loss": 0.3358, "step": 22690 }, { "epoch": 19.67, "learning_rate": 2.448321678321678e-06, "loss": 0.4066, "step": 22700 }, { "epoch": 19.68, "learning_rate": 2.4476223776223776e-06, "loss": 0.3879, "step": 22710 }, { "epoch": 19.69, "learning_rate": 2.4469230769230767e-06, "loss": 0.3762, "step": 22720 }, { "epoch": 19.7, "learning_rate": 2.446223776223776e-06, "loss": 0.4083, "step": 22730 }, { "epoch": 19.71, "learning_rate": 2.4455244755244757e-06, "loss": 0.4895, "step": 22740 }, { "epoch": 19.71, "learning_rate": 2.4448251748251748e-06, "loss": 0.3472, "step": 22750 }, { "epoch": 19.72, "learning_rate": 2.444125874125874e-06, "loss": 0.3847, "step": 22760 }, { "epoch": 19.73, "learning_rate": 2.4434265734265733e-06, "loss": 0.4201, "step": 22770 }, { "epoch": 19.74, "learning_rate": 2.442727272727273e-06, "loss": 0.3952, "step": 22780 }, { "epoch": 19.75, "learning_rate": 2.442027972027972e-06, "loss": 0.3627, "step": 22790 }, { "epoch": 19.76, "learning_rate": 2.441328671328671e-06, "loss": 0.3866, "step": 22800 }, { "epoch": 19.77, "learning_rate": 2.4406293706293705e-06, "loss": 0.4224, "step": 22810 }, { "epoch": 19.77, "learning_rate": 2.43993006993007e-06, "loss": 0.4178, "step": 22820 }, { "epoch": 19.78, "learning_rate": 2.439230769230769e-06, "loss": 0.4198, "step": 22830 }, { "epoch": 19.79, "learning_rate": 2.4385314685314685e-06, "loss": 0.3951, "step": 22840 }, { "epoch": 19.8, "learning_rate": 2.437832167832168e-06, "loss": 0.3302, "step": 22850 }, { "epoch": 19.81, "learning_rate": 2.437202797202797e-06, "loss": 0.3735, "step": 22860 }, { "epoch": 19.82, "learning_rate": 2.4365034965034966e-06, "loss": 0.4324, "step": 22870 }, { "epoch": 19.83, "learning_rate": 2.4358041958041956e-06, "loss": 0.3774, "step": 22880 }, { "epoch": 19.83, "learning_rate": 2.4351048951048947e-06, "loss": 0.3634, "step": 22890 }, { "epoch": 19.84, "learning_rate": 2.4344055944055942e-06, "loss": 0.3314, "step": 22900 }, { "epoch": 19.85, "learning_rate": 2.4337062937062937e-06, "loss": 0.412, "step": 22910 }, { "epoch": 19.86, "learning_rate": 2.4330069930069928e-06, "loss": 0.4328, "step": 22920 }, { "epoch": 19.87, "learning_rate": 2.4323076923076923e-06, "loss": 0.4351, "step": 22930 }, { "epoch": 19.88, "learning_rate": 2.4316083916083918e-06, "loss": 0.3949, "step": 22940 }, { "epoch": 19.89, "learning_rate": 2.430909090909091e-06, "loss": 0.3694, "step": 22950 }, { "epoch": 19.9, "learning_rate": 2.43020979020979e-06, "loss": 0.4665, "step": 22960 }, { "epoch": 19.9, "learning_rate": 2.4295104895104894e-06, "loss": 0.3563, "step": 22970 }, { "epoch": 19.91, "learning_rate": 2.428811188811189e-06, "loss": 0.3771, "step": 22980 }, { "epoch": 19.92, "learning_rate": 2.428111888111888e-06, "loss": 0.3597, "step": 22990 }, { "epoch": 19.93, "learning_rate": 2.427412587412587e-06, "loss": 0.4063, "step": 23000 }, { "epoch": 19.94, "learning_rate": 2.4267132867132866e-06, "loss": 0.3725, "step": 23010 }, { "epoch": 19.95, "learning_rate": 2.426013986013986e-06, "loss": 0.4306, "step": 23020 }, { "epoch": 19.96, "learning_rate": 2.425314685314685e-06, "loss": 0.3789, "step": 23030 }, { "epoch": 19.96, "learning_rate": 2.4246153846153846e-06, "loss": 0.4015, "step": 23040 }, { "epoch": 19.97, "learning_rate": 2.423916083916084e-06, "loss": 0.4076, "step": 23050 }, { "epoch": 19.98, "learning_rate": 2.4232167832167828e-06, "loss": 0.3486, "step": 23060 }, { "epoch": 19.99, "learning_rate": 2.4225174825174823e-06, "loss": 0.3632, "step": 23070 }, { "epoch": 20.0, "learning_rate": 2.4218181818181818e-06, "loss": 0.3136, "step": 23080 }, { "epoch": 20.0, "eval_loss": 0.5591942071914673, "eval_runtime": 134.7021, "eval_samples_per_second": 3.949, "eval_steps_per_second": 1.975, "eval_wer": 0.25249084013627304, "step": 23080 }, { "epoch": 20.01, "learning_rate": 2.4211188811188813e-06, "loss": 0.3984, "step": 23090 }, { "epoch": 20.02, "learning_rate": 2.4204195804195803e-06, "loss": 0.4126, "step": 23100 }, { "epoch": 20.03, "learning_rate": 2.4197202797202794e-06, "loss": 0.4086, "step": 23110 }, { "epoch": 20.03, "learning_rate": 2.419020979020979e-06, "loss": 0.374, "step": 23120 }, { "epoch": 20.04, "learning_rate": 2.418321678321678e-06, "loss": 0.367, "step": 23130 }, { "epoch": 20.05, "learning_rate": 2.4176223776223775e-06, "loss": 0.3317, "step": 23140 }, { "epoch": 20.06, "learning_rate": 2.416923076923077e-06, "loss": 0.3914, "step": 23150 }, { "epoch": 20.07, "learning_rate": 2.4162237762237765e-06, "loss": 0.384, "step": 23160 }, { "epoch": 20.08, "learning_rate": 2.415524475524475e-06, "loss": 0.3982, "step": 23170 }, { "epoch": 20.09, "learning_rate": 2.4148251748251746e-06, "loss": 0.385, "step": 23180 }, { "epoch": 20.1, "learning_rate": 2.414125874125874e-06, "loss": 0.4257, "step": 23190 }, { "epoch": 20.1, "learning_rate": 2.4134265734265736e-06, "loss": 0.3899, "step": 23200 }, { "epoch": 20.11, "learning_rate": 2.4127272727272727e-06, "loss": 0.3788, "step": 23210 }, { "epoch": 20.12, "learning_rate": 2.4120279720279718e-06, "loss": 0.3876, "step": 23220 }, { "epoch": 20.13, "learning_rate": 2.4113286713286713e-06, "loss": 0.3267, "step": 23230 }, { "epoch": 20.14, "learning_rate": 2.4106293706293703e-06, "loss": 0.4032, "step": 23240 }, { "epoch": 20.15, "learning_rate": 2.40993006993007e-06, "loss": 0.3677, "step": 23250 }, { "epoch": 20.16, "learning_rate": 2.4092307692307693e-06, "loss": 0.3476, "step": 23260 }, { "epoch": 20.16, "learning_rate": 2.4085314685314684e-06, "loss": 0.3811, "step": 23270 }, { "epoch": 20.17, "learning_rate": 2.4078321678321675e-06, "loss": 0.4277, "step": 23280 }, { "epoch": 20.18, "learning_rate": 2.407132867132867e-06, "loss": 0.4007, "step": 23290 }, { "epoch": 20.19, "learning_rate": 2.4064335664335665e-06, "loss": 0.3914, "step": 23300 }, { "epoch": 20.2, "learning_rate": 2.4057342657342655e-06, "loss": 0.3485, "step": 23310 }, { "epoch": 20.21, "learning_rate": 2.405034965034965e-06, "loss": 0.3969, "step": 23320 }, { "epoch": 20.22, "learning_rate": 2.404335664335664e-06, "loss": 0.4566, "step": 23330 }, { "epoch": 20.23, "learning_rate": 2.4036363636363636e-06, "loss": 0.3597, "step": 23340 }, { "epoch": 20.23, "learning_rate": 2.4029370629370627e-06, "loss": 0.3356, "step": 23350 }, { "epoch": 20.24, "learning_rate": 2.402237762237762e-06, "loss": 0.3972, "step": 23360 }, { "epoch": 20.25, "learning_rate": 2.4015384615384617e-06, "loss": 0.3903, "step": 23370 }, { "epoch": 20.26, "learning_rate": 2.4008391608391607e-06, "loss": 0.3691, "step": 23380 }, { "epoch": 20.27, "learning_rate": 2.40013986013986e-06, "loss": 0.3839, "step": 23390 }, { "epoch": 20.28, "learning_rate": 2.3994405594405593e-06, "loss": 0.3857, "step": 23400 }, { "epoch": 20.29, "learning_rate": 2.398741258741259e-06, "loss": 0.4017, "step": 23410 }, { "epoch": 20.29, "learning_rate": 2.398041958041958e-06, "loss": 0.4107, "step": 23420 }, { "epoch": 20.3, "learning_rate": 2.397342657342657e-06, "loss": 0.3938, "step": 23430 }, { "epoch": 20.31, "learning_rate": 2.3966433566433565e-06, "loss": 0.3747, "step": 23440 }, { "epoch": 20.32, "learning_rate": 2.395944055944056e-06, "loss": 0.338, "step": 23450 }, { "epoch": 20.33, "learning_rate": 2.395244755244755e-06, "loss": 0.4039, "step": 23460 }, { "epoch": 20.34, "learning_rate": 2.3945454545454545e-06, "loss": 0.3897, "step": 23470 }, { "epoch": 20.35, "learning_rate": 2.393846153846154e-06, "loss": 0.3777, "step": 23480 }, { "epoch": 20.36, "learning_rate": 2.3931468531468527e-06, "loss": 0.3809, "step": 23490 }, { "epoch": 20.36, "learning_rate": 2.392447552447552e-06, "loss": 0.4123, "step": 23500 }, { "epoch": 20.37, "learning_rate": 2.3917482517482517e-06, "loss": 0.3184, "step": 23510 }, { "epoch": 20.38, "learning_rate": 2.391048951048951e-06, "loss": 0.4499, "step": 23520 }, { "epoch": 20.39, "learning_rate": 2.3903496503496502e-06, "loss": 0.3823, "step": 23530 }, { "epoch": 20.4, "learning_rate": 2.3896503496503493e-06, "loss": 0.3515, "step": 23540 }, { "epoch": 20.41, "learning_rate": 2.388951048951049e-06, "loss": 0.3879, "step": 23550 }, { "epoch": 20.42, "learning_rate": 2.3882517482517483e-06, "loss": 0.3481, "step": 23560 }, { "epoch": 20.42, "learning_rate": 2.3875524475524474e-06, "loss": 0.4421, "step": 23570 }, { "epoch": 20.43, "learning_rate": 2.386853146853147e-06, "loss": 0.4234, "step": 23580 }, { "epoch": 20.44, "learning_rate": 2.3861538461538464e-06, "loss": 0.3732, "step": 23590 }, { "epoch": 20.45, "learning_rate": 2.385454545454545e-06, "loss": 0.3774, "step": 23600 }, { "epoch": 20.46, "learning_rate": 2.3847552447552445e-06, "loss": 0.3846, "step": 23610 }, { "epoch": 20.47, "learning_rate": 2.384055944055944e-06, "loss": 0.4003, "step": 23620 }, { "epoch": 20.48, "learning_rate": 2.3833566433566435e-06, "loss": 0.4432, "step": 23630 }, { "epoch": 20.49, "learning_rate": 2.3826573426573426e-06, "loss": 0.4091, "step": 23640 }, { "epoch": 20.49, "learning_rate": 2.3819580419580417e-06, "loss": 0.4014, "step": 23650 }, { "epoch": 20.5, "learning_rate": 2.381258741258741e-06, "loss": 0.3904, "step": 23660 }, { "epoch": 20.51, "learning_rate": 2.3805594405594402e-06, "loss": 0.3942, "step": 23670 }, { "epoch": 20.52, "learning_rate": 2.3798601398601397e-06, "loss": 0.4678, "step": 23680 }, { "epoch": 20.53, "learning_rate": 2.3791608391608392e-06, "loss": 0.3161, "step": 23690 }, { "epoch": 20.54, "learning_rate": 2.3784615384615387e-06, "loss": 0.3986, "step": 23700 }, { "epoch": 20.55, "learning_rate": 2.3777622377622374e-06, "loss": 0.3756, "step": 23710 }, { "epoch": 20.55, "learning_rate": 2.377062937062937e-06, "loss": 0.4178, "step": 23720 }, { "epoch": 20.56, "learning_rate": 2.3763636363636364e-06, "loss": 0.3168, "step": 23730 }, { "epoch": 20.57, "learning_rate": 2.375664335664336e-06, "loss": 0.3617, "step": 23740 }, { "epoch": 20.58, "learning_rate": 2.374965034965035e-06, "loss": 0.4241, "step": 23750 }, { "epoch": 20.59, "learning_rate": 2.374265734265734e-06, "loss": 0.4324, "step": 23760 }, { "epoch": 20.6, "learning_rate": 2.3735664335664335e-06, "loss": 0.3782, "step": 23770 }, { "epoch": 20.61, "learning_rate": 2.3728671328671326e-06, "loss": 0.4475, "step": 23780 }, { "epoch": 20.61, "learning_rate": 2.372167832167832e-06, "loss": 0.3713, "step": 23790 }, { "epoch": 20.62, "learning_rate": 2.3714685314685316e-06, "loss": 0.3692, "step": 23800 }, { "epoch": 20.63, "learning_rate": 2.3707692307692306e-06, "loss": 0.364, "step": 23810 }, { "epoch": 20.64, "learning_rate": 2.3700699300699297e-06, "loss": 0.3905, "step": 23820 }, { "epoch": 20.65, "learning_rate": 2.3693706293706292e-06, "loss": 0.362, "step": 23830 }, { "epoch": 20.66, "learning_rate": 2.3686713286713287e-06, "loss": 0.4497, "step": 23840 }, { "epoch": 20.67, "learning_rate": 2.3679720279720278e-06, "loss": 0.3851, "step": 23850 }, { "epoch": 20.68, "learning_rate": 2.3672727272727273e-06, "loss": 0.3468, "step": 23860 }, { "epoch": 20.68, "learning_rate": 2.3665734265734264e-06, "loss": 0.3688, "step": 23870 }, { "epoch": 20.69, "learning_rate": 2.365874125874126e-06, "loss": 0.4112, "step": 23880 }, { "epoch": 20.7, "learning_rate": 2.365174825174825e-06, "loss": 0.3871, "step": 23890 }, { "epoch": 20.71, "learning_rate": 2.3644755244755244e-06, "loss": 0.4059, "step": 23900 }, { "epoch": 20.72, "learning_rate": 2.363776223776224e-06, "loss": 0.3437, "step": 23910 }, { "epoch": 20.73, "learning_rate": 2.363076923076923e-06, "loss": 0.387, "step": 23920 }, { "epoch": 20.74, "learning_rate": 2.362377622377622e-06, "loss": 0.4489, "step": 23930 }, { "epoch": 20.74, "learning_rate": 2.3616783216783216e-06, "loss": 0.4385, "step": 23940 }, { "epoch": 20.75, "learning_rate": 2.360979020979021e-06, "loss": 0.352, "step": 23950 }, { "epoch": 20.76, "learning_rate": 2.36027972027972e-06, "loss": 0.3235, "step": 23960 }, { "epoch": 20.77, "learning_rate": 2.3595804195804196e-06, "loss": 0.3833, "step": 23970 }, { "epoch": 20.78, "learning_rate": 2.3588811188811187e-06, "loss": 0.4387, "step": 23980 }, { "epoch": 20.79, "learning_rate": 2.358181818181818e-06, "loss": 0.3896, "step": 23990 }, { "epoch": 20.8, "learning_rate": 2.3574825174825173e-06, "loss": 0.4094, "step": 24000 }, { "epoch": 20.81, "learning_rate": 2.3567832167832168e-06, "loss": 0.4098, "step": 24010 }, { "epoch": 20.81, "learning_rate": 2.3560839160839163e-06, "loss": 0.4306, "step": 24020 }, { "epoch": 20.82, "learning_rate": 2.355384615384615e-06, "loss": 0.4632, "step": 24030 }, { "epoch": 20.83, "learning_rate": 2.3546853146853144e-06, "loss": 0.3862, "step": 24040 }, { "epoch": 20.84, "learning_rate": 2.353986013986014e-06, "loss": 0.3786, "step": 24050 }, { "epoch": 20.85, "learning_rate": 2.3532867132867134e-06, "loss": 0.3917, "step": 24060 }, { "epoch": 20.86, "learning_rate": 2.3525874125874125e-06, "loss": 0.409, "step": 24070 }, { "epoch": 20.87, "learning_rate": 2.3518881118881116e-06, "loss": 0.4337, "step": 24080 }, { "epoch": 20.87, "learning_rate": 2.351188811188811e-06, "loss": 0.3868, "step": 24090 }, { "epoch": 20.88, "learning_rate": 2.35048951048951e-06, "loss": 0.344, "step": 24100 }, { "epoch": 20.89, "learning_rate": 2.3497902097902096e-06, "loss": 0.3437, "step": 24110 }, { "epoch": 20.9, "learning_rate": 2.349090909090909e-06, "loss": 0.3807, "step": 24120 }, { "epoch": 20.91, "learning_rate": 2.3483916083916086e-06, "loss": 0.4006, "step": 24130 }, { "epoch": 20.92, "learning_rate": 2.3476923076923073e-06, "loss": 0.388, "step": 24140 }, { "epoch": 20.93, "learning_rate": 2.3469930069930068e-06, "loss": 0.3547, "step": 24150 }, { "epoch": 20.94, "learning_rate": 2.3462937062937063e-06, "loss": 0.3793, "step": 24160 }, { "epoch": 20.94, "learning_rate": 2.3455944055944058e-06, "loss": 0.3923, "step": 24170 }, { "epoch": 20.95, "learning_rate": 2.344895104895105e-06, "loss": 0.3735, "step": 24180 }, { "epoch": 20.96, "learning_rate": 2.344195804195804e-06, "loss": 0.3574, "step": 24190 }, { "epoch": 20.97, "learning_rate": 2.3434965034965034e-06, "loss": 0.3754, "step": 24200 }, { "epoch": 20.98, "learning_rate": 2.3427972027972025e-06, "loss": 0.3825, "step": 24210 }, { "epoch": 20.99, "learning_rate": 2.342097902097902e-06, "loss": 0.3868, "step": 24220 }, { "epoch": 21.0, "learning_rate": 2.3413986013986015e-06, "loss": 0.4249, "step": 24230 }, { "epoch": 21.0, "eval_loss": 0.5684043169021606, "eval_runtime": 135.7482, "eval_samples_per_second": 3.919, "eval_steps_per_second": 1.96, "eval_wer": 0.2560262261361445, "step": 24234 }, { "epoch": 21.01, "learning_rate": 2.340699300699301e-06, "loss": 0.4147, "step": 24240 }, { "epoch": 21.01, "learning_rate": 2.3399999999999996e-06, "loss": 0.3816, "step": 24250 }, { "epoch": 21.02, "learning_rate": 2.339300699300699e-06, "loss": 0.3229, "step": 24260 }, { "epoch": 21.03, "learning_rate": 2.3386013986013986e-06, "loss": 0.4494, "step": 24270 }, { "epoch": 21.04, "learning_rate": 2.3379020979020977e-06, "loss": 0.3372, "step": 24280 }, { "epoch": 21.05, "learning_rate": 2.337202797202797e-06, "loss": 0.4027, "step": 24290 }, { "epoch": 21.06, "learning_rate": 2.3365034965034963e-06, "loss": 0.378, "step": 24300 }, { "epoch": 21.07, "learning_rate": 2.3358041958041958e-06, "loss": 0.3572, "step": 24310 }, { "epoch": 21.07, "learning_rate": 2.335104895104895e-06, "loss": 0.4459, "step": 24320 }, { "epoch": 21.08, "learning_rate": 2.3344055944055943e-06, "loss": 0.415, "step": 24330 }, { "epoch": 21.09, "learning_rate": 2.333706293706294e-06, "loss": 0.3677, "step": 24340 }, { "epoch": 21.1, "learning_rate": 2.3330069930069933e-06, "loss": 0.3709, "step": 24350 }, { "epoch": 21.11, "learning_rate": 2.332307692307692e-06, "loss": 0.3639, "step": 24360 }, { "epoch": 21.12, "learning_rate": 2.3316083916083915e-06, "loss": 0.3739, "step": 24370 }, { "epoch": 21.13, "learning_rate": 2.330909090909091e-06, "loss": 0.4741, "step": 24380 }, { "epoch": 21.14, "learning_rate": 2.33020979020979e-06, "loss": 0.3959, "step": 24390 }, { "epoch": 21.14, "learning_rate": 2.3295104895104895e-06, "loss": 0.4105, "step": 24400 }, { "epoch": 21.15, "learning_rate": 2.3288111888111886e-06, "loss": 0.3114, "step": 24410 }, { "epoch": 21.16, "learning_rate": 2.328111888111888e-06, "loss": 0.3996, "step": 24420 }, { "epoch": 21.17, "learning_rate": 2.327412587412587e-06, "loss": 0.3822, "step": 24430 }, { "epoch": 21.18, "learning_rate": 2.3267132867132867e-06, "loss": 0.3457, "step": 24440 }, { "epoch": 21.19, "learning_rate": 2.326013986013986e-06, "loss": 0.3282, "step": 24450 }, { "epoch": 21.2, "learning_rate": 2.325314685314685e-06, "loss": 0.3591, "step": 24460 }, { "epoch": 21.2, "learning_rate": 2.3246153846153843e-06, "loss": 0.3947, "step": 24470 }, { "epoch": 21.21, "learning_rate": 2.323916083916084e-06, "loss": 0.3338, "step": 24480 }, { "epoch": 21.22, "learning_rate": 2.3232167832167833e-06, "loss": 0.3912, "step": 24490 }, { "epoch": 21.23, "learning_rate": 2.3225174825174824e-06, "loss": 0.3995, "step": 24500 }, { "epoch": 21.24, "learning_rate": 2.321818181818182e-06, "loss": 0.3751, "step": 24510 }, { "epoch": 21.25, "learning_rate": 2.321118881118881e-06, "loss": 0.3852, "step": 24520 }, { "epoch": 21.26, "learning_rate": 2.3204195804195805e-06, "loss": 0.4216, "step": 24530 }, { "epoch": 21.27, "learning_rate": 2.3197202797202795e-06, "loss": 0.3995, "step": 24540 }, { "epoch": 21.27, "learning_rate": 2.319020979020979e-06, "loss": 0.3965, "step": 24550 }, { "epoch": 21.28, "learning_rate": 2.3183216783216785e-06, "loss": 0.3995, "step": 24560 }, { "epoch": 21.29, "learning_rate": 2.317622377622377e-06, "loss": 0.3852, "step": 24570 }, { "epoch": 21.3, "learning_rate": 2.3169230769230767e-06, "loss": 0.3916, "step": 24580 }, { "epoch": 21.31, "learning_rate": 2.316223776223776e-06, "loss": 0.4175, "step": 24590 }, { "epoch": 21.32, "learning_rate": 2.3155244755244757e-06, "loss": 0.3673, "step": 24600 }, { "epoch": 21.33, "learning_rate": 2.3148251748251747e-06, "loss": 0.4021, "step": 24610 }, { "epoch": 21.33, "learning_rate": 2.314125874125874e-06, "loss": 0.3781, "step": 24620 }, { "epoch": 21.34, "learning_rate": 2.3134265734265733e-06, "loss": 0.3848, "step": 24630 }, { "epoch": 21.35, "learning_rate": 2.3127272727272724e-06, "loss": 0.3694, "step": 24640 }, { "epoch": 21.36, "learning_rate": 2.312027972027972e-06, "loss": 0.396, "step": 24650 }, { "epoch": 21.37, "learning_rate": 2.3113286713286714e-06, "loss": 0.3893, "step": 24660 }, { "epoch": 21.38, "learning_rate": 2.310629370629371e-06, "loss": 0.4334, "step": 24670 }, { "epoch": 21.39, "learning_rate": 2.3099300699300695e-06, "loss": 0.385, "step": 24680 }, { "epoch": 21.39, "learning_rate": 2.309230769230769e-06, "loss": 0.4337, "step": 24690 }, { "epoch": 21.4, "learning_rate": 2.3085314685314685e-06, "loss": 0.3979, "step": 24700 }, { "epoch": 21.41, "learning_rate": 2.307832167832168e-06, "loss": 0.4227, "step": 24710 }, { "epoch": 21.42, "learning_rate": 2.307132867132867e-06, "loss": 0.3878, "step": 24720 }, { "epoch": 21.43, "learning_rate": 2.306433566433566e-06, "loss": 0.4102, "step": 24730 }, { "epoch": 21.44, "learning_rate": 2.3057342657342657e-06, "loss": 0.3923, "step": 24740 }, { "epoch": 21.45, "learning_rate": 2.3050349650349647e-06, "loss": 0.3457, "step": 24750 }, { "epoch": 21.46, "learning_rate": 2.3043356643356642e-06, "loss": 0.4122, "step": 24760 }, { "epoch": 21.46, "learning_rate": 2.3036363636363637e-06, "loss": 0.3605, "step": 24770 }, { "epoch": 21.47, "learning_rate": 2.3029370629370632e-06, "loss": 0.3637, "step": 24780 }, { "epoch": 21.48, "learning_rate": 2.302237762237762e-06, "loss": 0.4152, "step": 24790 }, { "epoch": 21.49, "learning_rate": 2.3015384615384614e-06, "loss": 0.3703, "step": 24800 }, { "epoch": 21.5, "learning_rate": 2.300839160839161e-06, "loss": 0.3721, "step": 24810 }, { "epoch": 21.51, "learning_rate": 2.30013986013986e-06, "loss": 0.3466, "step": 24820 }, { "epoch": 21.52, "learning_rate": 2.2994405594405594e-06, "loss": 0.3717, "step": 24830 }, { "epoch": 21.52, "learning_rate": 2.2987412587412585e-06, "loss": 0.3719, "step": 24840 }, { "epoch": 21.53, "learning_rate": 2.298041958041958e-06, "loss": 0.3881, "step": 24850 }, { "epoch": 21.54, "learning_rate": 2.297342657342657e-06, "loss": 0.347, "step": 24860 }, { "epoch": 21.55, "learning_rate": 2.2966433566433566e-06, "loss": 0.3567, "step": 24870 }, { "epoch": 21.56, "learning_rate": 2.295944055944056e-06, "loss": 0.4173, "step": 24880 }, { "epoch": 21.57, "learning_rate": 2.2952447552447556e-06, "loss": 0.3959, "step": 24890 }, { "epoch": 21.58, "learning_rate": 2.2945454545454542e-06, "loss": 0.3761, "step": 24900 }, { "epoch": 21.59, "learning_rate": 2.2938461538461537e-06, "loss": 0.3773, "step": 24910 }, { "epoch": 21.59, "learning_rate": 2.293146853146853e-06, "loss": 0.3891, "step": 24920 }, { "epoch": 21.6, "learning_rate": 2.2924475524475523e-06, "loss": 0.3779, "step": 24930 }, { "epoch": 21.61, "learning_rate": 2.2917482517482518e-06, "loss": 0.4076, "step": 24940 }, { "epoch": 21.62, "learning_rate": 2.291048951048951e-06, "loss": 0.4118, "step": 24950 }, { "epoch": 21.63, "learning_rate": 2.2903496503496503e-06, "loss": 0.3887, "step": 24960 }, { "epoch": 21.64, "learning_rate": 2.2896503496503494e-06, "loss": 0.3366, "step": 24970 }, { "epoch": 21.65, "learning_rate": 2.288951048951049e-06, "loss": 0.3912, "step": 24980 }, { "epoch": 21.65, "learning_rate": 2.2882517482517484e-06, "loss": 0.3827, "step": 24990 }, { "epoch": 21.66, "learning_rate": 2.287552447552447e-06, "loss": 0.3377, "step": 25000 }, { "epoch": 21.67, "learning_rate": 2.2868531468531466e-06, "loss": 0.3491, "step": 25010 }, { "epoch": 21.68, "learning_rate": 2.286153846153846e-06, "loss": 0.3245, "step": 25020 }, { "epoch": 21.69, "learning_rate": 2.2854545454545456e-06, "loss": 0.4169, "step": 25030 }, { "epoch": 21.7, "learning_rate": 2.2847552447552446e-06, "loss": 0.4224, "step": 25040 }, { "epoch": 21.71, "learning_rate": 2.284055944055944e-06, "loss": 0.3476, "step": 25050 }, { "epoch": 21.72, "learning_rate": 2.283356643356643e-06, "loss": 0.4036, "step": 25060 }, { "epoch": 21.72, "learning_rate": 2.2826573426573423e-06, "loss": 0.3634, "step": 25070 }, { "epoch": 21.73, "learning_rate": 2.2819580419580418e-06, "loss": 0.3939, "step": 25080 }, { "epoch": 21.74, "learning_rate": 2.2812587412587413e-06, "loss": 0.3464, "step": 25090 }, { "epoch": 21.75, "learning_rate": 2.2805594405594408e-06, "loss": 0.3893, "step": 25100 }, { "epoch": 21.76, "learning_rate": 2.2798601398601394e-06, "loss": 0.3855, "step": 25110 }, { "epoch": 21.77, "learning_rate": 2.279160839160839e-06, "loss": 0.4167, "step": 25120 }, { "epoch": 21.78, "learning_rate": 2.2784615384615384e-06, "loss": 0.3836, "step": 25130 }, { "epoch": 21.78, "learning_rate": 2.277762237762238e-06, "loss": 0.3105, "step": 25140 }, { "epoch": 21.79, "learning_rate": 2.277062937062937e-06, "loss": 0.3964, "step": 25150 }, { "epoch": 21.8, "learning_rate": 2.276363636363636e-06, "loss": 0.3568, "step": 25160 }, { "epoch": 21.81, "learning_rate": 2.2756643356643355e-06, "loss": 0.3838, "step": 25170 }, { "epoch": 21.82, "learning_rate": 2.2749650349650346e-06, "loss": 0.3986, "step": 25180 }, { "epoch": 21.83, "learning_rate": 2.274265734265734e-06, "loss": 0.382, "step": 25190 }, { "epoch": 21.84, "learning_rate": 2.2735664335664336e-06, "loss": 0.448, "step": 25200 }, { "epoch": 21.85, "learning_rate": 2.272867132867133e-06, "loss": 0.3933, "step": 25210 }, { "epoch": 21.85, "learning_rate": 2.2721678321678318e-06, "loss": 0.4001, "step": 25220 }, { "epoch": 21.86, "learning_rate": 2.2714685314685313e-06, "loss": 0.3441, "step": 25230 }, { "epoch": 21.87, "learning_rate": 2.2707692307692308e-06, "loss": 0.3799, "step": 25240 }, { "epoch": 21.88, "learning_rate": 2.27006993006993e-06, "loss": 0.3925, "step": 25250 }, { "epoch": 21.89, "learning_rate": 2.2693706293706293e-06, "loss": 0.3734, "step": 25260 }, { "epoch": 21.9, "learning_rate": 2.2687412587412584e-06, "loss": 0.4445, "step": 25270 }, { "epoch": 21.91, "learning_rate": 2.268041958041958e-06, "loss": 0.3718, "step": 25280 }, { "epoch": 21.91, "learning_rate": 2.2673426573426574e-06, "loss": 0.4257, "step": 25290 }, { "epoch": 21.92, "learning_rate": 2.266643356643357e-06, "loss": 0.3629, "step": 25300 }, { "epoch": 21.93, "learning_rate": 2.2659440559440555e-06, "loss": 0.345, "step": 25310 }, { "epoch": 21.94, "learning_rate": 2.265244755244755e-06, "loss": 0.424, "step": 25320 }, { "epoch": 21.95, "learning_rate": 2.2645454545454545e-06, "loss": 0.4096, "step": 25330 }, { "epoch": 21.96, "learning_rate": 2.263846153846154e-06, "loss": 0.3915, "step": 25340 }, { "epoch": 21.97, "learning_rate": 2.263146853146853e-06, "loss": 0.4156, "step": 25350 }, { "epoch": 21.98, "learning_rate": 2.2624475524475526e-06, "loss": 0.4044, "step": 25360 }, { "epoch": 21.98, "learning_rate": 2.2617482517482516e-06, "loss": 0.3756, "step": 25370 }, { "epoch": 21.99, "learning_rate": 2.2610489510489507e-06, "loss": 0.4993, "step": 25380 }, { "epoch": 22.0, "eval_loss": 0.55206298828125, "eval_runtime": 133.6827, "eval_samples_per_second": 3.98, "eval_steps_per_second": 1.99, "eval_wer": 0.2529407983544385, "step": 25388 }, { "epoch": 22.0, "learning_rate": 2.2603496503496502e-06, "loss": 0.4081, "step": 25390 }, { "epoch": 22.01, "learning_rate": 2.2596503496503497e-06, "loss": 0.3995, "step": 25400 }, { "epoch": 22.02, "learning_rate": 2.258951048951049e-06, "loss": 0.3564, "step": 25410 }, { "epoch": 22.03, "learning_rate": 2.258251748251748e-06, "loss": 0.39, "step": 25420 }, { "epoch": 22.04, "learning_rate": 2.2575524475524474e-06, "loss": 0.3942, "step": 25430 }, { "epoch": 22.05, "learning_rate": 2.256853146853147e-06, "loss": 0.3723, "step": 25440 }, { "epoch": 22.05, "learning_rate": 2.256153846153846e-06, "loss": 0.4172, "step": 25450 }, { "epoch": 22.06, "learning_rate": 2.2554545454545454e-06, "loss": 0.4109, "step": 25460 }, { "epoch": 22.07, "learning_rate": 2.2547552447552445e-06, "loss": 0.3592, "step": 25470 }, { "epoch": 22.08, "learning_rate": 2.254055944055944e-06, "loss": 0.3938, "step": 25480 }, { "epoch": 22.09, "learning_rate": 2.253356643356643e-06, "loss": 0.4014, "step": 25490 }, { "epoch": 22.1, "learning_rate": 2.2526573426573426e-06, "loss": 0.358, "step": 25500 }, { "epoch": 22.11, "learning_rate": 2.251958041958042e-06, "loss": 0.3604, "step": 25510 }, { "epoch": 22.11, "learning_rate": 2.2512587412587416e-06, "loss": 0.3497, "step": 25520 }, { "epoch": 22.12, "learning_rate": 2.25055944055944e-06, "loss": 0.3939, "step": 25530 }, { "epoch": 22.13, "learning_rate": 2.2499300699300697e-06, "loss": 0.4107, "step": 25540 }, { "epoch": 22.14, "learning_rate": 2.249230769230769e-06, "loss": 0.3557, "step": 25550 }, { "epoch": 22.15, "learning_rate": 2.2485314685314687e-06, "loss": 0.3858, "step": 25560 }, { "epoch": 22.16, "learning_rate": 2.2478321678321677e-06, "loss": 0.3781, "step": 25570 }, { "epoch": 22.17, "learning_rate": 2.247132867132867e-06, "loss": 0.386, "step": 25580 }, { "epoch": 22.17, "learning_rate": 2.2464335664335663e-06, "loss": 0.3992, "step": 25590 }, { "epoch": 22.18, "learning_rate": 2.245734265734266e-06, "loss": 0.3983, "step": 25600 }, { "epoch": 22.19, "learning_rate": 2.2450349650349653e-06, "loss": 0.3997, "step": 25610 }, { "epoch": 22.2, "learning_rate": 2.244335664335664e-06, "loss": 0.4447, "step": 25620 }, { "epoch": 22.21, "learning_rate": 2.2436363636363634e-06, "loss": 0.3922, "step": 25630 }, { "epoch": 22.22, "learning_rate": 2.242937062937063e-06, "loss": 0.381, "step": 25640 }, { "epoch": 22.23, "learning_rate": 2.242237762237762e-06, "loss": 0.4374, "step": 25650 }, { "epoch": 22.24, "learning_rate": 2.2415384615384615e-06, "loss": 0.4023, "step": 25660 }, { "epoch": 22.24, "learning_rate": 2.240839160839161e-06, "loss": 0.3713, "step": 25670 }, { "epoch": 22.25, "learning_rate": 2.24013986013986e-06, "loss": 0.389, "step": 25680 }, { "epoch": 22.26, "learning_rate": 2.239440559440559e-06, "loss": 0.4042, "step": 25690 }, { "epoch": 22.27, "learning_rate": 2.2387412587412587e-06, "loss": 0.3508, "step": 25700 }, { "epoch": 22.28, "learning_rate": 2.238041958041958e-06, "loss": 0.4081, "step": 25710 }, { "epoch": 22.29, "learning_rate": 2.2373426573426572e-06, "loss": 0.3937, "step": 25720 }, { "epoch": 22.3, "learning_rate": 2.2366433566433563e-06, "loss": 0.4126, "step": 25730 }, { "epoch": 22.3, "learning_rate": 2.235944055944056e-06, "loss": 0.3849, "step": 25740 }, { "epoch": 22.31, "learning_rate": 2.2352447552447553e-06, "loss": 0.3666, "step": 25750 }, { "epoch": 22.32, "learning_rate": 2.2345454545454544e-06, "loss": 0.3968, "step": 25760 }, { "epoch": 22.33, "learning_rate": 2.233846153846154e-06, "loss": 0.3478, "step": 25770 }, { "epoch": 22.34, "learning_rate": 2.233146853146853e-06, "loss": 0.4305, "step": 25780 }, { "epoch": 22.35, "learning_rate": 2.2324475524475524e-06, "loss": 0.3786, "step": 25790 }, { "epoch": 22.36, "learning_rate": 2.2317482517482515e-06, "loss": 0.3271, "step": 25800 }, { "epoch": 22.37, "learning_rate": 2.231048951048951e-06, "loss": 0.3788, "step": 25810 }, { "epoch": 22.37, "learning_rate": 2.2303496503496505e-06, "loss": 0.3743, "step": 25820 }, { "epoch": 22.38, "learning_rate": 2.2296503496503496e-06, "loss": 0.4284, "step": 25830 }, { "epoch": 22.39, "learning_rate": 2.2289510489510486e-06, "loss": 0.4357, "step": 25840 }, { "epoch": 22.4, "learning_rate": 2.228251748251748e-06, "loss": 0.3475, "step": 25850 }, { "epoch": 22.41, "learning_rate": 2.2275524475524476e-06, "loss": 0.2906, "step": 25860 }, { "epoch": 22.42, "learning_rate": 2.2268531468531467e-06, "loss": 0.3724, "step": 25870 }, { "epoch": 22.43, "learning_rate": 2.226153846153846e-06, "loss": 0.3659, "step": 25880 }, { "epoch": 22.43, "learning_rate": 2.2254545454545453e-06, "loss": 0.374, "step": 25890 }, { "epoch": 22.44, "learning_rate": 2.2247552447552444e-06, "loss": 0.3879, "step": 25900 }, { "epoch": 22.45, "learning_rate": 2.224055944055944e-06, "loss": 0.3066, "step": 25910 }, { "epoch": 22.46, "learning_rate": 2.2233566433566434e-06, "loss": 0.3119, "step": 25920 }, { "epoch": 22.47, "learning_rate": 2.222657342657343e-06, "loss": 0.4196, "step": 25930 }, { "epoch": 22.48, "learning_rate": 2.2219580419580415e-06, "loss": 0.3935, "step": 25940 }, { "epoch": 22.49, "learning_rate": 2.221258741258741e-06, "loss": 0.363, "step": 25950 }, { "epoch": 22.5, "learning_rate": 2.2205594405594405e-06, "loss": 0.4021, "step": 25960 }, { "epoch": 22.5, "learning_rate": 2.21986013986014e-06, "loss": 0.3808, "step": 25970 }, { "epoch": 22.51, "learning_rate": 2.219160839160839e-06, "loss": 0.4058, "step": 25980 }, { "epoch": 22.52, "learning_rate": 2.2184615384615386e-06, "loss": 0.3699, "step": 25990 }, { "epoch": 22.53, "learning_rate": 2.2177622377622376e-06, "loss": 0.3609, "step": 26000 }, { "epoch": 22.54, "learning_rate": 2.2170629370629367e-06, "loss": 0.3769, "step": 26010 }, { "epoch": 22.55, "learning_rate": 2.216363636363636e-06, "loss": 0.3697, "step": 26020 }, { "epoch": 22.56, "learning_rate": 2.2156643356643357e-06, "loss": 0.4068, "step": 26030 }, { "epoch": 22.56, "learning_rate": 2.214965034965035e-06, "loss": 0.4025, "step": 26040 }, { "epoch": 22.57, "learning_rate": 2.214265734265734e-06, "loss": 0.4122, "step": 26050 }, { "epoch": 22.58, "learning_rate": 2.2135664335664333e-06, "loss": 0.3301, "step": 26060 }, { "epoch": 22.59, "learning_rate": 2.212867132867133e-06, "loss": 0.3911, "step": 26070 }, { "epoch": 22.6, "learning_rate": 2.212167832167832e-06, "loss": 0.3702, "step": 26080 }, { "epoch": 22.61, "learning_rate": 2.2114685314685314e-06, "loss": 0.4195, "step": 26090 }, { "epoch": 22.62, "learning_rate": 2.210769230769231e-06, "loss": 0.418, "step": 26100 }, { "epoch": 22.63, "learning_rate": 2.21006993006993e-06, "loss": 0.3531, "step": 26110 }, { "epoch": 22.63, "learning_rate": 2.209370629370629e-06, "loss": 0.4043, "step": 26120 }, { "epoch": 22.64, "learning_rate": 2.2086713286713286e-06, "loss": 0.3328, "step": 26130 }, { "epoch": 22.65, "learning_rate": 2.207972027972028e-06, "loss": 0.328, "step": 26140 }, { "epoch": 22.66, "learning_rate": 2.207272727272727e-06, "loss": 0.4128, "step": 26150 }, { "epoch": 22.67, "learning_rate": 2.206573426573426e-06, "loss": 0.3926, "step": 26160 }, { "epoch": 22.68, "learning_rate": 2.2058741258741257e-06, "loss": 0.3639, "step": 26170 }, { "epoch": 22.69, "learning_rate": 2.205174825174825e-06, "loss": 0.3715, "step": 26180 }, { "epoch": 22.69, "learning_rate": 2.2044755244755243e-06, "loss": 0.3521, "step": 26190 }, { "epoch": 22.7, "learning_rate": 2.2037762237762238e-06, "loss": 0.3788, "step": 26200 }, { "epoch": 22.71, "learning_rate": 2.2030769230769233e-06, "loss": 0.3915, "step": 26210 }, { "epoch": 22.72, "learning_rate": 2.2023776223776223e-06, "loss": 0.3423, "step": 26220 }, { "epoch": 22.73, "learning_rate": 2.2016783216783214e-06, "loss": 0.373, "step": 26230 }, { "epoch": 22.74, "learning_rate": 2.200979020979021e-06, "loss": 0.3901, "step": 26240 }, { "epoch": 22.75, "learning_rate": 2.2002797202797204e-06, "loss": 0.4118, "step": 26250 }, { "epoch": 22.76, "learning_rate": 2.1995804195804195e-06, "loss": 0.3516, "step": 26260 }, { "epoch": 22.76, "learning_rate": 2.1988811188811185e-06, "loss": 0.3985, "step": 26270 }, { "epoch": 22.77, "learning_rate": 2.198181818181818e-06, "loss": 0.3818, "step": 26280 }, { "epoch": 22.78, "learning_rate": 2.1974825174825175e-06, "loss": 0.4288, "step": 26290 }, { "epoch": 22.79, "learning_rate": 2.1967832167832166e-06, "loss": 0.3869, "step": 26300 }, { "epoch": 22.8, "learning_rate": 2.196083916083916e-06, "loss": 0.363, "step": 26310 }, { "epoch": 22.81, "learning_rate": 2.195384615384615e-06, "loss": 0.383, "step": 26320 }, { "epoch": 22.82, "learning_rate": 2.1946853146853143e-06, "loss": 0.3899, "step": 26330 }, { "epoch": 22.82, "learning_rate": 2.1939860139860138e-06, "loss": 0.3354, "step": 26340 }, { "epoch": 22.83, "learning_rate": 2.1932867132867132e-06, "loss": 0.3557, "step": 26350 }, { "epoch": 22.84, "learning_rate": 2.1925874125874127e-06, "loss": 0.4285, "step": 26360 }, { "epoch": 22.85, "learning_rate": 2.191888111888112e-06, "loss": 0.373, "step": 26370 }, { "epoch": 22.86, "learning_rate": 2.191188811188811e-06, "loss": 0.3531, "step": 26380 }, { "epoch": 22.87, "learning_rate": 2.1904895104895104e-06, "loss": 0.3789, "step": 26390 }, { "epoch": 22.88, "learning_rate": 2.18979020979021e-06, "loss": 0.3444, "step": 26400 }, { "epoch": 22.89, "learning_rate": 2.189090909090909e-06, "loss": 0.3703, "step": 26410 }, { "epoch": 22.89, "learning_rate": 2.1883916083916085e-06, "loss": 0.3799, "step": 26420 }, { "epoch": 22.9, "learning_rate": 2.1876923076923075e-06, "loss": 0.3731, "step": 26430 }, { "epoch": 22.91, "learning_rate": 2.1869930069930066e-06, "loss": 0.428, "step": 26440 }, { "epoch": 22.92, "learning_rate": 2.186293706293706e-06, "loss": 0.3845, "step": 26450 }, { "epoch": 22.93, "learning_rate": 2.1855944055944056e-06, "loss": 0.3844, "step": 26460 }, { "epoch": 22.94, "learning_rate": 2.184895104895105e-06, "loss": 0.3658, "step": 26470 }, { "epoch": 22.95, "learning_rate": 2.184195804195804e-06, "loss": 0.3885, "step": 26480 }, { "epoch": 22.95, "learning_rate": 2.1834965034965032e-06, "loss": 0.3828, "step": 26490 }, { "epoch": 22.96, "learning_rate": 2.1827972027972027e-06, "loss": 0.4448, "step": 26500 }, { "epoch": 22.97, "learning_rate": 2.182097902097902e-06, "loss": 0.351, "step": 26510 }, { "epoch": 22.98, "learning_rate": 2.1813986013986013e-06, "loss": 0.3683, "step": 26520 }, { "epoch": 22.99, "learning_rate": 2.180699300699301e-06, "loss": 0.3684, "step": 26530 }, { "epoch": 23.0, "learning_rate": 2.18e-06, "loss": 0.4006, "step": 26540 }, { "epoch": 23.0, "eval_loss": 0.5390881299972534, "eval_runtime": 135.1116, "eval_samples_per_second": 3.937, "eval_steps_per_second": 1.969, "eval_wer": 0.2539692742816738, "step": 26542 }, { "epoch": 23.01, "learning_rate": 2.179300699300699e-06, "loss": 0.4004, "step": 26550 }, { "epoch": 23.02, "learning_rate": 2.1786013986013985e-06, "loss": 0.3702, "step": 26560 }, { "epoch": 23.02, "learning_rate": 2.177902097902098e-06, "loss": 0.3652, "step": 26570 }, { "epoch": 23.03, "learning_rate": 2.1772027972027974e-06, "loss": 0.3967, "step": 26580 }, { "epoch": 23.04, "learning_rate": 2.176503496503496e-06, "loss": 0.4196, "step": 26590 }, { "epoch": 23.05, "learning_rate": 2.1758041958041956e-06, "loss": 0.3222, "step": 26600 }, { "epoch": 23.06, "learning_rate": 2.175104895104895e-06, "loss": 0.4268, "step": 26610 }, { "epoch": 23.07, "learning_rate": 2.174405594405594e-06, "loss": 0.3838, "step": 26620 }, { "epoch": 23.08, "learning_rate": 2.1737062937062937e-06, "loss": 0.3729, "step": 26630 }, { "epoch": 23.08, "learning_rate": 2.173006993006993e-06, "loss": 0.3547, "step": 26640 }, { "epoch": 23.09, "learning_rate": 2.1723076923076922e-06, "loss": 0.3471, "step": 26650 }, { "epoch": 23.1, "learning_rate": 2.1716083916083913e-06, "loss": 0.3904, "step": 26660 }, { "epoch": 23.11, "learning_rate": 2.170909090909091e-06, "loss": 0.3874, "step": 26670 }, { "epoch": 23.12, "learning_rate": 2.1702097902097903e-06, "loss": 0.4084, "step": 26680 }, { "epoch": 23.13, "learning_rate": 2.1695104895104894e-06, "loss": 0.4002, "step": 26690 }, { "epoch": 23.14, "learning_rate": 2.1688111888111884e-06, "loss": 0.376, "step": 26700 }, { "epoch": 23.15, "learning_rate": 2.168111888111888e-06, "loss": 0.3864, "step": 26710 }, { "epoch": 23.15, "learning_rate": 2.1674125874125874e-06, "loss": 0.319, "step": 26720 }, { "epoch": 23.16, "learning_rate": 2.1667132867132865e-06, "loss": 0.4121, "step": 26730 }, { "epoch": 23.17, "learning_rate": 2.166013986013986e-06, "loss": 0.4444, "step": 26740 }, { "epoch": 23.18, "learning_rate": 2.1653146853146855e-06, "loss": 0.3773, "step": 26750 }, { "epoch": 23.19, "learning_rate": 2.1646153846153846e-06, "loss": 0.392, "step": 26760 }, { "epoch": 23.2, "learning_rate": 2.1639160839160837e-06, "loss": 0.4112, "step": 26770 }, { "epoch": 23.21, "learning_rate": 2.163216783216783e-06, "loss": 0.355, "step": 26780 }, { "epoch": 23.21, "learning_rate": 2.1625174825174826e-06, "loss": 0.4104, "step": 26790 }, { "epoch": 23.22, "learning_rate": 2.1618181818181817e-06, "loss": 0.387, "step": 26800 }, { "epoch": 23.23, "learning_rate": 2.161118881118881e-06, "loss": 0.3586, "step": 26810 }, { "epoch": 23.24, "learning_rate": 2.1604195804195803e-06, "loss": 0.3314, "step": 26820 }, { "epoch": 23.25, "learning_rate": 2.1597202797202798e-06, "loss": 0.3541, "step": 26830 }, { "epoch": 23.26, "learning_rate": 2.159020979020979e-06, "loss": 0.3251, "step": 26840 }, { "epoch": 23.27, "learning_rate": 2.1583216783216784e-06, "loss": 0.3827, "step": 26850 }, { "epoch": 23.28, "learning_rate": 2.157622377622378e-06, "loss": 0.3847, "step": 26860 }, { "epoch": 23.28, "learning_rate": 2.1569230769230765e-06, "loss": 0.3511, "step": 26870 }, { "epoch": 23.29, "learning_rate": 2.156223776223776e-06, "loss": 0.3836, "step": 26880 }, { "epoch": 23.3, "learning_rate": 2.1555244755244755e-06, "loss": 0.4105, "step": 26890 }, { "epoch": 23.31, "learning_rate": 2.154825174825175e-06, "loss": 0.389, "step": 26900 }, { "epoch": 23.32, "learning_rate": 2.154125874125874e-06, "loss": 0.4224, "step": 26910 }, { "epoch": 23.33, "learning_rate": 2.153426573426573e-06, "loss": 0.3815, "step": 26920 }, { "epoch": 23.34, "learning_rate": 2.1527272727272726e-06, "loss": 0.4167, "step": 26930 }, { "epoch": 23.34, "learning_rate": 2.152027972027972e-06, "loss": 0.3705, "step": 26940 }, { "epoch": 23.35, "learning_rate": 2.151328671328671e-06, "loss": 0.3442, "step": 26950 }, { "epoch": 23.36, "learning_rate": 2.1506293706293707e-06, "loss": 0.3981, "step": 26960 }, { "epoch": 23.37, "learning_rate": 2.1499300699300698e-06, "loss": 0.3808, "step": 26970 }, { "epoch": 23.38, "learning_rate": 2.149230769230769e-06, "loss": 0.3783, "step": 26980 }, { "epoch": 23.39, "learning_rate": 2.1485314685314683e-06, "loss": 0.4623, "step": 26990 }, { "epoch": 23.4, "learning_rate": 2.147832167832168e-06, "loss": 0.4182, "step": 27000 }, { "epoch": 23.41, "learning_rate": 2.1471328671328673e-06, "loss": 0.3527, "step": 27010 }, { "epoch": 23.41, "learning_rate": 2.1464335664335664e-06, "loss": 0.439, "step": 27020 }, { "epoch": 23.42, "learning_rate": 2.1457342657342655e-06, "loss": 0.3807, "step": 27030 }, { "epoch": 23.43, "learning_rate": 2.145034965034965e-06, "loss": 0.4682, "step": 27040 }, { "epoch": 23.44, "learning_rate": 2.144335664335664e-06, "loss": 0.3696, "step": 27050 }, { "epoch": 23.45, "learning_rate": 2.1436363636363636e-06, "loss": 0.4157, "step": 27060 }, { "epoch": 23.46, "learning_rate": 2.142937062937063e-06, "loss": 0.36, "step": 27070 }, { "epoch": 23.47, "learning_rate": 2.142237762237762e-06, "loss": 0.4192, "step": 27080 }, { "epoch": 23.47, "learning_rate": 2.141538461538461e-06, "loss": 0.3983, "step": 27090 }, { "epoch": 23.48, "learning_rate": 2.1408391608391607e-06, "loss": 0.376, "step": 27100 }, { "epoch": 23.49, "learning_rate": 2.14013986013986e-06, "loss": 0.3796, "step": 27110 }, { "epoch": 23.5, "learning_rate": 2.1394405594405593e-06, "loss": 0.3944, "step": 27120 }, { "epoch": 23.51, "learning_rate": 2.1387412587412583e-06, "loss": 0.3578, "step": 27130 }, { "epoch": 23.52, "learning_rate": 2.138041958041958e-06, "loss": 0.4543, "step": 27140 }, { "epoch": 23.53, "learning_rate": 2.1373426573426573e-06, "loss": 0.3819, "step": 27150 }, { "epoch": 23.54, "learning_rate": 2.1366433566433564e-06, "loss": 0.4166, "step": 27160 }, { "epoch": 23.54, "learning_rate": 2.135944055944056e-06, "loss": 0.3704, "step": 27170 }, { "epoch": 23.55, "learning_rate": 2.1352447552447554e-06, "loss": 0.4091, "step": 27180 }, { "epoch": 23.56, "learning_rate": 2.1345454545454545e-06, "loss": 0.4358, "step": 27190 }, { "epoch": 23.57, "learning_rate": 2.1338461538461535e-06, "loss": 0.376, "step": 27200 }, { "epoch": 23.58, "learning_rate": 2.133146853146853e-06, "loss": 0.3762, "step": 27210 }, { "epoch": 23.59, "learning_rate": 2.1324475524475525e-06, "loss": 0.3738, "step": 27220 }, { "epoch": 23.6, "learning_rate": 2.1317482517482516e-06, "loss": 0.4496, "step": 27230 }, { "epoch": 23.6, "learning_rate": 2.1310489510489507e-06, "loss": 0.3792, "step": 27240 }, { "epoch": 23.61, "learning_rate": 2.13034965034965e-06, "loss": 0.3751, "step": 27250 }, { "epoch": 23.62, "learning_rate": 2.1296503496503497e-06, "loss": 0.3919, "step": 27260 }, { "epoch": 23.63, "learning_rate": 2.1289510489510488e-06, "loss": 0.3704, "step": 27270 }, { "epoch": 23.64, "learning_rate": 2.1282517482517483e-06, "loss": 0.4081, "step": 27280 }, { "epoch": 23.65, "learning_rate": 2.1275524475524478e-06, "loss": 0.4452, "step": 27290 }, { "epoch": 23.66, "learning_rate": 2.1268531468531464e-06, "loss": 0.431, "step": 27300 }, { "epoch": 23.67, "learning_rate": 2.126153846153846e-06, "loss": 0.3536, "step": 27310 }, { "epoch": 23.67, "learning_rate": 2.1254545454545454e-06, "loss": 0.4114, "step": 27320 }, { "epoch": 23.68, "learning_rate": 2.124755244755245e-06, "loss": 0.3842, "step": 27330 }, { "epoch": 23.69, "learning_rate": 2.124055944055944e-06, "loss": 0.353, "step": 27340 }, { "epoch": 23.7, "learning_rate": 2.123356643356643e-06, "loss": 0.4224, "step": 27350 }, { "epoch": 23.71, "learning_rate": 2.1226573426573425e-06, "loss": 0.3435, "step": 27360 }, { "epoch": 23.72, "learning_rate": 2.121958041958042e-06, "loss": 0.3487, "step": 27370 }, { "epoch": 23.73, "learning_rate": 2.121258741258741e-06, "loss": 0.3942, "step": 27380 }, { "epoch": 23.73, "learning_rate": 2.1205594405594406e-06, "loss": 0.3632, "step": 27390 }, { "epoch": 23.74, "learning_rate": 2.11986013986014e-06, "loss": 0.382, "step": 27400 }, { "epoch": 23.75, "learning_rate": 2.1191608391608387e-06, "loss": 0.3673, "step": 27410 }, { "epoch": 23.76, "learning_rate": 2.1184615384615382e-06, "loss": 0.3575, "step": 27420 }, { "epoch": 23.77, "learning_rate": 2.1177622377622377e-06, "loss": 0.419, "step": 27430 }, { "epoch": 23.78, "learning_rate": 2.1170629370629372e-06, "loss": 0.3871, "step": 27440 }, { "epoch": 23.79, "learning_rate": 2.1163636363636363e-06, "loss": 0.3454, "step": 27450 }, { "epoch": 23.8, "learning_rate": 2.1156643356643354e-06, "loss": 0.334, "step": 27460 }, { "epoch": 23.8, "learning_rate": 2.114965034965035e-06, "loss": 0.3547, "step": 27470 }, { "epoch": 23.81, "learning_rate": 2.114265734265734e-06, "loss": 0.3734, "step": 27480 }, { "epoch": 23.82, "learning_rate": 2.1135664335664335e-06, "loss": 0.4145, "step": 27490 }, { "epoch": 23.83, "learning_rate": 2.112867132867133e-06, "loss": 0.4302, "step": 27500 }, { "epoch": 23.84, "learning_rate": 2.112167832167832e-06, "loss": 0.3534, "step": 27510 }, { "epoch": 23.85, "learning_rate": 2.111468531468531e-06, "loss": 0.3707, "step": 27520 }, { "epoch": 23.86, "learning_rate": 2.1107692307692306e-06, "loss": 0.4046, "step": 27530 }, { "epoch": 23.86, "learning_rate": 2.11006993006993e-06, "loss": 0.3533, "step": 27540 }, { "epoch": 23.87, "learning_rate": 2.1093706293706296e-06, "loss": 0.3866, "step": 27550 }, { "epoch": 23.88, "learning_rate": 2.1086713286713287e-06, "loss": 0.3552, "step": 27560 }, { "epoch": 23.89, "learning_rate": 2.1079720279720277e-06, "loss": 0.3502, "step": 27570 }, { "epoch": 23.9, "learning_rate": 2.1072727272727272e-06, "loss": 0.3573, "step": 27580 }, { "epoch": 23.91, "learning_rate": 2.1065734265734263e-06, "loss": 0.3815, "step": 27590 }, { "epoch": 23.92, "learning_rate": 2.105874125874126e-06, "loss": 0.3983, "step": 27600 }, { "epoch": 23.93, "learning_rate": 2.1051748251748253e-06, "loss": 0.3672, "step": 27610 }, { "epoch": 23.93, "learning_rate": 2.1044755244755244e-06, "loss": 0.3297, "step": 27620 }, { "epoch": 23.94, "learning_rate": 2.1037762237762234e-06, "loss": 0.4176, "step": 27630 }, { "epoch": 23.95, "learning_rate": 2.103076923076923e-06, "loss": 0.4519, "step": 27640 }, { "epoch": 23.96, "learning_rate": 2.1023776223776224e-06, "loss": 0.3794, "step": 27650 }, { "epoch": 23.97, "learning_rate": 2.1016783216783215e-06, "loss": 0.3804, "step": 27660 }, { "epoch": 23.98, "learning_rate": 2.1009790209790206e-06, "loss": 0.3239, "step": 27670 }, { "epoch": 23.99, "learning_rate": 2.10027972027972e-06, "loss": 0.3851, "step": 27680 }, { "epoch": 23.99, "learning_rate": 2.0995804195804196e-06, "loss": 0.3415, "step": 27690 }, { "epoch": 24.0, "eval_loss": 0.5621957182884216, "eval_runtime": 135.5763, "eval_samples_per_second": 3.924, "eval_steps_per_second": 1.962, "eval_wer": 0.250305328790898, "step": 27696 }, { "epoch": 24.0, "learning_rate": 2.0988811188811187e-06, "loss": 0.3816, "step": 27700 }, { "epoch": 24.01, "learning_rate": 2.098181818181818e-06, "loss": 0.4067, "step": 27710 }, { "epoch": 24.02, "learning_rate": 2.0974825174825176e-06, "loss": 0.3512, "step": 27720 }, { "epoch": 24.03, "learning_rate": 2.0967832167832167e-06, "loss": 0.368, "step": 27730 }, { "epoch": 24.04, "learning_rate": 2.096083916083916e-06, "loss": 0.4063, "step": 27740 }, { "epoch": 24.05, "learning_rate": 2.0953846153846153e-06, "loss": 0.3105, "step": 27750 }, { "epoch": 24.06, "learning_rate": 2.0947552447552448e-06, "loss": 0.3747, "step": 27760 }, { "epoch": 24.06, "learning_rate": 2.094055944055944e-06, "loss": 0.3939, "step": 27770 }, { "epoch": 24.07, "learning_rate": 2.0933566433566433e-06, "loss": 0.3713, "step": 27780 }, { "epoch": 24.08, "learning_rate": 2.0926573426573424e-06, "loss": 0.3839, "step": 27790 }, { "epoch": 24.09, "learning_rate": 2.091958041958042e-06, "loss": 0.3202, "step": 27800 }, { "epoch": 24.1, "learning_rate": 2.0912587412587414e-06, "loss": 0.3735, "step": 27810 }, { "epoch": 24.11, "learning_rate": 2.0905594405594405e-06, "loss": 0.3817, "step": 27820 }, { "epoch": 24.12, "learning_rate": 2.0898601398601395e-06, "loss": 0.388, "step": 27830 }, { "epoch": 24.12, "learning_rate": 2.089160839160839e-06, "loss": 0.3489, "step": 27840 }, { "epoch": 24.13, "learning_rate": 2.0884615384615385e-06, "loss": 0.3306, "step": 27850 }, { "epoch": 24.14, "learning_rate": 2.0877622377622376e-06, "loss": 0.358, "step": 27860 }, { "epoch": 24.15, "learning_rate": 2.087062937062937e-06, "loss": 0.395, "step": 27870 }, { "epoch": 24.16, "learning_rate": 2.086363636363636e-06, "loss": 0.419, "step": 27880 }, { "epoch": 24.17, "learning_rate": 2.0856643356643357e-06, "loss": 0.3394, "step": 27890 }, { "epoch": 24.18, "learning_rate": 2.0849650349650347e-06, "loss": 0.3663, "step": 27900 }, { "epoch": 24.19, "learning_rate": 2.0842657342657342e-06, "loss": 0.3996, "step": 27910 }, { "epoch": 24.19, "learning_rate": 2.0835664335664337e-06, "loss": 0.359, "step": 27920 }, { "epoch": 24.2, "learning_rate": 2.0828671328671324e-06, "loss": 0.4252, "step": 27930 }, { "epoch": 24.21, "learning_rate": 2.082167832167832e-06, "loss": 0.3889, "step": 27940 }, { "epoch": 24.22, "learning_rate": 2.0814685314685314e-06, "loss": 0.3811, "step": 27950 }, { "epoch": 24.23, "learning_rate": 2.080769230769231e-06, "loss": 0.3844, "step": 27960 }, { "epoch": 24.24, "learning_rate": 2.08006993006993e-06, "loss": 0.3364, "step": 27970 }, { "epoch": 24.25, "learning_rate": 2.079370629370629e-06, "loss": 0.4162, "step": 27980 }, { "epoch": 24.25, "learning_rate": 2.0786713286713285e-06, "loss": 0.4423, "step": 27990 }, { "epoch": 24.26, "learning_rate": 2.077972027972028e-06, "loss": 0.3822, "step": 28000 }, { "epoch": 24.27, "learning_rate": 2.077272727272727e-06, "loss": 0.3784, "step": 28010 }, { "epoch": 24.28, "learning_rate": 2.0765734265734266e-06, "loss": 0.3552, "step": 28020 }, { "epoch": 24.29, "learning_rate": 2.075874125874126e-06, "loss": 0.3577, "step": 28030 }, { "epoch": 24.3, "learning_rate": 2.0751748251748247e-06, "loss": 0.3526, "step": 28040 }, { "epoch": 24.31, "learning_rate": 2.0744755244755242e-06, "loss": 0.4053, "step": 28050 }, { "epoch": 24.32, "learning_rate": 2.0737762237762237e-06, "loss": 0.3904, "step": 28060 }, { "epoch": 24.32, "learning_rate": 2.0730769230769232e-06, "loss": 0.4229, "step": 28070 }, { "epoch": 24.33, "learning_rate": 2.0723776223776223e-06, "loss": 0.3946, "step": 28080 }, { "epoch": 24.34, "learning_rate": 2.0716783216783214e-06, "loss": 0.4186, "step": 28090 }, { "epoch": 24.35, "learning_rate": 2.070979020979021e-06, "loss": 0.3745, "step": 28100 }, { "epoch": 24.36, "learning_rate": 2.07027972027972e-06, "loss": 0.3804, "step": 28110 }, { "epoch": 24.37, "learning_rate": 2.0695804195804194e-06, "loss": 0.3588, "step": 28120 }, { "epoch": 24.38, "learning_rate": 2.068881118881119e-06, "loss": 0.3584, "step": 28130 }, { "epoch": 24.38, "learning_rate": 2.0681818181818184e-06, "loss": 0.4453, "step": 28140 }, { "epoch": 24.39, "learning_rate": 2.067482517482517e-06, "loss": 0.3888, "step": 28150 }, { "epoch": 24.4, "learning_rate": 2.0667832167832166e-06, "loss": 0.4119, "step": 28160 }, { "epoch": 24.41, "learning_rate": 2.066083916083916e-06, "loss": 0.3672, "step": 28170 }, { "epoch": 24.42, "learning_rate": 2.0653846153846156e-06, "loss": 0.366, "step": 28180 }, { "epoch": 24.43, "learning_rate": 2.0646853146853147e-06, "loss": 0.4376, "step": 28190 }, { "epoch": 24.44, "learning_rate": 2.0639860139860137e-06, "loss": 0.3449, "step": 28200 }, { "epoch": 24.45, "learning_rate": 2.0632867132867132e-06, "loss": 0.3657, "step": 28210 }, { "epoch": 24.45, "learning_rate": 2.0625874125874123e-06, "loss": 0.369, "step": 28220 }, { "epoch": 24.46, "learning_rate": 2.061888111888112e-06, "loss": 0.3602, "step": 28230 }, { "epoch": 24.47, "learning_rate": 2.0611888111888113e-06, "loss": 0.4175, "step": 28240 }, { "epoch": 24.48, "learning_rate": 2.060489510489511e-06, "loss": 0.3883, "step": 28250 }, { "epoch": 24.49, "learning_rate": 2.0597902097902094e-06, "loss": 0.3688, "step": 28260 }, { "epoch": 24.5, "learning_rate": 2.059090909090909e-06, "loss": 0.4029, "step": 28270 }, { "epoch": 24.51, "learning_rate": 2.0583916083916084e-06, "loss": 0.3525, "step": 28280 }, { "epoch": 24.51, "learning_rate": 2.0576923076923075e-06, "loss": 0.3956, "step": 28290 }, { "epoch": 24.52, "learning_rate": 2.056993006993007e-06, "loss": 0.3645, "step": 28300 }, { "epoch": 24.53, "learning_rate": 2.056293706293706e-06, "loss": 0.3766, "step": 28310 }, { "epoch": 24.54, "learning_rate": 2.0555944055944056e-06, "loss": 0.3573, "step": 28320 }, { "epoch": 24.55, "learning_rate": 2.0548951048951046e-06, "loss": 0.4017, "step": 28330 }, { "epoch": 24.56, "learning_rate": 2.054195804195804e-06, "loss": 0.3781, "step": 28340 }, { "epoch": 24.57, "learning_rate": 2.0534965034965036e-06, "loss": 0.36, "step": 28350 }, { "epoch": 24.58, "learning_rate": 2.0527972027972027e-06, "loss": 0.3383, "step": 28360 }, { "epoch": 24.58, "learning_rate": 2.0520979020979018e-06, "loss": 0.4027, "step": 28370 }, { "epoch": 24.59, "learning_rate": 2.0513986013986013e-06, "loss": 0.3551, "step": 28380 }, { "epoch": 24.6, "learning_rate": 2.0506993006993008e-06, "loss": 0.3997, "step": 28390 }, { "epoch": 24.61, "learning_rate": 2.05e-06, "loss": 0.4885, "step": 28400 }, { "epoch": 24.62, "learning_rate": 2.0493006993006994e-06, "loss": 0.4051, "step": 28410 }, { "epoch": 24.63, "learning_rate": 2.0486013986013984e-06, "loss": 0.3174, "step": 28420 }, { "epoch": 24.64, "learning_rate": 2.047902097902098e-06, "loss": 0.3527, "step": 28430 }, { "epoch": 24.64, "learning_rate": 2.047202797202797e-06, "loss": 0.409, "step": 28440 }, { "epoch": 24.65, "learning_rate": 2.0465034965034965e-06, "loss": 0.3858, "step": 28450 }, { "epoch": 24.66, "learning_rate": 2.045804195804196e-06, "loss": 0.4063, "step": 28460 }, { "epoch": 24.67, "learning_rate": 2.0451048951048946e-06, "loss": 0.4017, "step": 28470 }, { "epoch": 24.68, "learning_rate": 2.044405594405594e-06, "loss": 0.3747, "step": 28480 }, { "epoch": 24.69, "learning_rate": 2.0437062937062936e-06, "loss": 0.3442, "step": 28490 }, { "epoch": 24.7, "learning_rate": 2.043006993006993e-06, "loss": 0.4353, "step": 28500 }, { "epoch": 24.71, "learning_rate": 2.042307692307692e-06, "loss": 0.3733, "step": 28510 }, { "epoch": 24.71, "learning_rate": 2.0416083916083917e-06, "loss": 0.3516, "step": 28520 }, { "epoch": 24.72, "learning_rate": 2.0409090909090908e-06, "loss": 0.3923, "step": 28530 }, { "epoch": 24.73, "learning_rate": 2.0402097902097903e-06, "loss": 0.3526, "step": 28540 }, { "epoch": 24.74, "learning_rate": 2.0395104895104893e-06, "loss": 0.3825, "step": 28550 }, { "epoch": 24.75, "learning_rate": 2.038811188811189e-06, "loss": 0.3442, "step": 28560 }, { "epoch": 24.76, "learning_rate": 2.0381118881118883e-06, "loss": 0.4184, "step": 28570 }, { "epoch": 24.77, "learning_rate": 2.037412587412587e-06, "loss": 0.3586, "step": 28580 }, { "epoch": 24.77, "learning_rate": 2.0367132867132865e-06, "loss": 0.361, "step": 28590 }, { "epoch": 24.78, "learning_rate": 2.036013986013986e-06, "loss": 0.3993, "step": 28600 }, { "epoch": 24.79, "learning_rate": 2.0353146853146855e-06, "loss": 0.392, "step": 28610 }, { "epoch": 24.8, "learning_rate": 2.0346153846153846e-06, "loss": 0.3895, "step": 28620 }, { "epoch": 24.81, "learning_rate": 2.0339160839160836e-06, "loss": 0.3679, "step": 28630 }, { "epoch": 24.82, "learning_rate": 2.033216783216783e-06, "loss": 0.3637, "step": 28640 }, { "epoch": 24.83, "learning_rate": 2.032517482517482e-06, "loss": 0.3761, "step": 28650 }, { "epoch": 24.83, "learning_rate": 2.0318181818181817e-06, "loss": 0.3866, "step": 28660 }, { "epoch": 24.84, "learning_rate": 2.031118881118881e-06, "loss": 0.4122, "step": 28670 }, { "epoch": 24.85, "learning_rate": 2.0304195804195807e-06, "loss": 0.3918, "step": 28680 }, { "epoch": 24.86, "learning_rate": 2.0297202797202793e-06, "loss": 0.3436, "step": 28690 }, { "epoch": 24.87, "learning_rate": 2.029020979020979e-06, "loss": 0.396, "step": 28700 }, { "epoch": 24.88, "learning_rate": 2.0283216783216783e-06, "loss": 0.3699, "step": 28710 }, { "epoch": 24.89, "learning_rate": 2.0276223776223774e-06, "loss": 0.3412, "step": 28720 }, { "epoch": 24.9, "learning_rate": 2.026923076923077e-06, "loss": 0.3594, "step": 28730 }, { "epoch": 24.9, "learning_rate": 2.026223776223776e-06, "loss": 0.4354, "step": 28740 }, { "epoch": 24.91, "learning_rate": 2.0255244755244755e-06, "loss": 0.3387, "step": 28750 }, { "epoch": 24.92, "learning_rate": 2.0248251748251745e-06, "loss": 0.3553, "step": 28760 }, { "epoch": 24.93, "learning_rate": 2.024125874125874e-06, "loss": 0.3067, "step": 28770 }, { "epoch": 24.94, "learning_rate": 2.0234265734265735e-06, "loss": 0.3769, "step": 28780 }, { "epoch": 24.95, "learning_rate": 2.022727272727273e-06, "loss": 0.4394, "step": 28790 }, { "epoch": 24.96, "learning_rate": 2.0220279720279717e-06, "loss": 0.4139, "step": 28800 }, { "epoch": 24.96, "learning_rate": 2.021328671328671e-06, "loss": 0.3479, "step": 28810 }, { "epoch": 24.97, "learning_rate": 2.0206293706293707e-06, "loss": 0.3557, "step": 28820 }, { "epoch": 24.98, "learning_rate": 2.0199300699300698e-06, "loss": 0.4021, "step": 28830 }, { "epoch": 24.99, "learning_rate": 2.0192307692307692e-06, "loss": 0.407, "step": 28840 }, { "epoch": 25.0, "learning_rate": 2.0185314685314683e-06, "loss": 0.3938, "step": 28850 }, { "epoch": 25.0, "eval_loss": 0.5533283352851868, "eval_runtime": 134.8549, "eval_samples_per_second": 3.945, "eval_steps_per_second": 1.972, "eval_wer": 0.2540978337725783, "step": 28850 }, { "epoch": 25.01, "learning_rate": 2.017832167832168e-06, "loss": 0.3985, "step": 28860 }, { "epoch": 25.02, "learning_rate": 2.017132867132867e-06, "loss": 0.3684, "step": 28870 }, { "epoch": 25.03, "learning_rate": 2.0164335664335664e-06, "loss": 0.3493, "step": 28880 }, { "epoch": 25.03, "learning_rate": 2.015734265734266e-06, "loss": 0.3979, "step": 28890 }, { "epoch": 25.04, "learning_rate": 2.0150349650349645e-06, "loss": 0.3724, "step": 28900 }, { "epoch": 25.05, "learning_rate": 2.014335664335664e-06, "loss": 0.3743, "step": 28910 }, { "epoch": 25.06, "learning_rate": 2.0136363636363635e-06, "loss": 0.3506, "step": 28920 }, { "epoch": 25.07, "learning_rate": 2.012937062937063e-06, "loss": 0.3633, "step": 28930 }, { "epoch": 25.08, "learning_rate": 2.012237762237762e-06, "loss": 0.3833, "step": 28940 }, { "epoch": 25.09, "learning_rate": 2.0115384615384616e-06, "loss": 0.3936, "step": 28950 }, { "epoch": 25.1, "learning_rate": 2.0108391608391607e-06, "loss": 0.4143, "step": 28960 }, { "epoch": 25.1, "learning_rate": 2.01013986013986e-06, "loss": 0.3808, "step": 28970 }, { "epoch": 25.11, "learning_rate": 2.0094405594405592e-06, "loss": 0.3896, "step": 28980 }, { "epoch": 25.12, "learning_rate": 2.0087412587412587e-06, "loss": 0.443, "step": 28990 }, { "epoch": 25.13, "learning_rate": 2.0080419580419582e-06, "loss": 0.4138, "step": 29000 }, { "epoch": 25.14, "learning_rate": 2.007342657342657e-06, "loss": 0.3609, "step": 29010 }, { "epoch": 25.15, "learning_rate": 2.0066433566433564e-06, "loss": 0.3322, "step": 29020 }, { "epoch": 25.16, "learning_rate": 2.005944055944056e-06, "loss": 0.3868, "step": 29030 }, { "epoch": 25.16, "learning_rate": 2.0052447552447554e-06, "loss": 0.3576, "step": 29040 }, { "epoch": 25.17, "learning_rate": 2.0045454545454544e-06, "loss": 0.4285, "step": 29050 }, { "epoch": 25.18, "learning_rate": 2.003846153846154e-06, "loss": 0.3718, "step": 29060 }, { "epoch": 25.19, "learning_rate": 2.003146853146853e-06, "loss": 0.3549, "step": 29070 }, { "epoch": 25.2, "learning_rate": 2.002447552447552e-06, "loss": 0.3326, "step": 29080 }, { "epoch": 25.21, "learning_rate": 2.0017482517482516e-06, "loss": 0.3645, "step": 29090 }, { "epoch": 25.22, "learning_rate": 2.001048951048951e-06, "loss": 0.4107, "step": 29100 }, { "epoch": 25.23, "learning_rate": 2.0003496503496506e-06, "loss": 0.379, "step": 29110 }, { "epoch": 25.23, "learning_rate": 1.9996503496503497e-06, "loss": 0.4511, "step": 29120 }, { "epoch": 25.24, "learning_rate": 1.9989510489510487e-06, "loss": 0.2738, "step": 29130 }, { "epoch": 25.25, "learning_rate": 1.9982517482517482e-06, "loss": 0.3324, "step": 29140 }, { "epoch": 25.26, "learning_rate": 1.9975524475524473e-06, "loss": 0.3471, "step": 29150 }, { "epoch": 25.27, "learning_rate": 1.996853146853147e-06, "loss": 0.3251, "step": 29160 }, { "epoch": 25.28, "learning_rate": 1.996153846153846e-06, "loss": 0.3745, "step": 29170 }, { "epoch": 25.29, "learning_rate": 1.9954545454545454e-06, "loss": 0.3525, "step": 29180 }, { "epoch": 25.29, "learning_rate": 1.994755244755245e-06, "loss": 0.4024, "step": 29190 }, { "epoch": 25.3, "learning_rate": 1.994055944055944e-06, "loss": 0.3859, "step": 29200 }, { "epoch": 25.31, "learning_rate": 1.9933566433566434e-06, "loss": 0.3689, "step": 29210 }, { "epoch": 25.32, "learning_rate": 1.9926573426573425e-06, "loss": 0.3818, "step": 29220 }, { "epoch": 25.33, "learning_rate": 1.991958041958042e-06, "loss": 0.392, "step": 29230 }, { "epoch": 25.34, "learning_rate": 1.991258741258741e-06, "loss": 0.4117, "step": 29240 }, { "epoch": 25.35, "learning_rate": 1.99055944055944e-06, "loss": 0.3697, "step": 29250 }, { "epoch": 25.36, "learning_rate": 1.9898601398601397e-06, "loss": 0.4136, "step": 29260 }, { "epoch": 25.36, "learning_rate": 1.989160839160839e-06, "loss": 0.3876, "step": 29270 }, { "epoch": 25.37, "learning_rate": 1.9884615384615382e-06, "loss": 0.4172, "step": 29280 }, { "epoch": 25.38, "learning_rate": 1.9877622377622377e-06, "loss": 0.4208, "step": 29290 }, { "epoch": 25.39, "learning_rate": 1.9870629370629372e-06, "loss": 0.3257, "step": 29300 }, { "epoch": 25.4, "learning_rate": 1.9863636363636363e-06, "loss": 0.3967, "step": 29310 }, { "epoch": 25.41, "learning_rate": 1.9856643356643358e-06, "loss": 0.4194, "step": 29320 }, { "epoch": 25.42, "learning_rate": 1.984965034965035e-06, "loss": 0.3644, "step": 29330 }, { "epoch": 25.42, "learning_rate": 1.984265734265734e-06, "loss": 0.439, "step": 29340 }, { "epoch": 25.43, "learning_rate": 1.9835664335664334e-06, "loss": 0.4496, "step": 29350 }, { "epoch": 25.44, "learning_rate": 1.9828671328671325e-06, "loss": 0.3671, "step": 29360 }, { "epoch": 25.45, "learning_rate": 1.982167832167832e-06, "loss": 0.3465, "step": 29370 }, { "epoch": 25.46, "learning_rate": 1.9814685314685315e-06, "loss": 0.3648, "step": 29380 }, { "epoch": 25.47, "learning_rate": 1.9807692307692306e-06, "loss": 0.3448, "step": 29390 }, { "epoch": 25.48, "learning_rate": 1.98006993006993e-06, "loss": 0.366, "step": 29400 }, { "epoch": 25.49, "learning_rate": 1.9793706293706296e-06, "loss": 0.4236, "step": 29410 }, { "epoch": 25.49, "learning_rate": 1.9786713286713286e-06, "loss": 0.3443, "step": 29420 }, { "epoch": 25.5, "learning_rate": 1.9779720279720277e-06, "loss": 0.3399, "step": 29430 }, { "epoch": 25.51, "learning_rate": 1.977272727272727e-06, "loss": 0.3953, "step": 29440 }, { "epoch": 25.52, "learning_rate": 1.9765734265734263e-06, "loss": 0.3883, "step": 29450 }, { "epoch": 25.53, "learning_rate": 1.9758741258741258e-06, "loss": 0.3768, "step": 29460 }, { "epoch": 25.54, "learning_rate": 1.975174825174825e-06, "loss": 0.3587, "step": 29470 }, { "epoch": 25.55, "learning_rate": 1.9744755244755243e-06, "loss": 0.3948, "step": 29480 }, { "epoch": 25.55, "learning_rate": 1.973776223776224e-06, "loss": 0.3911, "step": 29490 }, { "epoch": 25.56, "learning_rate": 1.973076923076923e-06, "loss": 0.4282, "step": 29500 }, { "epoch": 25.57, "learning_rate": 1.9723776223776224e-06, "loss": 0.3315, "step": 29510 }, { "epoch": 25.58, "learning_rate": 1.9716783216783215e-06, "loss": 0.3706, "step": 29520 }, { "epoch": 25.59, "learning_rate": 1.970979020979021e-06, "loss": 0.4202, "step": 29530 }, { "epoch": 25.6, "learning_rate": 1.97027972027972e-06, "loss": 0.3886, "step": 29540 }, { "epoch": 25.61, "learning_rate": 1.9695804195804196e-06, "loss": 0.3891, "step": 29550 }, { "epoch": 25.61, "learning_rate": 1.9688811188811186e-06, "loss": 0.3281, "step": 29560 }, { "epoch": 25.62, "learning_rate": 1.968181818181818e-06, "loss": 0.4184, "step": 29570 }, { "epoch": 25.63, "learning_rate": 1.967482517482517e-06, "loss": 0.3783, "step": 29580 }, { "epoch": 25.64, "learning_rate": 1.9667832167832167e-06, "loss": 0.3379, "step": 29590 }, { "epoch": 25.65, "learning_rate": 1.966083916083916e-06, "loss": 0.3912, "step": 29600 }, { "epoch": 25.66, "learning_rate": 1.9653846153846153e-06, "loss": 0.4055, "step": 29610 }, { "epoch": 25.67, "learning_rate": 1.9646853146853148e-06, "loss": 0.3494, "step": 29620 }, { "epoch": 25.68, "learning_rate": 1.963986013986014e-06, "loss": 0.3599, "step": 29630 }, { "epoch": 25.68, "learning_rate": 1.9632867132867133e-06, "loss": 0.4213, "step": 29640 }, { "epoch": 25.69, "learning_rate": 1.9625874125874124e-06, "loss": 0.3993, "step": 29650 }, { "epoch": 25.7, "learning_rate": 1.961888111888112e-06, "loss": 0.3751, "step": 29660 }, { "epoch": 25.71, "learning_rate": 1.961188811188811e-06, "loss": 0.3582, "step": 29670 }, { "epoch": 25.72, "learning_rate": 1.9604895104895105e-06, "loss": 0.3391, "step": 29680 }, { "epoch": 25.73, "learning_rate": 1.9597902097902095e-06, "loss": 0.3844, "step": 29690 }, { "epoch": 25.74, "learning_rate": 1.959090909090909e-06, "loss": 0.4644, "step": 29700 }, { "epoch": 25.74, "learning_rate": 1.958391608391608e-06, "loss": 0.3793, "step": 29710 }, { "epoch": 25.75, "learning_rate": 1.9576923076923076e-06, "loss": 0.438, "step": 29720 }, { "epoch": 25.76, "learning_rate": 1.956993006993007e-06, "loss": 0.3883, "step": 29730 }, { "epoch": 25.77, "learning_rate": 1.956293706293706e-06, "loss": 0.3923, "step": 29740 }, { "epoch": 25.78, "learning_rate": 1.9555944055944057e-06, "loss": 0.4291, "step": 29750 }, { "epoch": 25.79, "learning_rate": 1.9548951048951048e-06, "loss": 0.359, "step": 29760 }, { "epoch": 25.8, "learning_rate": 1.9541958041958043e-06, "loss": 0.4473, "step": 29770 }, { "epoch": 25.81, "learning_rate": 1.9534965034965033e-06, "loss": 0.3519, "step": 29780 }, { "epoch": 25.81, "learning_rate": 1.952797202797203e-06, "loss": 0.3373, "step": 29790 }, { "epoch": 25.82, "learning_rate": 1.952097902097902e-06, "loss": 0.3667, "step": 29800 }, { "epoch": 25.83, "learning_rate": 1.9513986013986014e-06, "loss": 0.3505, "step": 29810 }, { "epoch": 25.84, "learning_rate": 1.9506993006993005e-06, "loss": 0.3392, "step": 29820 }, { "epoch": 25.85, "learning_rate": 1.95e-06, "loss": 0.3719, "step": 29830 }, { "epoch": 25.86, "learning_rate": 1.9493006993006995e-06, "loss": 0.3555, "step": 29840 }, { "epoch": 25.87, "learning_rate": 1.9486013986013985e-06, "loss": 0.4009, "step": 29850 }, { "epoch": 25.87, "learning_rate": 1.947902097902098e-06, "loss": 0.3475, "step": 29860 }, { "epoch": 25.88, "learning_rate": 1.947202797202797e-06, "loss": 0.4121, "step": 29870 }, { "epoch": 25.89, "learning_rate": 1.946503496503496e-06, "loss": 0.37, "step": 29880 }, { "epoch": 25.9, "learning_rate": 1.9458041958041957e-06, "loss": 0.3507, "step": 29890 }, { "epoch": 25.91, "learning_rate": 1.9451048951048947e-06, "loss": 0.4051, "step": 29900 }, { "epoch": 25.92, "learning_rate": 1.9444055944055942e-06, "loss": 0.3669, "step": 29910 }, { "epoch": 25.93, "learning_rate": 1.9437062937062937e-06, "loss": 0.3776, "step": 29920 }, { "epoch": 25.94, "learning_rate": 1.943006993006993e-06, "loss": 0.3033, "step": 29930 }, { "epoch": 25.94, "learning_rate": 1.9423076923076923e-06, "loss": 0.4222, "step": 29940 }, { "epoch": 25.95, "learning_rate": 1.941608391608392e-06, "loss": 0.4284, "step": 29950 }, { "epoch": 25.96, "learning_rate": 1.940979020979021e-06, "loss": 0.3916, "step": 29960 }, { "epoch": 25.97, "learning_rate": 1.94027972027972e-06, "loss": 0.3203, "step": 29970 }, { "epoch": 25.98, "learning_rate": 1.9395804195804194e-06, "loss": 0.3179, "step": 29980 }, { "epoch": 25.99, "learning_rate": 1.938881118881119e-06, "loss": 0.4541, "step": 29990 }, { "epoch": 26.0, "learning_rate": 1.938181818181818e-06, "loss": 0.4509, "step": 30000 }, { "epoch": 26.0, "eval_loss": 0.5566795468330383, "eval_runtime": 137.3215, "eval_samples_per_second": 3.874, "eval_steps_per_second": 1.937, "eval_wer": 0.24863405540914058, "step": 30004 }, { "epoch": 26.01, "learning_rate": 1.9374825174825175e-06, "loss": 0.331, "step": 30010 }, { "epoch": 26.01, "learning_rate": 1.9367832167832166e-06, "loss": 0.341, "step": 30020 }, { "epoch": 26.02, "learning_rate": 1.936083916083916e-06, "loss": 0.3829, "step": 30030 }, { "epoch": 26.03, "learning_rate": 1.9353846153846156e-06, "loss": 0.4277, "step": 30040 }, { "epoch": 26.04, "learning_rate": 1.9346853146853146e-06, "loss": 0.3695, "step": 30050 }, { "epoch": 26.05, "learning_rate": 1.9339860139860137e-06, "loss": 0.3736, "step": 30060 }, { "epoch": 26.06, "learning_rate": 1.933286713286713e-06, "loss": 0.3632, "step": 30070 }, { "epoch": 26.07, "learning_rate": 1.9325874125874123e-06, "loss": 0.3675, "step": 30080 }, { "epoch": 26.07, "learning_rate": 1.9318881118881118e-06, "loss": 0.3919, "step": 30090 }, { "epoch": 26.08, "learning_rate": 1.931188811188811e-06, "loss": 0.4781, "step": 30100 }, { "epoch": 26.09, "learning_rate": 1.9304895104895103e-06, "loss": 0.4024, "step": 30110 }, { "epoch": 26.1, "learning_rate": 1.92979020979021e-06, "loss": 0.3457, "step": 30120 }, { "epoch": 26.11, "learning_rate": 1.929090909090909e-06, "loss": 0.373, "step": 30130 }, { "epoch": 26.12, "learning_rate": 1.9283916083916084e-06, "loss": 0.4276, "step": 30140 }, { "epoch": 26.13, "learning_rate": 1.9276923076923075e-06, "loss": 0.3916, "step": 30150 }, { "epoch": 26.14, "learning_rate": 1.926993006993007e-06, "loss": 0.3897, "step": 30160 }, { "epoch": 26.14, "learning_rate": 1.926293706293706e-06, "loss": 0.3996, "step": 30170 }, { "epoch": 26.15, "learning_rate": 1.9255944055944055e-06, "loss": 0.3456, "step": 30180 }, { "epoch": 26.16, "learning_rate": 1.9248951048951046e-06, "loss": 0.3332, "step": 30190 }, { "epoch": 26.17, "learning_rate": 1.924195804195804e-06, "loss": 0.3873, "step": 30200 }, { "epoch": 26.18, "learning_rate": 1.923496503496503e-06, "loss": 0.3484, "step": 30210 }, { "epoch": 26.19, "learning_rate": 1.9227972027972027e-06, "loss": 0.3626, "step": 30220 }, { "epoch": 26.2, "learning_rate": 1.922097902097902e-06, "loss": 0.3595, "step": 30230 }, { "epoch": 26.2, "learning_rate": 1.9213986013986013e-06, "loss": 0.4079, "step": 30240 }, { "epoch": 26.21, "learning_rate": 1.9206993006993008e-06, "loss": 0.3836, "step": 30250 }, { "epoch": 26.22, "learning_rate": 1.92e-06, "loss": 0.4066, "step": 30260 }, { "epoch": 26.23, "learning_rate": 1.9193006993006993e-06, "loss": 0.3826, "step": 30270 }, { "epoch": 26.24, "learning_rate": 1.9186013986013984e-06, "loss": 0.3621, "step": 30280 }, { "epoch": 26.25, "learning_rate": 1.917902097902098e-06, "loss": 0.399, "step": 30290 }, { "epoch": 26.26, "learning_rate": 1.917202797202797e-06, "loss": 0.468, "step": 30300 }, { "epoch": 26.27, "learning_rate": 1.9165034965034965e-06, "loss": 0.3621, "step": 30310 }, { "epoch": 26.27, "learning_rate": 1.9158041958041955e-06, "loss": 0.4275, "step": 30320 }, { "epoch": 26.28, "learning_rate": 1.915104895104895e-06, "loss": 0.3894, "step": 30330 }, { "epoch": 26.29, "learning_rate": 1.9144055944055945e-06, "loss": 0.3466, "step": 30340 }, { "epoch": 26.3, "learning_rate": 1.9137062937062936e-06, "loss": 0.4006, "step": 30350 }, { "epoch": 26.31, "learning_rate": 1.913006993006993e-06, "loss": 0.3204, "step": 30360 }, { "epoch": 26.32, "learning_rate": 1.912307692307692e-06, "loss": 0.4006, "step": 30370 }, { "epoch": 26.33, "learning_rate": 1.9116083916083917e-06, "loss": 0.3396, "step": 30380 }, { "epoch": 26.33, "learning_rate": 1.9109090909090907e-06, "loss": 0.3836, "step": 30390 }, { "epoch": 26.34, "learning_rate": 1.9102097902097902e-06, "loss": 0.3941, "step": 30400 }, { "epoch": 26.35, "learning_rate": 1.9095104895104893e-06, "loss": 0.4129, "step": 30410 }, { "epoch": 26.36, "learning_rate": 1.908811188811189e-06, "loss": 0.4021, "step": 30420 }, { "epoch": 26.37, "learning_rate": 1.908111888111888e-06, "loss": 0.3448, "step": 30430 }, { "epoch": 26.38, "learning_rate": 1.9074125874125874e-06, "loss": 0.3963, "step": 30440 }, { "epoch": 26.39, "learning_rate": 1.9067132867132867e-06, "loss": 0.3782, "step": 30450 }, { "epoch": 26.39, "learning_rate": 1.906013986013986e-06, "loss": 0.3195, "step": 30460 }, { "epoch": 26.4, "learning_rate": 1.9053146853146852e-06, "loss": 0.4381, "step": 30470 }, { "epoch": 26.41, "learning_rate": 1.9046153846153845e-06, "loss": 0.3247, "step": 30480 }, { "epoch": 26.42, "learning_rate": 1.903916083916084e-06, "loss": 0.379, "step": 30490 }, { "epoch": 26.43, "learning_rate": 1.903216783216783e-06, "loss": 0.3943, "step": 30500 }, { "epoch": 26.44, "learning_rate": 1.9025174825174824e-06, "loss": 0.3868, "step": 30510 }, { "epoch": 26.45, "learning_rate": 1.9018181818181817e-06, "loss": 0.3622, "step": 30520 }, { "epoch": 26.46, "learning_rate": 1.901118881118881e-06, "loss": 0.4147, "step": 30530 }, { "epoch": 26.46, "learning_rate": 1.9004195804195804e-06, "loss": 0.4051, "step": 30540 }, { "epoch": 26.47, "learning_rate": 1.8997202797202795e-06, "loss": 0.3756, "step": 30550 }, { "epoch": 26.48, "learning_rate": 1.899020979020979e-06, "loss": 0.376, "step": 30560 }, { "epoch": 26.49, "learning_rate": 1.8983216783216783e-06, "loss": 0.364, "step": 30570 }, { "epoch": 26.5, "learning_rate": 1.8976223776223776e-06, "loss": 0.3638, "step": 30580 }, { "epoch": 26.51, "learning_rate": 1.8969230769230769e-06, "loss": 0.3573, "step": 30590 }, { "epoch": 26.52, "learning_rate": 1.896223776223776e-06, "loss": 0.3813, "step": 30600 }, { "epoch": 26.52, "learning_rate": 1.8955244755244754e-06, "loss": 0.3925, "step": 30610 }, { "epoch": 26.53, "learning_rate": 1.8948251748251747e-06, "loss": 0.3528, "step": 30620 }, { "epoch": 26.54, "learning_rate": 1.894125874125874e-06, "loss": 0.361, "step": 30630 }, { "epoch": 26.55, "learning_rate": 1.8934265734265733e-06, "loss": 0.3667, "step": 30640 }, { "epoch": 26.56, "learning_rate": 1.8927272727272728e-06, "loss": 0.3815, "step": 30650 }, { "epoch": 26.57, "learning_rate": 1.8920279720279719e-06, "loss": 0.4043, "step": 30660 }, { "epoch": 26.58, "learning_rate": 1.8913286713286712e-06, "loss": 0.3642, "step": 30670 }, { "epoch": 26.59, "learning_rate": 1.8906293706293707e-06, "loss": 0.3322, "step": 30680 }, { "epoch": 26.59, "learning_rate": 1.8899300699300697e-06, "loss": 0.4152, "step": 30690 }, { "epoch": 26.6, "learning_rate": 1.8892307692307692e-06, "loss": 0.4589, "step": 30700 }, { "epoch": 26.61, "learning_rate": 1.8885314685314683e-06, "loss": 0.3927, "step": 30710 }, { "epoch": 26.62, "learning_rate": 1.8878321678321678e-06, "loss": 0.3514, "step": 30720 }, { "epoch": 26.63, "learning_rate": 1.887132867132867e-06, "loss": 0.3987, "step": 30730 }, { "epoch": 26.64, "learning_rate": 1.8864335664335664e-06, "loss": 0.3924, "step": 30740 }, { "epoch": 26.65, "learning_rate": 1.8857342657342656e-06, "loss": 0.3721, "step": 30750 }, { "epoch": 26.65, "learning_rate": 1.885034965034965e-06, "loss": 0.4027, "step": 30760 }, { "epoch": 26.66, "learning_rate": 1.8843356643356642e-06, "loss": 0.3327, "step": 30770 }, { "epoch": 26.67, "learning_rate": 1.8836363636363635e-06, "loss": 0.3517, "step": 30780 }, { "epoch": 26.68, "learning_rate": 1.8829370629370628e-06, "loss": 0.3319, "step": 30790 }, { "epoch": 26.69, "learning_rate": 1.882237762237762e-06, "loss": 0.3603, "step": 30800 }, { "epoch": 26.7, "learning_rate": 1.8815384615384616e-06, "loss": 0.4292, "step": 30810 }, { "epoch": 26.71, "learning_rate": 1.8808391608391606e-06, "loss": 0.3922, "step": 30820 }, { "epoch": 26.72, "learning_rate": 1.8801398601398601e-06, "loss": 0.3476, "step": 30830 }, { "epoch": 26.72, "learning_rate": 1.8794405594405594e-06, "loss": 0.378, "step": 30840 }, { "epoch": 26.73, "learning_rate": 1.8787412587412585e-06, "loss": 0.4082, "step": 30850 }, { "epoch": 26.74, "learning_rate": 1.878041958041958e-06, "loss": 0.3795, "step": 30860 }, { "epoch": 26.75, "learning_rate": 1.877342657342657e-06, "loss": 0.3642, "step": 30870 }, { "epoch": 26.76, "learning_rate": 1.8766433566433566e-06, "loss": 0.3987, "step": 30880 }, { "epoch": 26.77, "learning_rate": 1.8759440559440559e-06, "loss": 0.3377, "step": 30890 }, { "epoch": 26.78, "learning_rate": 1.8752447552447551e-06, "loss": 0.4408, "step": 30900 }, { "epoch": 26.78, "learning_rate": 1.8745454545454544e-06, "loss": 0.3129, "step": 30910 }, { "epoch": 26.79, "learning_rate": 1.873846153846154e-06, "loss": 0.3814, "step": 30920 }, { "epoch": 26.8, "learning_rate": 1.873146853146853e-06, "loss": 0.3311, "step": 30930 }, { "epoch": 26.81, "learning_rate": 1.8724475524475523e-06, "loss": 0.3986, "step": 30940 }, { "epoch": 26.82, "learning_rate": 1.8717482517482518e-06, "loss": 0.3727, "step": 30950 }, { "epoch": 26.83, "learning_rate": 1.8710489510489508e-06, "loss": 0.3677, "step": 30960 }, { "epoch": 26.84, "learning_rate": 1.8703496503496503e-06, "loss": 0.3461, "step": 30970 }, { "epoch": 26.85, "learning_rate": 1.8696503496503494e-06, "loss": 0.3699, "step": 30980 }, { "epoch": 26.85, "learning_rate": 1.868951048951049e-06, "loss": 0.4387, "step": 30990 }, { "epoch": 26.86, "learning_rate": 1.8682517482517482e-06, "loss": 0.3552, "step": 31000 }, { "epoch": 26.87, "learning_rate": 1.8675524475524475e-06, "loss": 0.3734, "step": 31010 }, { "epoch": 26.88, "learning_rate": 1.8668531468531468e-06, "loss": 0.4173, "step": 31020 }, { "epoch": 26.89, "learning_rate": 1.866153846153846e-06, "loss": 0.3429, "step": 31030 }, { "epoch": 26.9, "learning_rate": 1.8654545454545453e-06, "loss": 0.4001, "step": 31040 }, { "epoch": 26.91, "learning_rate": 1.8647552447552446e-06, "loss": 0.3468, "step": 31050 }, { "epoch": 26.91, "learning_rate": 1.864055944055944e-06, "loss": 0.3783, "step": 31060 }, { "epoch": 26.92, "learning_rate": 1.8633566433566432e-06, "loss": 0.3875, "step": 31070 }, { "epoch": 26.93, "learning_rate": 1.8626573426573427e-06, "loss": 0.3293, "step": 31080 }, { "epoch": 26.94, "learning_rate": 1.8619580419580418e-06, "loss": 0.3913, "step": 31090 }, { "epoch": 26.95, "learning_rate": 1.8612587412587413e-06, "loss": 0.4083, "step": 31100 }, { "epoch": 26.96, "learning_rate": 1.8605594405594406e-06, "loss": 0.3357, "step": 31110 }, { "epoch": 26.97, "learning_rate": 1.8598601398601396e-06, "loss": 0.3768, "step": 31120 }, { "epoch": 26.98, "learning_rate": 1.8591608391608391e-06, "loss": 0.3425, "step": 31130 }, { "epoch": 26.98, "learning_rate": 1.8584615384615384e-06, "loss": 0.4, "step": 31140 }, { "epoch": 26.99, "learning_rate": 1.8577622377622377e-06, "loss": 0.3583, "step": 31150 }, { "epoch": 27.0, "eval_loss": 0.5641392469406128, "eval_runtime": 136.2547, "eval_samples_per_second": 3.904, "eval_steps_per_second": 1.952, "eval_wer": 0.25229800089991644, "step": 31158 }, { "epoch": 27.0, "learning_rate": 1.857062937062937e-06, "loss": 0.4314, "step": 31160 }, { "epoch": 27.01, "learning_rate": 1.8563636363636363e-06, "loss": 0.4011, "step": 31170 }, { "epoch": 27.02, "learning_rate": 1.8556643356643355e-06, "loss": 0.3816, "step": 31180 }, { "epoch": 27.03, "learning_rate": 1.854965034965035e-06, "loss": 0.3846, "step": 31190 }, { "epoch": 27.04, "learning_rate": 1.8542657342657341e-06, "loss": 0.3608, "step": 31200 }, { "epoch": 27.05, "learning_rate": 1.8535664335664334e-06, "loss": 0.3791, "step": 31210 }, { "epoch": 27.05, "learning_rate": 1.852867132867133e-06, "loss": 0.4113, "step": 31220 }, { "epoch": 27.06, "learning_rate": 1.852167832167832e-06, "loss": 0.3469, "step": 31230 }, { "epoch": 27.07, "learning_rate": 1.8514685314685315e-06, "loss": 0.3932, "step": 31240 }, { "epoch": 27.08, "learning_rate": 1.8507692307692305e-06, "loss": 0.3928, "step": 31250 }, { "epoch": 27.09, "learning_rate": 1.85006993006993e-06, "loss": 0.328, "step": 31260 }, { "epoch": 27.1, "learning_rate": 1.8493706293706293e-06, "loss": 0.3303, "step": 31270 }, { "epoch": 27.11, "learning_rate": 1.8486713286713286e-06, "loss": 0.3637, "step": 31280 }, { "epoch": 27.11, "learning_rate": 1.847972027972028e-06, "loss": 0.3607, "step": 31290 }, { "epoch": 27.12, "learning_rate": 1.8472727272727272e-06, "loss": 0.394, "step": 31300 }, { "epoch": 27.13, "learning_rate": 1.8465734265734265e-06, "loss": 0.4039, "step": 31310 }, { "epoch": 27.14, "learning_rate": 1.8458741258741258e-06, "loss": 0.3861, "step": 31320 }, { "epoch": 27.15, "learning_rate": 1.8451748251748252e-06, "loss": 0.3385, "step": 31330 }, { "epoch": 27.16, "learning_rate": 1.8444755244755243e-06, "loss": 0.3482, "step": 31340 }, { "epoch": 27.17, "learning_rate": 1.8437762237762238e-06, "loss": 0.3543, "step": 31350 }, { "epoch": 27.17, "learning_rate": 1.8430769230769229e-06, "loss": 0.4551, "step": 31360 }, { "epoch": 27.18, "learning_rate": 1.8423776223776224e-06, "loss": 0.3558, "step": 31370 }, { "epoch": 27.19, "learning_rate": 1.8416783216783217e-06, "loss": 0.3725, "step": 31380 }, { "epoch": 27.2, "learning_rate": 1.8409790209790207e-06, "loss": 0.3708, "step": 31390 }, { "epoch": 27.21, "learning_rate": 1.8402797202797202e-06, "loss": 0.3762, "step": 31400 }, { "epoch": 27.22, "learning_rate": 1.8395804195804195e-06, "loss": 0.3454, "step": 31410 }, { "epoch": 27.23, "learning_rate": 1.8388811188811188e-06, "loss": 0.3676, "step": 31420 }, { "epoch": 27.24, "learning_rate": 1.838181818181818e-06, "loss": 0.3525, "step": 31430 }, { "epoch": 27.24, "learning_rate": 1.8374825174825174e-06, "loss": 0.369, "step": 31440 }, { "epoch": 27.25, "learning_rate": 1.8367832167832167e-06, "loss": 0.391, "step": 31450 }, { "epoch": 27.26, "learning_rate": 1.8360839160839162e-06, "loss": 0.3938, "step": 31460 }, { "epoch": 27.27, "learning_rate": 1.8353846153846152e-06, "loss": 0.3873, "step": 31470 }, { "epoch": 27.28, "learning_rate": 1.8346853146853145e-06, "loss": 0.3405, "step": 31480 }, { "epoch": 27.29, "learning_rate": 1.833986013986014e-06, "loss": 0.3682, "step": 31490 }, { "epoch": 27.3, "learning_rate": 1.833286713286713e-06, "loss": 0.3943, "step": 31500 }, { "epoch": 27.3, "learning_rate": 1.8325874125874126e-06, "loss": 0.3856, "step": 31510 }, { "epoch": 27.31, "learning_rate": 1.8318881118881117e-06, "loss": 0.416, "step": 31520 }, { "epoch": 27.32, "learning_rate": 1.8311888111888112e-06, "loss": 0.3424, "step": 31530 }, { "epoch": 27.33, "learning_rate": 1.8304895104895104e-06, "loss": 0.3573, "step": 31540 }, { "epoch": 27.34, "learning_rate": 1.8297902097902097e-06, "loss": 0.3489, "step": 31550 }, { "epoch": 27.35, "learning_rate": 1.829090909090909e-06, "loss": 0.4039, "step": 31560 }, { "epoch": 27.36, "learning_rate": 1.8283916083916083e-06, "loss": 0.3618, "step": 31570 }, { "epoch": 27.37, "learning_rate": 1.8276923076923076e-06, "loss": 0.3253, "step": 31580 }, { "epoch": 27.37, "learning_rate": 1.8269930069930069e-06, "loss": 0.3501, "step": 31590 }, { "epoch": 27.38, "learning_rate": 1.8262937062937064e-06, "loss": 0.3475, "step": 31600 }, { "epoch": 27.39, "learning_rate": 1.8255944055944054e-06, "loss": 0.3852, "step": 31610 }, { "epoch": 27.4, "learning_rate": 1.824895104895105e-06, "loss": 0.3352, "step": 31620 }, { "epoch": 27.41, "learning_rate": 1.824195804195804e-06, "loss": 0.3391, "step": 31630 }, { "epoch": 27.42, "learning_rate": 1.8234965034965035e-06, "loss": 0.3885, "step": 31640 }, { "epoch": 27.43, "learning_rate": 1.8227972027972028e-06, "loss": 0.358, "step": 31650 }, { "epoch": 27.43, "learning_rate": 1.8220979020979019e-06, "loss": 0.3604, "step": 31660 }, { "epoch": 27.44, "learning_rate": 1.8213986013986014e-06, "loss": 0.3526, "step": 31670 }, { "epoch": 27.45, "learning_rate": 1.8206993006993007e-06, "loss": 0.3765, "step": 31680 }, { "epoch": 27.46, "learning_rate": 1.82e-06, "loss": 0.3577, "step": 31690 }, { "epoch": 27.47, "learning_rate": 1.8193006993006992e-06, "loss": 0.3842, "step": 31700 }, { "epoch": 27.48, "learning_rate": 1.8186013986013985e-06, "loss": 0.3789, "step": 31710 }, { "epoch": 27.49, "learning_rate": 1.8179020979020978e-06, "loss": 0.4499, "step": 31720 }, { "epoch": 27.5, "learning_rate": 1.817202797202797e-06, "loss": 0.3503, "step": 31730 }, { "epoch": 27.5, "learning_rate": 1.8165034965034964e-06, "loss": 0.3301, "step": 31740 }, { "epoch": 27.51, "learning_rate": 1.8158041958041956e-06, "loss": 0.3902, "step": 31750 }, { "epoch": 27.52, "learning_rate": 1.8151048951048951e-06, "loss": 0.423, "step": 31760 }, { "epoch": 27.53, "learning_rate": 1.8144055944055942e-06, "loss": 0.4111, "step": 31770 }, { "epoch": 27.54, "learning_rate": 1.8137062937062937e-06, "loss": 0.3757, "step": 31780 }, { "epoch": 27.55, "learning_rate": 1.8130069930069928e-06, "loss": 0.3748, "step": 31790 }, { "epoch": 27.56, "learning_rate": 1.8123076923076923e-06, "loss": 0.3695, "step": 31800 }, { "epoch": 27.56, "learning_rate": 1.8116083916083916e-06, "loss": 0.3734, "step": 31810 }, { "epoch": 27.57, "learning_rate": 1.8109090909090906e-06, "loss": 0.3587, "step": 31820 }, { "epoch": 27.58, "learning_rate": 1.8102097902097901e-06, "loss": 0.366, "step": 31830 }, { "epoch": 27.59, "learning_rate": 1.8095104895104894e-06, "loss": 0.3811, "step": 31840 }, { "epoch": 27.6, "learning_rate": 1.8088111888111887e-06, "loss": 0.3845, "step": 31850 }, { "epoch": 27.61, "learning_rate": 1.808111888111888e-06, "loss": 0.3945, "step": 31860 }, { "epoch": 27.62, "learning_rate": 1.8074125874125875e-06, "loss": 0.4014, "step": 31870 }, { "epoch": 27.63, "learning_rate": 1.8067132867132866e-06, "loss": 0.3829, "step": 31880 }, { "epoch": 27.63, "learning_rate": 1.806013986013986e-06, "loss": 0.4039, "step": 31890 }, { "epoch": 27.64, "learning_rate": 1.8053146853146851e-06, "loss": 0.4097, "step": 31900 }, { "epoch": 27.65, "learning_rate": 1.8046153846153844e-06, "loss": 0.3733, "step": 31910 }, { "epoch": 27.66, "learning_rate": 1.803916083916084e-06, "loss": 0.3835, "step": 31920 }, { "epoch": 27.67, "learning_rate": 1.803216783216783e-06, "loss": 0.3801, "step": 31930 }, { "epoch": 27.68, "learning_rate": 1.8025174825174825e-06, "loss": 0.3225, "step": 31940 }, { "epoch": 27.69, "learning_rate": 1.8018181818181818e-06, "loss": 0.4131, "step": 31950 }, { "epoch": 27.69, "learning_rate": 1.801118881118881e-06, "loss": 0.3939, "step": 31960 }, { "epoch": 27.7, "learning_rate": 1.8004195804195803e-06, "loss": 0.341, "step": 31970 }, { "epoch": 27.71, "learning_rate": 1.7997202797202796e-06, "loss": 0.3937, "step": 31980 }, { "epoch": 27.72, "learning_rate": 1.799020979020979e-06, "loss": 0.3684, "step": 31990 }, { "epoch": 27.73, "learning_rate": 1.7983216783216782e-06, "loss": 0.3699, "step": 32000 }, { "epoch": 27.74, "learning_rate": 1.7976223776223775e-06, "loss": 0.3764, "step": 32010 }, { "epoch": 27.75, "learning_rate": 1.7969230769230768e-06, "loss": 0.3609, "step": 32020 }, { "epoch": 27.76, "learning_rate": 1.7962237762237763e-06, "loss": 0.3248, "step": 32030 }, { "epoch": 27.76, "learning_rate": 1.7955244755244753e-06, "loss": 0.4042, "step": 32040 }, { "epoch": 27.77, "learning_rate": 1.7948251748251748e-06, "loss": 0.4085, "step": 32050 }, { "epoch": 27.78, "learning_rate": 1.794125874125874e-06, "loss": 0.4023, "step": 32060 }, { "epoch": 27.79, "learning_rate": 1.7934265734265734e-06, "loss": 0.317, "step": 32070 }, { "epoch": 27.8, "learning_rate": 1.7927272727272727e-06, "loss": 0.3857, "step": 32080 }, { "epoch": 27.81, "learning_rate": 1.7920279720279718e-06, "loss": 0.3571, "step": 32090 }, { "epoch": 27.82, "learning_rate": 1.7913286713286713e-06, "loss": 0.4025, "step": 32100 }, { "epoch": 27.82, "learning_rate": 1.7906293706293706e-06, "loss": 0.3897, "step": 32110 }, { "epoch": 27.83, "learning_rate": 1.7899300699300698e-06, "loss": 0.4233, "step": 32120 }, { "epoch": 27.84, "learning_rate": 1.7892307692307691e-06, "loss": 0.373, "step": 32130 }, { "epoch": 27.85, "learning_rate": 1.7885314685314686e-06, "loss": 0.3689, "step": 32140 }, { "epoch": 27.86, "learning_rate": 1.7878321678321677e-06, "loss": 0.3384, "step": 32150 }, { "epoch": 27.87, "learning_rate": 1.7871328671328672e-06, "loss": 0.393, "step": 32160 }, { "epoch": 27.88, "learning_rate": 1.7864335664335663e-06, "loss": 0.3157, "step": 32170 }, { "epoch": 27.89, "learning_rate": 1.7857342657342655e-06, "loss": 0.4032, "step": 32180 }, { "epoch": 27.89, "learning_rate": 1.785034965034965e-06, "loss": 0.3611, "step": 32190 }, { "epoch": 27.9, "learning_rate": 1.7843356643356641e-06, "loss": 0.3538, "step": 32200 }, { "epoch": 27.91, "learning_rate": 1.7836363636363636e-06, "loss": 0.3398, "step": 32210 }, { "epoch": 27.92, "learning_rate": 1.782937062937063e-06, "loss": 0.3714, "step": 32220 }, { "epoch": 27.93, "learning_rate": 1.7822377622377622e-06, "loss": 0.3936, "step": 32230 }, { "epoch": 27.94, "learning_rate": 1.7815384615384615e-06, "loss": 0.3473, "step": 32240 }, { "epoch": 27.95, "learning_rate": 1.7808391608391608e-06, "loss": 0.4004, "step": 32250 }, { "epoch": 27.95, "learning_rate": 1.78013986013986e-06, "loss": 0.3311, "step": 32260 }, { "epoch": 27.96, "learning_rate": 1.7794405594405593e-06, "loss": 0.3644, "step": 32270 }, { "epoch": 27.97, "learning_rate": 1.7787412587412586e-06, "loss": 0.3806, "step": 32280 }, { "epoch": 27.98, "learning_rate": 1.778041958041958e-06, "loss": 0.3713, "step": 32290 }, { "epoch": 27.99, "learning_rate": 1.7773426573426574e-06, "loss": 0.3826, "step": 32300 }, { "epoch": 28.0, "learning_rate": 1.7766433566433565e-06, "loss": 0.4084, "step": 32310 }, { "epoch": 28.0, "eval_loss": 0.568722128868103, "eval_runtime": 137.4904, "eval_samples_per_second": 3.869, "eval_steps_per_second": 1.935, "eval_wer": 0.2521051616635598, "step": 32312 }, { "epoch": 28.01, "learning_rate": 1.775944055944056e-06, "loss": 0.4081, "step": 32320 }, { "epoch": 28.02, "learning_rate": 1.775244755244755e-06, "loss": 0.3512, "step": 32330 }, { "epoch": 28.02, "learning_rate": 1.7745454545454545e-06, "loss": 0.351, "step": 32340 }, { "epoch": 28.03, "learning_rate": 1.7738461538461538e-06, "loss": 0.3402, "step": 32350 }, { "epoch": 28.04, "learning_rate": 1.7731468531468529e-06, "loss": 0.3992, "step": 32360 }, { "epoch": 28.05, "learning_rate": 1.7724475524475524e-06, "loss": 0.4322, "step": 32370 }, { "epoch": 28.06, "learning_rate": 1.7717482517482517e-06, "loss": 0.3604, "step": 32380 }, { "epoch": 28.07, "learning_rate": 1.771048951048951e-06, "loss": 0.3135, "step": 32390 }, { "epoch": 28.08, "learning_rate": 1.7703496503496502e-06, "loss": 0.3935, "step": 32400 }, { "epoch": 28.08, "learning_rate": 1.7696503496503497e-06, "loss": 0.3196, "step": 32410 }, { "epoch": 28.09, "learning_rate": 1.7689510489510488e-06, "loss": 0.3479, "step": 32420 }, { "epoch": 28.1, "learning_rate": 1.7682517482517483e-06, "loss": 0.4076, "step": 32430 }, { "epoch": 28.11, "learning_rate": 1.7675524475524474e-06, "loss": 0.3654, "step": 32440 }, { "epoch": 28.12, "learning_rate": 1.7668531468531467e-06, "loss": 0.3773, "step": 32450 }, { "epoch": 28.13, "learning_rate": 1.7661538461538462e-06, "loss": 0.3836, "step": 32460 }, { "epoch": 28.14, "learning_rate": 1.7654545454545452e-06, "loss": 0.3514, "step": 32470 }, { "epoch": 28.15, "learning_rate": 1.7647552447552447e-06, "loss": 0.4039, "step": 32480 }, { "epoch": 28.15, "learning_rate": 1.764055944055944e-06, "loss": 0.3392, "step": 32490 }, { "epoch": 28.16, "learning_rate": 1.7633566433566433e-06, "loss": 0.359, "step": 32500 }, { "epoch": 28.17, "learning_rate": 1.7626573426573426e-06, "loss": 0.3671, "step": 32510 }, { "epoch": 28.18, "learning_rate": 1.7619580419580419e-06, "loss": 0.3782, "step": 32520 }, { "epoch": 28.19, "learning_rate": 1.7612587412587412e-06, "loss": 0.3816, "step": 32530 }, { "epoch": 28.2, "learning_rate": 1.7605594405594404e-06, "loss": 0.3251, "step": 32540 }, { "epoch": 28.21, "learning_rate": 1.7598601398601397e-06, "loss": 0.3907, "step": 32550 }, { "epoch": 28.21, "learning_rate": 1.759160839160839e-06, "loss": 0.4064, "step": 32560 }, { "epoch": 28.22, "learning_rate": 1.7584615384615385e-06, "loss": 0.3726, "step": 32570 }, { "epoch": 28.23, "learning_rate": 1.7577622377622376e-06, "loss": 0.3508, "step": 32580 }, { "epoch": 28.24, "learning_rate": 1.757062937062937e-06, "loss": 0.3468, "step": 32590 }, { "epoch": 28.25, "learning_rate": 1.7563636363636364e-06, "loss": 0.4059, "step": 32600 }, { "epoch": 28.26, "learning_rate": 1.7556643356643357e-06, "loss": 0.4445, "step": 32610 }, { "epoch": 28.27, "learning_rate": 1.754965034965035e-06, "loss": 0.4066, "step": 32620 }, { "epoch": 28.28, "learning_rate": 1.754265734265734e-06, "loss": 0.3494, "step": 32630 }, { "epoch": 28.28, "learning_rate": 1.7535664335664335e-06, "loss": 0.3554, "step": 32640 }, { "epoch": 28.29, "learning_rate": 1.7528671328671328e-06, "loss": 0.3856, "step": 32650 }, { "epoch": 28.3, "learning_rate": 1.752167832167832e-06, "loss": 0.3978, "step": 32660 }, { "epoch": 28.31, "learning_rate": 1.7514685314685314e-06, "loss": 0.3472, "step": 32670 }, { "epoch": 28.32, "learning_rate": 1.7507692307692309e-06, "loss": 0.3697, "step": 32680 }, { "epoch": 28.33, "learning_rate": 1.75006993006993e-06, "loss": 0.3225, "step": 32690 }, { "epoch": 28.34, "learning_rate": 1.7493706293706292e-06, "loss": 0.3769, "step": 32700 }, { "epoch": 28.34, "learning_rate": 1.7486713286713285e-06, "loss": 0.3747, "step": 32710 }, { "epoch": 28.35, "learning_rate": 1.7479720279720278e-06, "loss": 0.3268, "step": 32720 }, { "epoch": 28.36, "learning_rate": 1.7472727272727273e-06, "loss": 0.4022, "step": 32730 }, { "epoch": 28.37, "learning_rate": 1.7465734265734264e-06, "loss": 0.3495, "step": 32740 }, { "epoch": 28.38, "learning_rate": 1.7458741258741259e-06, "loss": 0.4143, "step": 32750 }, { "epoch": 28.39, "learning_rate": 1.7451748251748251e-06, "loss": 0.3261, "step": 32760 }, { "epoch": 28.4, "learning_rate": 1.7444755244755244e-06, "loss": 0.3724, "step": 32770 }, { "epoch": 28.41, "learning_rate": 1.7437762237762237e-06, "loss": 0.3713, "step": 32780 }, { "epoch": 28.41, "learning_rate": 1.7430769230769228e-06, "loss": 0.4072, "step": 32790 }, { "epoch": 28.42, "learning_rate": 1.7423776223776223e-06, "loss": 0.3862, "step": 32800 }, { "epoch": 28.43, "learning_rate": 1.7416783216783216e-06, "loss": 0.4113, "step": 32810 }, { "epoch": 28.44, "learning_rate": 1.7409790209790209e-06, "loss": 0.3918, "step": 32820 }, { "epoch": 28.45, "learning_rate": 1.7403496503496501e-06, "loss": 0.369, "step": 32830 }, { "epoch": 28.46, "learning_rate": 1.7396503496503496e-06, "loss": 0.3563, "step": 32840 }, { "epoch": 28.47, "learning_rate": 1.7389510489510489e-06, "loss": 0.3593, "step": 32850 }, { "epoch": 28.47, "learning_rate": 1.7382517482517482e-06, "loss": 0.3922, "step": 32860 }, { "epoch": 28.48, "learning_rate": 1.7375524475524475e-06, "loss": 0.4448, "step": 32870 }, { "epoch": 28.49, "learning_rate": 1.736853146853147e-06, "loss": 0.3888, "step": 32880 }, { "epoch": 28.5, "learning_rate": 1.736153846153846e-06, "loss": 0.3244, "step": 32890 }, { "epoch": 28.51, "learning_rate": 1.7354545454545453e-06, "loss": 0.3501, "step": 32900 }, { "epoch": 28.52, "learning_rate": 1.7347552447552446e-06, "loss": 0.4159, "step": 32910 }, { "epoch": 28.53, "learning_rate": 1.7340559440559439e-06, "loss": 0.3692, "step": 32920 }, { "epoch": 28.54, "learning_rate": 1.7333566433566434e-06, "loss": 0.3711, "step": 32930 }, { "epoch": 28.54, "learning_rate": 1.7326573426573425e-06, "loss": 0.3636, "step": 32940 }, { "epoch": 28.55, "learning_rate": 1.731958041958042e-06, "loss": 0.3652, "step": 32950 }, { "epoch": 28.56, "learning_rate": 1.7312587412587412e-06, "loss": 0.4086, "step": 32960 }, { "epoch": 28.57, "learning_rate": 1.7305594405594405e-06, "loss": 0.3202, "step": 32970 }, { "epoch": 28.58, "learning_rate": 1.7298601398601398e-06, "loss": 0.33, "step": 32980 }, { "epoch": 28.59, "learning_rate": 1.729160839160839e-06, "loss": 0.371, "step": 32990 }, { "epoch": 28.6, "learning_rate": 1.7284615384615384e-06, "loss": 0.384, "step": 33000 }, { "epoch": 28.6, "learning_rate": 1.7277622377622377e-06, "loss": 0.3612, "step": 33010 }, { "epoch": 28.61, "learning_rate": 1.727062937062937e-06, "loss": 0.385, "step": 33020 }, { "epoch": 28.62, "learning_rate": 1.7263636363636362e-06, "loss": 0.3638, "step": 33030 }, { "epoch": 28.63, "learning_rate": 1.7256643356643357e-06, "loss": 0.3553, "step": 33040 }, { "epoch": 28.64, "learning_rate": 1.7249650349650348e-06, "loss": 0.4293, "step": 33050 }, { "epoch": 28.65, "learning_rate": 1.7242657342657343e-06, "loss": 0.385, "step": 33060 }, { "epoch": 28.66, "learning_rate": 1.7235664335664336e-06, "loss": 0.3787, "step": 33070 }, { "epoch": 28.67, "learning_rate": 1.7228671328671327e-06, "loss": 0.373, "step": 33080 }, { "epoch": 28.67, "learning_rate": 1.7221678321678322e-06, "loss": 0.3868, "step": 33090 }, { "epoch": 28.68, "learning_rate": 1.7214685314685312e-06, "loss": 0.3748, "step": 33100 }, { "epoch": 28.69, "learning_rate": 1.7207692307692307e-06, "loss": 0.3846, "step": 33110 }, { "epoch": 28.7, "learning_rate": 1.72006993006993e-06, "loss": 0.3777, "step": 33120 }, { "epoch": 28.71, "learning_rate": 1.7193706293706293e-06, "loss": 0.369, "step": 33130 }, { "epoch": 28.72, "learning_rate": 1.7186713286713286e-06, "loss": 0.3733, "step": 33140 }, { "epoch": 28.73, "learning_rate": 1.717972027972028e-06, "loss": 0.3676, "step": 33150 }, { "epoch": 28.73, "learning_rate": 1.7172727272727272e-06, "loss": 0.4108, "step": 33160 }, { "epoch": 28.74, "learning_rate": 1.7165734265734264e-06, "loss": 0.3825, "step": 33170 }, { "epoch": 28.75, "learning_rate": 1.715874125874126e-06, "loss": 0.3638, "step": 33180 }, { "epoch": 28.76, "learning_rate": 1.715174825174825e-06, "loss": 0.3664, "step": 33190 }, { "epoch": 28.77, "learning_rate": 1.7144755244755245e-06, "loss": 0.3941, "step": 33200 }, { "epoch": 28.78, "learning_rate": 1.7137762237762236e-06, "loss": 0.3873, "step": 33210 }, { "epoch": 28.79, "learning_rate": 1.713076923076923e-06, "loss": 0.3623, "step": 33220 }, { "epoch": 28.8, "learning_rate": 1.7123776223776224e-06, "loss": 0.3523, "step": 33230 }, { "epoch": 28.8, "learning_rate": 1.7116783216783214e-06, "loss": 0.3801, "step": 33240 }, { "epoch": 28.81, "learning_rate": 1.710979020979021e-06, "loss": 0.3508, "step": 33250 }, { "epoch": 28.82, "learning_rate": 1.7102797202797202e-06, "loss": 0.3487, "step": 33260 }, { "epoch": 28.83, "learning_rate": 1.7095804195804195e-06, "loss": 0.3378, "step": 33270 }, { "epoch": 28.84, "learning_rate": 1.7088811188811188e-06, "loss": 0.4113, "step": 33280 }, { "epoch": 28.85, "learning_rate": 1.708181818181818e-06, "loss": 0.3687, "step": 33290 }, { "epoch": 28.86, "learning_rate": 1.7074825174825174e-06, "loss": 0.3522, "step": 33300 }, { "epoch": 28.86, "learning_rate": 1.7067832167832169e-06, "loss": 0.3869, "step": 33310 }, { "epoch": 28.87, "learning_rate": 1.706083916083916e-06, "loss": 0.3857, "step": 33320 }, { "epoch": 28.88, "learning_rate": 1.7053846153846152e-06, "loss": 0.3923, "step": 33330 }, { "epoch": 28.89, "learning_rate": 1.7046853146853147e-06, "loss": 0.3645, "step": 33340 }, { "epoch": 28.9, "learning_rate": 1.7039860139860138e-06, "loss": 0.3899, "step": 33350 }, { "epoch": 28.91, "learning_rate": 1.7032867132867133e-06, "loss": 0.3523, "step": 33360 }, { "epoch": 28.92, "learning_rate": 1.7025874125874124e-06, "loss": 0.3441, "step": 33370 }, { "epoch": 28.93, "learning_rate": 1.7018881118881119e-06, "loss": 0.4076, "step": 33380 }, { "epoch": 28.93, "learning_rate": 1.7011888111888111e-06, "loss": 0.3111, "step": 33390 }, { "epoch": 28.94, "learning_rate": 1.7004895104895104e-06, "loss": 0.353, "step": 33400 }, { "epoch": 28.95, "learning_rate": 1.6997902097902097e-06, "loss": 0.4195, "step": 33410 }, { "epoch": 28.96, "learning_rate": 1.699090909090909e-06, "loss": 0.2943, "step": 33420 }, { "epoch": 28.97, "learning_rate": 1.6983916083916083e-06, "loss": 0.3757, "step": 33430 }, { "epoch": 28.98, "learning_rate": 1.6976923076923076e-06, "loss": 0.3184, "step": 33440 }, { "epoch": 28.99, "learning_rate": 1.696993006993007e-06, "loss": 0.4107, "step": 33450 }, { "epoch": 28.99, "learning_rate": 1.6962937062937061e-06, "loss": 0.3916, "step": 33460 }, { "epoch": 29.0, "eval_loss": 0.5656043887138367, "eval_runtime": 135.8464, "eval_samples_per_second": 3.916, "eval_steps_per_second": 1.958, "eval_wer": 0.2494696921000193, "step": 33466 }, { "epoch": 29.0, "learning_rate": 1.6955944055944056e-06, "loss": 0.4027, "step": 33470 }, { "epoch": 29.01, "learning_rate": 1.6948951048951047e-06, "loss": 0.3603, "step": 33480 }, { "epoch": 29.02, "learning_rate": 1.6941958041958042e-06, "loss": 0.364, "step": 33490 }, { "epoch": 29.03, "learning_rate": 1.6934965034965035e-06, "loss": 0.3812, "step": 33500 }, { "epoch": 29.04, "learning_rate": 1.6927972027972026e-06, "loss": 0.3828, "step": 33510 }, { "epoch": 29.05, "learning_rate": 1.692097902097902e-06, "loss": 0.3753, "step": 33520 }, { "epoch": 29.06, "learning_rate": 1.6913986013986013e-06, "loss": 0.3995, "step": 33530 }, { "epoch": 29.06, "learning_rate": 1.6906993006993006e-06, "loss": 0.3793, "step": 33540 }, { "epoch": 29.07, "learning_rate": 1.69e-06, "loss": 0.4096, "step": 33550 }, { "epoch": 29.08, "learning_rate": 1.6893006993006992e-06, "loss": 0.3429, "step": 33560 }, { "epoch": 29.09, "learning_rate": 1.6886013986013985e-06, "loss": 0.3749, "step": 33570 }, { "epoch": 29.1, "learning_rate": 1.687902097902098e-06, "loss": 0.353, "step": 33580 }, { "epoch": 29.11, "learning_rate": 1.687202797202797e-06, "loss": 0.4113, "step": 33590 }, { "epoch": 29.12, "learning_rate": 1.6865034965034963e-06, "loss": 0.3883, "step": 33600 }, { "epoch": 29.12, "learning_rate": 1.6858041958041958e-06, "loss": 0.3624, "step": 33610 }, { "epoch": 29.13, "learning_rate": 1.685104895104895e-06, "loss": 0.3857, "step": 33620 }, { "epoch": 29.14, "learning_rate": 1.6844055944055944e-06, "loss": 0.3628, "step": 33630 }, { "epoch": 29.15, "learning_rate": 1.6837062937062935e-06, "loss": 0.3251, "step": 33640 }, { "epoch": 29.16, "learning_rate": 1.683006993006993e-06, "loss": 0.3287, "step": 33650 }, { "epoch": 29.17, "learning_rate": 1.6823076923076923e-06, "loss": 0.4003, "step": 33660 }, { "epoch": 29.18, "learning_rate": 1.6816083916083915e-06, "loss": 0.3441, "step": 33670 }, { "epoch": 29.19, "learning_rate": 1.6809090909090908e-06, "loss": 0.3336, "step": 33680 }, { "epoch": 29.19, "learning_rate": 1.6802097902097901e-06, "loss": 0.3581, "step": 33690 }, { "epoch": 29.2, "learning_rate": 1.6795104895104894e-06, "loss": 0.3547, "step": 33700 }, { "epoch": 29.21, "learning_rate": 1.6788111888111887e-06, "loss": 0.3512, "step": 33710 }, { "epoch": 29.22, "learning_rate": 1.6781118881118882e-06, "loss": 0.3349, "step": 33720 }, { "epoch": 29.23, "learning_rate": 1.6774125874125873e-06, "loss": 0.335, "step": 33730 }, { "epoch": 29.24, "learning_rate": 1.6767132867132868e-06, "loss": 0.3946, "step": 33740 }, { "epoch": 29.25, "learning_rate": 1.6760139860139858e-06, "loss": 0.3519, "step": 33750 }, { "epoch": 29.25, "learning_rate": 1.6753146853146853e-06, "loss": 0.3994, "step": 33760 }, { "epoch": 29.26, "learning_rate": 1.6746153846153846e-06, "loss": 0.4, "step": 33770 }, { "epoch": 29.27, "learning_rate": 1.6739160839160837e-06, "loss": 0.3892, "step": 33780 }, { "epoch": 29.28, "learning_rate": 1.6732167832167832e-06, "loss": 0.3496, "step": 33790 }, { "epoch": 29.29, "learning_rate": 1.6725174825174825e-06, "loss": 0.3959, "step": 33800 }, { "epoch": 29.3, "learning_rate": 1.6718181818181818e-06, "loss": 0.3793, "step": 33810 }, { "epoch": 29.31, "learning_rate": 1.671118881118881e-06, "loss": 0.3249, "step": 33820 }, { "epoch": 29.32, "learning_rate": 1.6704195804195803e-06, "loss": 0.3672, "step": 33830 }, { "epoch": 29.32, "learning_rate": 1.6697202797202796e-06, "loss": 0.4126, "step": 33840 }, { "epoch": 29.33, "learning_rate": 1.669020979020979e-06, "loss": 0.3912, "step": 33850 }, { "epoch": 29.34, "learning_rate": 1.6683216783216782e-06, "loss": 0.355, "step": 33860 }, { "epoch": 29.35, "learning_rate": 1.6676223776223775e-06, "loss": 0.3485, "step": 33870 }, { "epoch": 29.36, "learning_rate": 1.666923076923077e-06, "loss": 0.3303, "step": 33880 }, { "epoch": 29.37, "learning_rate": 1.666223776223776e-06, "loss": 0.3702, "step": 33890 }, { "epoch": 29.38, "learning_rate": 1.6655244755244755e-06, "loss": 0.3903, "step": 33900 }, { "epoch": 29.38, "learning_rate": 1.6648251748251746e-06, "loss": 0.3441, "step": 33910 }, { "epoch": 29.39, "learning_rate": 1.664125874125874e-06, "loss": 0.4614, "step": 33920 }, { "epoch": 29.4, "learning_rate": 1.6634265734265734e-06, "loss": 0.4162, "step": 33930 }, { "epoch": 29.41, "learning_rate": 1.6627272727272727e-06, "loss": 0.339, "step": 33940 }, { "epoch": 29.42, "learning_rate": 1.662027972027972e-06, "loss": 0.3922, "step": 33950 }, { "epoch": 29.43, "learning_rate": 1.6613286713286712e-06, "loss": 0.403, "step": 33960 }, { "epoch": 29.44, "learning_rate": 1.6606293706293705e-06, "loss": 0.4064, "step": 33970 }, { "epoch": 29.45, "learning_rate": 1.6599300699300698e-06, "loss": 0.3831, "step": 33980 }, { "epoch": 29.45, "learning_rate": 1.6592307692307693e-06, "loss": 0.4108, "step": 33990 }, { "epoch": 29.46, "learning_rate": 1.6585314685314684e-06, "loss": 0.3298, "step": 34000 }, { "epoch": 29.47, "learning_rate": 1.6578321678321679e-06, "loss": 0.3735, "step": 34010 }, { "epoch": 29.48, "learning_rate": 1.657132867132867e-06, "loss": 0.3878, "step": 34020 }, { "epoch": 29.49, "learning_rate": 1.6564335664335664e-06, "loss": 0.398, "step": 34030 }, { "epoch": 29.5, "learning_rate": 1.6557342657342657e-06, "loss": 0.362, "step": 34040 }, { "epoch": 29.51, "learning_rate": 1.6550349650349648e-06, "loss": 0.4029, "step": 34050 }, { "epoch": 29.51, "learning_rate": 1.6543356643356643e-06, "loss": 0.3755, "step": 34060 }, { "epoch": 29.52, "learning_rate": 1.6536363636363636e-06, "loss": 0.3183, "step": 34070 }, { "epoch": 29.53, "learning_rate": 1.6529370629370629e-06, "loss": 0.3432, "step": 34080 }, { "epoch": 29.54, "learning_rate": 1.6522377622377622e-06, "loss": 0.3807, "step": 34090 }, { "epoch": 29.55, "learning_rate": 1.6515384615384614e-06, "loss": 0.3386, "step": 34100 }, { "epoch": 29.56, "learning_rate": 1.6508391608391607e-06, "loss": 0.3606, "step": 34110 }, { "epoch": 29.57, "learning_rate": 1.6501398601398602e-06, "loss": 0.4485, "step": 34120 }, { "epoch": 29.58, "learning_rate": 1.6494405594405593e-06, "loss": 0.3701, "step": 34130 }, { "epoch": 29.58, "learning_rate": 1.6487412587412586e-06, "loss": 0.3498, "step": 34140 }, { "epoch": 29.59, "learning_rate": 1.648041958041958e-06, "loss": 0.3324, "step": 34150 }, { "epoch": 29.6, "learning_rate": 1.6473426573426572e-06, "loss": 0.3444, "step": 34160 }, { "epoch": 29.61, "learning_rate": 1.6466433566433567e-06, "loss": 0.3844, "step": 34170 }, { "epoch": 29.62, "learning_rate": 1.6459440559440557e-06, "loss": 0.3856, "step": 34180 }, { "epoch": 29.63, "learning_rate": 1.6452447552447552e-06, "loss": 0.3968, "step": 34190 }, { "epoch": 29.64, "learning_rate": 1.6445454545454545e-06, "loss": 0.3755, "step": 34200 }, { "epoch": 29.64, "learning_rate": 1.6438461538461538e-06, "loss": 0.4211, "step": 34210 }, { "epoch": 29.65, "learning_rate": 1.643146853146853e-06, "loss": 0.3817, "step": 34220 }, { "epoch": 29.66, "learning_rate": 1.6424475524475524e-06, "loss": 0.3811, "step": 34230 }, { "epoch": 29.67, "learning_rate": 1.6417482517482516e-06, "loss": 0.3229, "step": 34240 }, { "epoch": 29.68, "learning_rate": 1.641048951048951e-06, "loss": 0.421, "step": 34250 }, { "epoch": 29.69, "learning_rate": 1.6403496503496504e-06, "loss": 0.3709, "step": 34260 }, { "epoch": 29.7, "learning_rate": 1.6396503496503495e-06, "loss": 0.4524, "step": 34270 }, { "epoch": 29.71, "learning_rate": 1.638951048951049e-06, "loss": 0.3726, "step": 34280 }, { "epoch": 29.71, "learning_rate": 1.638251748251748e-06, "loss": 0.3111, "step": 34290 }, { "epoch": 29.72, "learning_rate": 1.6375524475524474e-06, "loss": 0.3639, "step": 34300 }, { "epoch": 29.73, "learning_rate": 1.6368531468531469e-06, "loss": 0.4219, "step": 34310 }, { "epoch": 29.74, "learning_rate": 1.636153846153846e-06, "loss": 0.3993, "step": 34320 }, { "epoch": 29.75, "learning_rate": 1.6354545454545454e-06, "loss": 0.3243, "step": 34330 }, { "epoch": 29.76, "learning_rate": 1.6347552447552447e-06, "loss": 0.4005, "step": 34340 }, { "epoch": 29.77, "learning_rate": 1.634055944055944e-06, "loss": 0.4288, "step": 34350 }, { "epoch": 29.77, "learning_rate": 1.6333566433566433e-06, "loss": 0.491, "step": 34360 }, { "epoch": 29.78, "learning_rate": 1.6326573426573426e-06, "loss": 0.4482, "step": 34370 }, { "epoch": 29.79, "learning_rate": 1.6319580419580419e-06, "loss": 0.4113, "step": 34380 }, { "epoch": 29.8, "learning_rate": 1.6312587412587411e-06, "loss": 0.35, "step": 34390 }, { "epoch": 29.81, "learning_rate": 1.6305594405594404e-06, "loss": 0.373, "step": 34400 }, { "epoch": 29.82, "learning_rate": 1.6298601398601397e-06, "loss": 0.3738, "step": 34410 }, { "epoch": 29.83, "learning_rate": 1.6291608391608392e-06, "loss": 0.3479, "step": 34420 }, { "epoch": 29.83, "learning_rate": 1.6284615384615383e-06, "loss": 0.3902, "step": 34430 }, { "epoch": 29.84, "learning_rate": 1.6277622377622378e-06, "loss": 0.377, "step": 34440 }, { "epoch": 29.85, "learning_rate": 1.627062937062937e-06, "loss": 0.3926, "step": 34450 }, { "epoch": 29.86, "learning_rate": 1.6263636363636363e-06, "loss": 0.3604, "step": 34460 }, { "epoch": 29.87, "learning_rate": 1.6256643356643356e-06, "loss": 0.367, "step": 34470 }, { "epoch": 29.88, "learning_rate": 1.6249650349650347e-06, "loss": 0.439, "step": 34480 }, { "epoch": 29.89, "learning_rate": 1.6242657342657342e-06, "loss": 0.4341, "step": 34490 }, { "epoch": 29.9, "learning_rate": 1.6235664335664335e-06, "loss": 0.3464, "step": 34500 }, { "epoch": 29.9, "learning_rate": 1.6228671328671328e-06, "loss": 0.3569, "step": 34510 }, { "epoch": 29.91, "learning_rate": 1.622167832167832e-06, "loss": 0.3835, "step": 34520 }, { "epoch": 29.92, "learning_rate": 1.6215384615384615e-06, "loss": 0.3977, "step": 34530 }, { "epoch": 29.93, "learning_rate": 1.6208391608391608e-06, "loss": 0.3297, "step": 34540 }, { "epoch": 29.94, "learning_rate": 1.62013986013986e-06, "loss": 0.3743, "step": 34550 }, { "epoch": 29.95, "learning_rate": 1.6194405594405594e-06, "loss": 0.4124, "step": 34560 }, { "epoch": 29.96, "learning_rate": 1.6187412587412589e-06, "loss": 0.3618, "step": 34570 }, { "epoch": 29.96, "learning_rate": 1.618041958041958e-06, "loss": 0.3684, "step": 34580 }, { "epoch": 29.97, "learning_rate": 1.6173426573426572e-06, "loss": 0.362, "step": 34590 }, { "epoch": 29.98, "learning_rate": 1.6166433566433565e-06, "loss": 0.3643, "step": 34600 }, { "epoch": 29.99, "learning_rate": 1.6159440559440558e-06, "loss": 0.351, "step": 34610 }, { "epoch": 30.0, "learning_rate": 1.6152447552447553e-06, "loss": 0.4298, "step": 34620 }, { "epoch": 30.0, "eval_loss": 0.5718466639518738, "eval_runtime": 137.3598, "eval_samples_per_second": 3.873, "eval_steps_per_second": 1.937, "eval_wer": 0.24985537057273252, "step": 34620 }, { "epoch": 30.01, "learning_rate": 1.6145454545454544e-06, "loss": 0.4091, "step": 34630 }, { "epoch": 30.02, "learning_rate": 1.6138461538461539e-06, "loss": 0.3421, "step": 34640 }, { "epoch": 30.03, "learning_rate": 1.6131468531468532e-06, "loss": 0.3637, "step": 34650 }, { "epoch": 30.03, "learning_rate": 1.6124475524475524e-06, "loss": 0.3804, "step": 34660 }, { "epoch": 30.04, "learning_rate": 1.6117482517482517e-06, "loss": 0.3391, "step": 34670 }, { "epoch": 30.05, "learning_rate": 1.6110489510489508e-06, "loss": 0.3682, "step": 34680 }, { "epoch": 30.06, "learning_rate": 1.6103496503496503e-06, "loss": 0.4202, "step": 34690 }, { "epoch": 30.07, "learning_rate": 1.6096503496503496e-06, "loss": 0.3785, "step": 34700 }, { "epoch": 30.08, "learning_rate": 1.6089510489510489e-06, "loss": 0.424, "step": 34710 }, { "epoch": 30.09, "learning_rate": 1.6082517482517482e-06, "loss": 0.3877, "step": 34720 }, { "epoch": 30.1, "learning_rate": 1.6075524475524476e-06, "loss": 0.3444, "step": 34730 }, { "epoch": 30.1, "learning_rate": 1.6068531468531467e-06, "loss": 0.3997, "step": 34740 }, { "epoch": 30.11, "learning_rate": 1.606153846153846e-06, "loss": 0.3541, "step": 34750 }, { "epoch": 30.12, "learning_rate": 1.6054545454545453e-06, "loss": 0.3894, "step": 34760 }, { "epoch": 30.13, "learning_rate": 1.6047552447552446e-06, "loss": 0.3606, "step": 34770 }, { "epoch": 30.14, "learning_rate": 1.604055944055944e-06, "loss": 0.3636, "step": 34780 }, { "epoch": 30.15, "learning_rate": 1.6033566433566431e-06, "loss": 0.3572, "step": 34790 }, { "epoch": 30.16, "learning_rate": 1.6026573426573426e-06, "loss": 0.3856, "step": 34800 }, { "epoch": 30.16, "learning_rate": 1.601958041958042e-06, "loss": 0.3364, "step": 34810 }, { "epoch": 30.17, "learning_rate": 1.6012587412587412e-06, "loss": 0.3653, "step": 34820 }, { "epoch": 30.18, "learning_rate": 1.6005594405594405e-06, "loss": 0.3721, "step": 34830 }, { "epoch": 30.19, "learning_rate": 1.5998601398601398e-06, "loss": 0.3632, "step": 34840 }, { "epoch": 30.2, "learning_rate": 1.599160839160839e-06, "loss": 0.3592, "step": 34850 }, { "epoch": 30.21, "learning_rate": 1.5984615384615384e-06, "loss": 0.3721, "step": 34860 }, { "epoch": 30.22, "learning_rate": 1.5977622377622376e-06, "loss": 0.4172, "step": 34870 }, { "epoch": 30.23, "learning_rate": 1.597062937062937e-06, "loss": 0.3367, "step": 34880 }, { "epoch": 30.23, "learning_rate": 1.5963636363636364e-06, "loss": 0.3765, "step": 34890 }, { "epoch": 30.24, "learning_rate": 1.5956643356643355e-06, "loss": 0.3662, "step": 34900 }, { "epoch": 30.25, "learning_rate": 1.594965034965035e-06, "loss": 0.3884, "step": 34910 }, { "epoch": 30.26, "learning_rate": 1.5942657342657343e-06, "loss": 0.3728, "step": 34920 }, { "epoch": 30.27, "learning_rate": 1.5935664335664334e-06, "loss": 0.3489, "step": 34930 }, { "epoch": 30.28, "learning_rate": 1.5928671328671328e-06, "loss": 0.3379, "step": 34940 }, { "epoch": 30.29, "learning_rate": 1.592167832167832e-06, "loss": 0.3322, "step": 34950 }, { "epoch": 30.29, "learning_rate": 1.5914685314685314e-06, "loss": 0.3663, "step": 34960 }, { "epoch": 30.3, "learning_rate": 1.5907692307692307e-06, "loss": 0.4156, "step": 34970 }, { "epoch": 30.31, "learning_rate": 1.59006993006993e-06, "loss": 0.3471, "step": 34980 }, { "epoch": 30.32, "learning_rate": 1.5893706293706293e-06, "loss": 0.369, "step": 34990 }, { "epoch": 30.33, "learning_rate": 1.5886713286713288e-06, "loss": 0.3399, "step": 35000 }, { "epoch": 30.34, "learning_rate": 1.5879720279720278e-06, "loss": 0.3496, "step": 35010 }, { "epoch": 30.35, "learning_rate": 1.5872727272727271e-06, "loss": 0.3927, "step": 35020 }, { "epoch": 30.36, "learning_rate": 1.5865734265734266e-06, "loss": 0.3727, "step": 35030 }, { "epoch": 30.36, "learning_rate": 1.5858741258741257e-06, "loss": 0.358, "step": 35040 }, { "epoch": 30.37, "learning_rate": 1.5851748251748252e-06, "loss": 0.3672, "step": 35050 }, { "epoch": 30.38, "learning_rate": 1.5844755244755243e-06, "loss": 0.3451, "step": 35060 }, { "epoch": 30.39, "learning_rate": 1.5837762237762238e-06, "loss": 0.3325, "step": 35070 }, { "epoch": 30.4, "learning_rate": 1.583076923076923e-06, "loss": 0.3569, "step": 35080 }, { "epoch": 30.41, "learning_rate": 1.5823776223776223e-06, "loss": 0.371, "step": 35090 }, { "epoch": 30.42, "learning_rate": 1.5816783216783216e-06, "loss": 0.3603, "step": 35100 }, { "epoch": 30.42, "learning_rate": 1.580979020979021e-06, "loss": 0.3758, "step": 35110 }, { "epoch": 30.43, "learning_rate": 1.5802797202797202e-06, "loss": 0.3824, "step": 35120 }, { "epoch": 30.44, "learning_rate": 1.5795804195804195e-06, "loss": 0.3723, "step": 35130 }, { "epoch": 30.45, "learning_rate": 1.5788811188811188e-06, "loss": 0.4211, "step": 35140 }, { "epoch": 30.46, "learning_rate": 1.578181818181818e-06, "loss": 0.3785, "step": 35150 }, { "epoch": 30.47, "learning_rate": 1.5774825174825175e-06, "loss": 0.409, "step": 35160 }, { "epoch": 30.48, "learning_rate": 1.5767832167832166e-06, "loss": 0.4054, "step": 35170 }, { "epoch": 30.49, "learning_rate": 1.5760839160839161e-06, "loss": 0.3717, "step": 35180 }, { "epoch": 30.49, "learning_rate": 1.5753846153846154e-06, "loss": 0.4008, "step": 35190 }, { "epoch": 30.5, "learning_rate": 1.5746853146853145e-06, "loss": 0.3472, "step": 35200 }, { "epoch": 30.51, "learning_rate": 1.573986013986014e-06, "loss": 0.4362, "step": 35210 }, { "epoch": 30.52, "learning_rate": 1.573286713286713e-06, "loss": 0.4502, "step": 35220 }, { "epoch": 30.53, "learning_rate": 1.5725874125874125e-06, "loss": 0.3301, "step": 35230 }, { "epoch": 30.54, "learning_rate": 1.5718881118881118e-06, "loss": 0.3875, "step": 35240 }, { "epoch": 30.55, "learning_rate": 1.5711888111888111e-06, "loss": 0.352, "step": 35250 }, { "epoch": 30.55, "learning_rate": 1.5704895104895104e-06, "loss": 0.3891, "step": 35260 }, { "epoch": 30.56, "learning_rate": 1.56979020979021e-06, "loss": 0.4293, "step": 35270 }, { "epoch": 30.57, "learning_rate": 1.569090909090909e-06, "loss": 0.3905, "step": 35280 }, { "epoch": 30.58, "learning_rate": 1.5683916083916083e-06, "loss": 0.3849, "step": 35290 }, { "epoch": 30.59, "learning_rate": 1.5676923076923078e-06, "loss": 0.39, "step": 35300 }, { "epoch": 30.6, "learning_rate": 1.5669930069930068e-06, "loss": 0.396, "step": 35310 }, { "epoch": 30.61, "learning_rate": 1.5662937062937063e-06, "loss": 0.3906, "step": 35320 }, { "epoch": 30.61, "learning_rate": 1.5655944055944054e-06, "loss": 0.3884, "step": 35330 }, { "epoch": 30.62, "learning_rate": 1.5648951048951049e-06, "loss": 0.3665, "step": 35340 }, { "epoch": 30.63, "learning_rate": 1.5641958041958042e-06, "loss": 0.3593, "step": 35350 }, { "epoch": 30.64, "learning_rate": 1.5634965034965035e-06, "loss": 0.3586, "step": 35360 }, { "epoch": 30.65, "learning_rate": 1.5627972027972027e-06, "loss": 0.3464, "step": 35370 }, { "epoch": 30.66, "learning_rate": 1.562097902097902e-06, "loss": 0.3643, "step": 35380 }, { "epoch": 30.67, "learning_rate": 1.5613986013986013e-06, "loss": 0.3734, "step": 35390 }, { "epoch": 30.68, "learning_rate": 1.5606993006993006e-06, "loss": 0.3686, "step": 35400 }, { "epoch": 30.68, "learning_rate": 1.5599999999999999e-06, "loss": 0.3713, "step": 35410 }, { "epoch": 30.69, "learning_rate": 1.5593006993006992e-06, "loss": 0.3656, "step": 35420 }, { "epoch": 30.7, "learning_rate": 1.5586013986013987e-06, "loss": 0.3911, "step": 35430 }, { "epoch": 30.71, "learning_rate": 1.5579020979020977e-06, "loss": 0.3081, "step": 35440 }, { "epoch": 30.72, "learning_rate": 1.5572027972027972e-06, "loss": 0.3021, "step": 35450 }, { "epoch": 30.73, "learning_rate": 1.5565034965034965e-06, "loss": 0.4553, "step": 35460 }, { "epoch": 30.74, "learning_rate": 1.5558041958041956e-06, "loss": 0.3951, "step": 35470 }, { "epoch": 30.74, "learning_rate": 1.555104895104895e-06, "loss": 0.372, "step": 35480 }, { "epoch": 30.75, "learning_rate": 1.5544055944055942e-06, "loss": 0.37, "step": 35490 }, { "epoch": 30.76, "learning_rate": 1.5537062937062937e-06, "loss": 0.3266, "step": 35500 }, { "epoch": 30.77, "learning_rate": 1.553006993006993e-06, "loss": 0.3462, "step": 35510 }, { "epoch": 30.78, "learning_rate": 1.5523076923076922e-06, "loss": 0.3416, "step": 35520 }, { "epoch": 30.79, "learning_rate": 1.5516083916083915e-06, "loss": 0.355, "step": 35530 }, { "epoch": 30.8, "learning_rate": 1.550909090909091e-06, "loss": 0.3883, "step": 35540 }, { "epoch": 30.81, "learning_rate": 1.55020979020979e-06, "loss": 0.3916, "step": 35550 }, { "epoch": 30.81, "learning_rate": 1.5495104895104894e-06, "loss": 0.407, "step": 35560 }, { "epoch": 30.82, "learning_rate": 1.5488111888111889e-06, "loss": 0.3629, "step": 35570 }, { "epoch": 30.83, "learning_rate": 1.548111888111888e-06, "loss": 0.3844, "step": 35580 }, { "epoch": 30.84, "learning_rate": 1.5474125874125874e-06, "loss": 0.3713, "step": 35590 }, { "epoch": 30.85, "learning_rate": 1.5467132867132865e-06, "loss": 0.3512, "step": 35600 }, { "epoch": 30.86, "learning_rate": 1.546013986013986e-06, "loss": 0.3197, "step": 35610 }, { "epoch": 30.87, "learning_rate": 1.5453146853146853e-06, "loss": 0.3575, "step": 35620 }, { "epoch": 30.87, "learning_rate": 1.5446153846153846e-06, "loss": 0.3383, "step": 35630 }, { "epoch": 30.88, "learning_rate": 1.5439160839160839e-06, "loss": 0.3747, "step": 35640 }, { "epoch": 30.89, "learning_rate": 1.5432167832167832e-06, "loss": 0.3644, "step": 35650 }, { "epoch": 30.9, "learning_rate": 1.5425174825174824e-06, "loss": 0.3445, "step": 35660 }, { "epoch": 30.91, "learning_rate": 1.5418181818181817e-06, "loss": 0.3674, "step": 35670 }, { "epoch": 30.92, "learning_rate": 1.541118881118881e-06, "loss": 0.404, "step": 35680 }, { "epoch": 30.93, "learning_rate": 1.5404195804195803e-06, "loss": 0.3292, "step": 35690 }, { "epoch": 30.94, "learning_rate": 1.5397202797202798e-06, "loss": 0.3722, "step": 35700 }, { "epoch": 30.94, "learning_rate": 1.5390209790209789e-06, "loss": 0.3704, "step": 35710 }, { "epoch": 30.95, "learning_rate": 1.5383216783216784e-06, "loss": 0.4484, "step": 35720 }, { "epoch": 30.96, "learning_rate": 1.5376223776223776e-06, "loss": 0.3342, "step": 35730 }, { "epoch": 30.97, "learning_rate": 1.5369230769230767e-06, "loss": 0.3784, "step": 35740 }, { "epoch": 30.98, "learning_rate": 1.5362237762237762e-06, "loss": 0.3727, "step": 35750 }, { "epoch": 30.99, "learning_rate": 1.5355244755244753e-06, "loss": 0.3832, "step": 35760 }, { "epoch": 31.0, "learning_rate": 1.5348251748251748e-06, "loss": 0.3544, "step": 35770 }, { "epoch": 31.0, "eval_loss": 0.5595405697822571, "eval_runtime": 134.7991, "eval_samples_per_second": 3.947, "eval_steps_per_second": 1.973, "eval_wer": 0.24445587195474705, "step": 35774 }, { "epoch": 31.01, "learning_rate": 1.534125874125874e-06, "loss": 0.3527, "step": 35780 }, { "epoch": 31.01, "learning_rate": 1.5334265734265734e-06, "loss": 0.3921, "step": 35790 }, { "epoch": 31.02, "learning_rate": 1.5327272727272726e-06, "loss": 0.354, "step": 35800 }, { "epoch": 31.03, "learning_rate": 1.532027972027972e-06, "loss": 0.3689, "step": 35810 }, { "epoch": 31.04, "learning_rate": 1.5313286713286712e-06, "loss": 0.3668, "step": 35820 }, { "epoch": 31.05, "learning_rate": 1.5306293706293705e-06, "loss": 0.3723, "step": 35830 }, { "epoch": 31.06, "learning_rate": 1.52993006993007e-06, "loss": 0.3158, "step": 35840 }, { "epoch": 31.07, "learning_rate": 1.529230769230769e-06, "loss": 0.3894, "step": 35850 }, { "epoch": 31.07, "learning_rate": 1.5285314685314686e-06, "loss": 0.3496, "step": 35860 }, { "epoch": 31.08, "learning_rate": 1.5278321678321676e-06, "loss": 0.3798, "step": 35870 }, { "epoch": 31.09, "learning_rate": 1.5271328671328671e-06, "loss": 0.4188, "step": 35880 }, { "epoch": 31.1, "learning_rate": 1.5264335664335664e-06, "loss": 0.4129, "step": 35890 }, { "epoch": 31.11, "learning_rate": 1.5257342657342655e-06, "loss": 0.3586, "step": 35900 }, { "epoch": 31.12, "learning_rate": 1.525034965034965e-06, "loss": 0.389, "step": 35910 }, { "epoch": 31.13, "learning_rate": 1.5243356643356643e-06, "loss": 0.3768, "step": 35920 }, { "epoch": 31.14, "learning_rate": 1.5236363636363636e-06, "loss": 0.3302, "step": 35930 }, { "epoch": 31.14, "learning_rate": 1.5229370629370628e-06, "loss": 0.3416, "step": 35940 }, { "epoch": 31.15, "learning_rate": 1.5222377622377621e-06, "loss": 0.3617, "step": 35950 }, { "epoch": 31.16, "learning_rate": 1.5215384615384614e-06, "loss": 0.347, "step": 35960 }, { "epoch": 31.17, "learning_rate": 1.520839160839161e-06, "loss": 0.4397, "step": 35970 }, { "epoch": 31.18, "learning_rate": 1.52013986013986e-06, "loss": 0.33, "step": 35980 }, { "epoch": 31.19, "learning_rate": 1.5194405594405593e-06, "loss": 0.3698, "step": 35990 }, { "epoch": 31.2, "learning_rate": 1.5187412587412588e-06, "loss": 0.2978, "step": 36000 }, { "epoch": 31.2, "learning_rate": 1.5180419580419578e-06, "loss": 0.3654, "step": 36010 }, { "epoch": 31.21, "learning_rate": 1.5173426573426573e-06, "loss": 0.3906, "step": 36020 }, { "epoch": 31.22, "learning_rate": 1.5166433566433564e-06, "loss": 0.4131, "step": 36030 }, { "epoch": 31.23, "learning_rate": 1.515944055944056e-06, "loss": 0.3378, "step": 36040 }, { "epoch": 31.24, "learning_rate": 1.5152447552447552e-06, "loss": 0.3822, "step": 36050 }, { "epoch": 31.25, "learning_rate": 1.5145454545454545e-06, "loss": 0.3885, "step": 36060 }, { "epoch": 31.26, "learning_rate": 1.5138461538461538e-06, "loss": 0.4119, "step": 36070 }, { "epoch": 31.27, "learning_rate": 1.513146853146853e-06, "loss": 0.4497, "step": 36080 }, { "epoch": 31.27, "learning_rate": 1.5124475524475523e-06, "loss": 0.386, "step": 36090 }, { "epoch": 31.28, "learning_rate": 1.5117482517482516e-06, "loss": 0.3351, "step": 36100 }, { "epoch": 31.29, "learning_rate": 1.5110489510489511e-06, "loss": 0.3998, "step": 36110 }, { "epoch": 31.3, "learning_rate": 1.5103496503496502e-06, "loss": 0.4054, "step": 36120 }, { "epoch": 31.31, "learning_rate": 1.5096503496503497e-06, "loss": 0.4027, "step": 36130 }, { "epoch": 31.32, "learning_rate": 1.5089510489510488e-06, "loss": 0.4144, "step": 36140 }, { "epoch": 31.33, "learning_rate": 1.5082517482517483e-06, "loss": 0.3257, "step": 36150 }, { "epoch": 31.33, "learning_rate": 1.5075524475524475e-06, "loss": 0.3145, "step": 36160 }, { "epoch": 31.34, "learning_rate": 1.5068531468531466e-06, "loss": 0.3325, "step": 36170 }, { "epoch": 31.35, "learning_rate": 1.5061538461538461e-06, "loss": 0.3591, "step": 36180 }, { "epoch": 31.36, "learning_rate": 1.5054545454545454e-06, "loss": 0.3613, "step": 36190 }, { "epoch": 31.37, "learning_rate": 1.5047552447552447e-06, "loss": 0.3663, "step": 36200 }, { "epoch": 31.38, "learning_rate": 1.504055944055944e-06, "loss": 0.3922, "step": 36210 }, { "epoch": 31.39, "learning_rate": 1.5033566433566433e-06, "loss": 0.349, "step": 36220 }, { "epoch": 31.39, "learning_rate": 1.5026573426573425e-06, "loss": 0.3971, "step": 36230 }, { "epoch": 31.4, "learning_rate": 1.501958041958042e-06, "loss": 0.3792, "step": 36240 }, { "epoch": 31.41, "learning_rate": 1.5012587412587411e-06, "loss": 0.3938, "step": 36250 }, { "epoch": 31.42, "learning_rate": 1.5005594405594404e-06, "loss": 0.3061, "step": 36260 }, { "epoch": 31.43, "learning_rate": 1.49986013986014e-06, "loss": 0.3731, "step": 36270 }, { "epoch": 31.44, "learning_rate": 1.499160839160839e-06, "loss": 0.3302, "step": 36280 }, { "epoch": 31.45, "learning_rate": 1.4984615384615385e-06, "loss": 0.3524, "step": 36290 }, { "epoch": 31.46, "learning_rate": 1.4977622377622378e-06, "loss": 0.3296, "step": 36300 }, { "epoch": 31.46, "learning_rate": 1.497062937062937e-06, "loss": 0.3934, "step": 36310 }, { "epoch": 31.47, "learning_rate": 1.4963636363636363e-06, "loss": 0.3872, "step": 36320 }, { "epoch": 31.48, "learning_rate": 1.4956643356643356e-06, "loss": 0.3328, "step": 36330 }, { "epoch": 31.49, "learning_rate": 1.4949650349650349e-06, "loss": 0.4192, "step": 36340 }, { "epoch": 31.5, "learning_rate": 1.4942657342657342e-06, "loss": 0.3213, "step": 36350 }, { "epoch": 31.51, "learning_rate": 1.4935664335664335e-06, "loss": 0.3741, "step": 36360 }, { "epoch": 31.52, "learning_rate": 1.4928671328671327e-06, "loss": 0.4464, "step": 36370 }, { "epoch": 31.52, "learning_rate": 1.4921678321678322e-06, "loss": 0.3015, "step": 36380 }, { "epoch": 31.53, "learning_rate": 1.4914685314685313e-06, "loss": 0.4096, "step": 36390 }, { "epoch": 31.54, "learning_rate": 1.4907692307692308e-06, "loss": 0.3798, "step": 36400 }, { "epoch": 31.55, "learning_rate": 1.4900699300699299e-06, "loss": 0.3412, "step": 36410 }, { "epoch": 31.56, "learning_rate": 1.4893706293706294e-06, "loss": 0.3456, "step": 36420 }, { "epoch": 31.57, "learning_rate": 1.4886713286713287e-06, "loss": 0.3703, "step": 36430 }, { "epoch": 31.58, "learning_rate": 1.4879720279720277e-06, "loss": 0.395, "step": 36440 }, { "epoch": 31.59, "learning_rate": 1.4872727272727272e-06, "loss": 0.3474, "step": 36450 }, { "epoch": 31.59, "learning_rate": 1.4865734265734265e-06, "loss": 0.3511, "step": 36460 }, { "epoch": 31.6, "learning_rate": 1.4858741258741258e-06, "loss": 0.3584, "step": 36470 }, { "epoch": 31.61, "learning_rate": 1.485174825174825e-06, "loss": 0.2995, "step": 36480 }, { "epoch": 31.62, "learning_rate": 1.4844755244755246e-06, "loss": 0.3691, "step": 36490 }, { "epoch": 31.63, "learning_rate": 1.4837762237762237e-06, "loss": 0.3622, "step": 36500 }, { "epoch": 31.64, "learning_rate": 1.4830769230769232e-06, "loss": 0.3831, "step": 36510 }, { "epoch": 31.65, "learning_rate": 1.4823776223776222e-06, "loss": 0.3504, "step": 36520 }, { "epoch": 31.65, "learning_rate": 1.4816783216783215e-06, "loss": 0.3921, "step": 36530 }, { "epoch": 31.66, "learning_rate": 1.480979020979021e-06, "loss": 0.3505, "step": 36540 }, { "epoch": 31.67, "learning_rate": 1.48027972027972e-06, "loss": 0.4103, "step": 36550 }, { "epoch": 31.68, "learning_rate": 1.4795804195804196e-06, "loss": 0.3525, "step": 36560 }, { "epoch": 31.69, "learning_rate": 1.4788811188811189e-06, "loss": 0.3725, "step": 36570 }, { "epoch": 31.7, "learning_rate": 1.4781818181818182e-06, "loss": 0.3332, "step": 36580 }, { "epoch": 31.71, "learning_rate": 1.4774825174825174e-06, "loss": 0.3543, "step": 36590 }, { "epoch": 31.72, "learning_rate": 1.4767832167832167e-06, "loss": 0.361, "step": 36600 }, { "epoch": 31.72, "learning_rate": 1.476083916083916e-06, "loss": 0.3543, "step": 36610 }, { "epoch": 31.73, "learning_rate": 1.4753846153846153e-06, "loss": 0.4512, "step": 36620 }, { "epoch": 31.74, "learning_rate": 1.4746853146853146e-06, "loss": 0.3457, "step": 36630 }, { "epoch": 31.75, "learning_rate": 1.4739860139860139e-06, "loss": 0.3774, "step": 36640 }, { "epoch": 31.76, "learning_rate": 1.4732867132867134e-06, "loss": 0.3264, "step": 36650 }, { "epoch": 31.77, "learning_rate": 1.4725874125874124e-06, "loss": 0.3726, "step": 36660 }, { "epoch": 31.78, "learning_rate": 1.471888111888112e-06, "loss": 0.3406, "step": 36670 }, { "epoch": 31.78, "learning_rate": 1.471188811188811e-06, "loss": 0.3768, "step": 36680 }, { "epoch": 31.79, "learning_rate": 1.4704895104895105e-06, "loss": 0.4042, "step": 36690 }, { "epoch": 31.8, "learning_rate": 1.4697902097902098e-06, "loss": 0.3551, "step": 36700 }, { "epoch": 31.81, "learning_rate": 1.4690909090909089e-06, "loss": 0.3684, "step": 36710 }, { "epoch": 31.82, "learning_rate": 1.4683916083916084e-06, "loss": 0.3271, "step": 36720 }, { "epoch": 31.83, "learning_rate": 1.4676923076923076e-06, "loss": 0.4142, "step": 36730 }, { "epoch": 31.84, "learning_rate": 1.466993006993007e-06, "loss": 0.3726, "step": 36740 }, { "epoch": 31.85, "learning_rate": 1.4662937062937062e-06, "loss": 0.3297, "step": 36750 }, { "epoch": 31.85, "learning_rate": 1.4655944055944057e-06, "loss": 0.3958, "step": 36760 }, { "epoch": 31.86, "learning_rate": 1.4648951048951048e-06, "loss": 0.4074, "step": 36770 }, { "epoch": 31.87, "learning_rate": 1.464195804195804e-06, "loss": 0.3892, "step": 36780 }, { "epoch": 31.88, "learning_rate": 1.4634965034965034e-06, "loss": 0.3234, "step": 36790 }, { "epoch": 31.89, "learning_rate": 1.4627972027972026e-06, "loss": 0.385, "step": 36800 }, { "epoch": 31.9, "learning_rate": 1.4620979020979021e-06, "loss": 0.3705, "step": 36810 }, { "epoch": 31.91, "learning_rate": 1.4613986013986012e-06, "loss": 0.3915, "step": 36820 }, { "epoch": 31.91, "learning_rate": 1.4606993006993007e-06, "loss": 0.339, "step": 36830 }, { "epoch": 31.92, "learning_rate": 1.46e-06, "loss": 0.3448, "step": 36840 }, { "epoch": 31.93, "learning_rate": 1.4593006993006993e-06, "loss": 0.3134, "step": 36850 }, { "epoch": 31.94, "learning_rate": 1.4586013986013986e-06, "loss": 0.4355, "step": 36860 }, { "epoch": 31.95, "learning_rate": 1.4579020979020976e-06, "loss": 0.4304, "step": 36870 }, { "epoch": 31.96, "learning_rate": 1.4572027972027971e-06, "loss": 0.3529, "step": 36880 }, { "epoch": 31.97, "learning_rate": 1.4565034965034964e-06, "loss": 0.3889, "step": 36890 }, { "epoch": 31.98, "learning_rate": 1.4558041958041957e-06, "loss": 0.3798, "step": 36900 }, { "epoch": 31.98, "learning_rate": 1.455104895104895e-06, "loss": 0.4097, "step": 36910 }, { "epoch": 31.99, "learning_rate": 1.4544055944055945e-06, "loss": 0.3748, "step": 36920 }, { "epoch": 32.0, "eval_loss": 0.5464403033256531, "eval_runtime": 135.0985, "eval_samples_per_second": 3.938, "eval_steps_per_second": 1.969, "eval_wer": 0.24606286559105225, "step": 36928 }, { "epoch": 32.0, "learning_rate": 1.4537062937062936e-06, "loss": 0.4613, "step": 36930 }, { "epoch": 32.01, "learning_rate": 1.453006993006993e-06, "loss": 0.3701, "step": 36940 }, { "epoch": 32.02, "learning_rate": 1.4523076923076921e-06, "loss": 0.3776, "step": 36950 }, { "epoch": 32.03, "learning_rate": 1.4516083916083914e-06, "loss": 0.3505, "step": 36960 }, { "epoch": 32.04, "learning_rate": 1.450909090909091e-06, "loss": 0.383, "step": 36970 }, { "epoch": 32.05, "learning_rate": 1.45020979020979e-06, "loss": 0.3804, "step": 36980 }, { "epoch": 32.05, "learning_rate": 1.4495104895104895e-06, "loss": 0.4103, "step": 36990 }, { "epoch": 32.06, "learning_rate": 1.4488111888111888e-06, "loss": 0.3761, "step": 37000 }, { "epoch": 32.07, "learning_rate": 1.448111888111888e-06, "loss": 0.3826, "step": 37010 }, { "epoch": 32.08, "learning_rate": 1.4474125874125873e-06, "loss": 0.3426, "step": 37020 }, { "epoch": 32.09, "learning_rate": 1.4467132867132868e-06, "loss": 0.3708, "step": 37030 }, { "epoch": 32.1, "learning_rate": 1.446013986013986e-06, "loss": 0.3203, "step": 37040 }, { "epoch": 32.11, "learning_rate": 1.4453146853146852e-06, "loss": 0.3502, "step": 37050 }, { "epoch": 32.11, "learning_rate": 1.4446153846153845e-06, "loss": 0.3708, "step": 37060 }, { "epoch": 32.12, "learning_rate": 1.4439160839160838e-06, "loss": 0.3684, "step": 37070 }, { "epoch": 32.13, "learning_rate": 1.4432167832167833e-06, "loss": 0.4255, "step": 37080 }, { "epoch": 32.14, "learning_rate": 1.4425174825174823e-06, "loss": 0.4371, "step": 37090 }, { "epoch": 32.15, "learning_rate": 1.4418181818181818e-06, "loss": 0.3368, "step": 37100 }, { "epoch": 32.16, "learning_rate": 1.4411188811188811e-06, "loss": 0.3647, "step": 37110 }, { "epoch": 32.17, "learning_rate": 1.4404195804195804e-06, "loss": 0.3978, "step": 37120 }, { "epoch": 32.17, "learning_rate": 1.4397202797202797e-06, "loss": 0.4447, "step": 37130 }, { "epoch": 32.18, "learning_rate": 1.4390209790209788e-06, "loss": 0.3897, "step": 37140 }, { "epoch": 32.19, "learning_rate": 1.4383216783216783e-06, "loss": 0.3766, "step": 37150 }, { "epoch": 32.2, "learning_rate": 1.4376223776223775e-06, "loss": 0.3374, "step": 37160 }, { "epoch": 32.21, "learning_rate": 1.4369230769230768e-06, "loss": 0.3705, "step": 37170 }, { "epoch": 32.22, "learning_rate": 1.4362237762237761e-06, "loss": 0.4111, "step": 37180 }, { "epoch": 32.23, "learning_rate": 1.4355244755244756e-06, "loss": 0.359, "step": 37190 }, { "epoch": 32.24, "learning_rate": 1.4348251748251747e-06, "loss": 0.353, "step": 37200 }, { "epoch": 32.24, "learning_rate": 1.4341258741258742e-06, "loss": 0.3253, "step": 37210 }, { "epoch": 32.25, "learning_rate": 1.4334265734265733e-06, "loss": 0.3938, "step": 37220 }, { "epoch": 32.26, "learning_rate": 1.4327272727272725e-06, "loss": 0.3608, "step": 37230 }, { "epoch": 32.27, "learning_rate": 1.432027972027972e-06, "loss": 0.352, "step": 37240 }, { "epoch": 32.28, "learning_rate": 1.4313286713286711e-06, "loss": 0.3894, "step": 37250 }, { "epoch": 32.29, "learning_rate": 1.4306293706293706e-06, "loss": 0.3467, "step": 37260 }, { "epoch": 32.3, "learning_rate": 1.42993006993007e-06, "loss": 0.3469, "step": 37270 }, { "epoch": 32.3, "learning_rate": 1.4292307692307692e-06, "loss": 0.3764, "step": 37280 }, { "epoch": 32.31, "learning_rate": 1.4285314685314685e-06, "loss": 0.3941, "step": 37290 }, { "epoch": 32.32, "learning_rate": 1.427832167832168e-06, "loss": 0.3929, "step": 37300 }, { "epoch": 32.33, "learning_rate": 1.427132867132867e-06, "loss": 0.38, "step": 37310 }, { "epoch": 32.34, "learning_rate": 1.4264335664335663e-06, "loss": 0.3292, "step": 37320 }, { "epoch": 32.35, "learning_rate": 1.4257342657342656e-06, "loss": 0.3435, "step": 37330 }, { "epoch": 32.36, "learning_rate": 1.4250349650349649e-06, "loss": 0.4315, "step": 37340 }, { "epoch": 32.37, "learning_rate": 1.4243356643356644e-06, "loss": 0.3478, "step": 37350 }, { "epoch": 32.37, "learning_rate": 1.4236363636363635e-06, "loss": 0.4144, "step": 37360 }, { "epoch": 32.38, "learning_rate": 1.422937062937063e-06, "loss": 0.3293, "step": 37370 }, { "epoch": 32.39, "learning_rate": 1.4222377622377622e-06, "loss": 0.3359, "step": 37380 }, { "epoch": 32.4, "learning_rate": 1.4215384615384615e-06, "loss": 0.3422, "step": 37390 }, { "epoch": 32.41, "learning_rate": 1.4208391608391608e-06, "loss": 0.369, "step": 37400 }, { "epoch": 32.42, "learning_rate": 1.4201398601398599e-06, "loss": 0.3224, "step": 37410 }, { "epoch": 32.43, "learning_rate": 1.4194405594405594e-06, "loss": 0.4373, "step": 37420 }, { "epoch": 32.43, "learning_rate": 1.4187412587412587e-06, "loss": 0.3844, "step": 37430 }, { "epoch": 32.44, "learning_rate": 1.418041958041958e-06, "loss": 0.3759, "step": 37440 }, { "epoch": 32.45, "learning_rate": 1.4173426573426572e-06, "loss": 0.3449, "step": 37450 }, { "epoch": 32.46, "learning_rate": 1.4166433566433567e-06, "loss": 0.4016, "step": 37460 }, { "epoch": 32.47, "learning_rate": 1.4159440559440558e-06, "loss": 0.3822, "step": 37470 }, { "epoch": 32.48, "learning_rate": 1.4152447552447553e-06, "loss": 0.3682, "step": 37480 }, { "epoch": 32.49, "learning_rate": 1.4145454545454544e-06, "loss": 0.3673, "step": 37490 }, { "epoch": 32.5, "learning_rate": 1.4138461538461537e-06, "loss": 0.2964, "step": 37500 }, { "epoch": 32.5, "learning_rate": 1.4131468531468532e-06, "loss": 0.3916, "step": 37510 }, { "epoch": 32.51, "learning_rate": 1.4124475524475522e-06, "loss": 0.4394, "step": 37520 }, { "epoch": 32.52, "learning_rate": 1.4117482517482517e-06, "loss": 0.4339, "step": 37530 }, { "epoch": 32.53, "learning_rate": 1.411048951048951e-06, "loss": 0.3407, "step": 37540 }, { "epoch": 32.54, "learning_rate": 1.4103496503496503e-06, "loss": 0.3609, "step": 37550 }, { "epoch": 32.55, "learning_rate": 1.4096503496503496e-06, "loss": 0.3607, "step": 37560 }, { "epoch": 32.56, "learning_rate": 1.408951048951049e-06, "loss": 0.3941, "step": 37570 }, { "epoch": 32.56, "learning_rate": 1.4082517482517482e-06, "loss": 0.3341, "step": 37580 }, { "epoch": 32.57, "learning_rate": 1.4075524475524474e-06, "loss": 0.3668, "step": 37590 }, { "epoch": 32.58, "learning_rate": 1.4068531468531467e-06, "loss": 0.3347, "step": 37600 }, { "epoch": 32.59, "learning_rate": 1.406153846153846e-06, "loss": 0.322, "step": 37610 }, { "epoch": 32.6, "learning_rate": 1.4054545454545455e-06, "loss": 0.3625, "step": 37620 }, { "epoch": 32.61, "learning_rate": 1.4047552447552446e-06, "loss": 0.3698, "step": 37630 }, { "epoch": 32.62, "learning_rate": 1.404055944055944e-06, "loss": 0.3135, "step": 37640 }, { "epoch": 32.63, "learning_rate": 1.4033566433566434e-06, "loss": 0.4204, "step": 37650 }, { "epoch": 32.63, "learning_rate": 1.4026573426573427e-06, "loss": 0.4076, "step": 37660 }, { "epoch": 32.64, "learning_rate": 1.401958041958042e-06, "loss": 0.3556, "step": 37670 }, { "epoch": 32.65, "learning_rate": 1.401258741258741e-06, "loss": 0.3814, "step": 37680 }, { "epoch": 32.66, "learning_rate": 1.4005594405594405e-06, "loss": 0.3562, "step": 37690 }, { "epoch": 32.67, "learning_rate": 1.3998601398601398e-06, "loss": 0.3452, "step": 37700 }, { "epoch": 32.68, "learning_rate": 1.399160839160839e-06, "loss": 0.3243, "step": 37710 }, { "epoch": 32.69, "learning_rate": 1.3984615384615384e-06, "loss": 0.4003, "step": 37720 }, { "epoch": 32.69, "learning_rate": 1.3978321678321678e-06, "loss": 0.3779, "step": 37730 }, { "epoch": 32.7, "learning_rate": 1.3971328671328671e-06, "loss": 0.4263, "step": 37740 }, { "epoch": 32.71, "learning_rate": 1.3964335664335664e-06, "loss": 0.3623, "step": 37750 }, { "epoch": 32.72, "learning_rate": 1.3957342657342657e-06, "loss": 0.3627, "step": 37760 }, { "epoch": 32.73, "learning_rate": 1.395034965034965e-06, "loss": 0.3887, "step": 37770 }, { "epoch": 32.74, "learning_rate": 1.3943356643356643e-06, "loss": 0.3845, "step": 37780 }, { "epoch": 32.75, "learning_rate": 1.3936363636363635e-06, "loss": 0.4599, "step": 37790 }, { "epoch": 32.76, "learning_rate": 1.3929370629370628e-06, "loss": 0.3522, "step": 37800 }, { "epoch": 32.76, "learning_rate": 1.3922377622377621e-06, "loss": 0.3465, "step": 37810 }, { "epoch": 32.77, "learning_rate": 1.3915384615384616e-06, "loss": 0.4008, "step": 37820 }, { "epoch": 32.78, "learning_rate": 1.3908391608391607e-06, "loss": 0.3572, "step": 37830 }, { "epoch": 32.79, "learning_rate": 1.3901398601398602e-06, "loss": 0.329, "step": 37840 }, { "epoch": 32.8, "learning_rate": 1.3894405594405595e-06, "loss": 0.4115, "step": 37850 }, { "epoch": 32.81, "learning_rate": 1.3887412587412585e-06, "loss": 0.3476, "step": 37860 }, { "epoch": 32.82, "learning_rate": 1.388041958041958e-06, "loss": 0.4221, "step": 37870 }, { "epoch": 32.82, "learning_rate": 1.387342657342657e-06, "loss": 0.3899, "step": 37880 }, { "epoch": 32.83, "learning_rate": 1.3866433566433566e-06, "loss": 0.4039, "step": 37890 }, { "epoch": 32.84, "learning_rate": 1.3859440559440559e-06, "loss": 0.3687, "step": 37900 }, { "epoch": 32.85, "learning_rate": 1.3852447552447552e-06, "loss": 0.3789, "step": 37910 }, { "epoch": 32.86, "learning_rate": 1.3845454545454545e-06, "loss": 0.3715, "step": 37920 }, { "epoch": 32.87, "learning_rate": 1.383846153846154e-06, "loss": 0.3709, "step": 37930 }, { "epoch": 32.88, "learning_rate": 1.383146853146853e-06, "loss": 0.3607, "step": 37940 }, { "epoch": 32.89, "learning_rate": 1.3824475524475523e-06, "loss": 0.3614, "step": 37950 }, { "epoch": 32.89, "learning_rate": 1.3817482517482518e-06, "loss": 0.3373, "step": 37960 }, { "epoch": 32.9, "learning_rate": 1.3810489510489509e-06, "loss": 0.3845, "step": 37970 }, { "epoch": 32.91, "learning_rate": 1.3803496503496504e-06, "loss": 0.3576, "step": 37980 }, { "epoch": 32.92, "learning_rate": 1.3796503496503495e-06, "loss": 0.3313, "step": 37990 }, { "epoch": 32.93, "learning_rate": 1.378951048951049e-06, "loss": 0.3453, "step": 38000 }, { "epoch": 32.94, "learning_rate": 1.3782517482517482e-06, "loss": 0.3868, "step": 38010 }, { "epoch": 32.95, "learning_rate": 1.3775524475524475e-06, "loss": 0.367, "step": 38020 }, { "epoch": 32.95, "learning_rate": 1.3768531468531468e-06, "loss": 0.3803, "step": 38030 }, { "epoch": 32.96, "learning_rate": 1.376153846153846e-06, "loss": 0.3532, "step": 38040 }, { "epoch": 32.97, "learning_rate": 1.3754545454545454e-06, "loss": 0.3733, "step": 38050 }, { "epoch": 32.98, "learning_rate": 1.3747552447552447e-06, "loss": 0.2842, "step": 38060 }, { "epoch": 32.99, "learning_rate": 1.374055944055944e-06, "loss": 0.3842, "step": 38070 }, { "epoch": 33.0, "learning_rate": 1.3733566433566432e-06, "loss": 0.3839, "step": 38080 }, { "epoch": 33.0, "eval_loss": 0.5652355551719666, "eval_runtime": 135.8769, "eval_samples_per_second": 3.915, "eval_steps_per_second": 1.958, "eval_wer": 0.24747701999100083, "step": 38082 }, { "epoch": 33.01, "learning_rate": 1.3726573426573427e-06, "loss": 0.3689, "step": 38090 }, { "epoch": 33.02, "learning_rate": 1.3719580419580418e-06, "loss": 0.3708, "step": 38100 }, { "epoch": 33.02, "learning_rate": 1.3712587412587413e-06, "loss": 0.3431, "step": 38110 }, { "epoch": 33.03, "learning_rate": 1.3705594405594406e-06, "loss": 0.4184, "step": 38120 }, { "epoch": 33.04, "learning_rate": 1.3698601398601397e-06, "loss": 0.3241, "step": 38130 }, { "epoch": 33.05, "learning_rate": 1.3691608391608392e-06, "loss": 0.3318, "step": 38140 }, { "epoch": 33.06, "learning_rate": 1.3684615384615384e-06, "loss": 0.3082, "step": 38150 }, { "epoch": 33.07, "learning_rate": 1.3677622377622377e-06, "loss": 0.3692, "step": 38160 }, { "epoch": 33.08, "learning_rate": 1.367062937062937e-06, "loss": 0.3644, "step": 38170 }, { "epoch": 33.08, "learning_rate": 1.3663636363636363e-06, "loss": 0.3386, "step": 38180 }, { "epoch": 33.09, "learning_rate": 1.3656643356643356e-06, "loss": 0.415, "step": 38190 }, { "epoch": 33.1, "learning_rate": 1.364965034965035e-06, "loss": 0.3905, "step": 38200 }, { "epoch": 33.11, "learning_rate": 1.3642657342657342e-06, "loss": 0.3808, "step": 38210 }, { "epoch": 33.12, "learning_rate": 1.3635664335664334e-06, "loss": 0.4146, "step": 38220 }, { "epoch": 33.13, "learning_rate": 1.362867132867133e-06, "loss": 0.3925, "step": 38230 }, { "epoch": 33.14, "learning_rate": 1.362167832167832e-06, "loss": 0.4243, "step": 38240 }, { "epoch": 33.15, "learning_rate": 1.3614685314685315e-06, "loss": 0.3465, "step": 38250 }, { "epoch": 33.15, "learning_rate": 1.3607692307692306e-06, "loss": 0.3833, "step": 38260 }, { "epoch": 33.16, "learning_rate": 1.36006993006993e-06, "loss": 0.4024, "step": 38270 }, { "epoch": 33.17, "learning_rate": 1.3593706293706294e-06, "loss": 0.3583, "step": 38280 }, { "epoch": 33.18, "learning_rate": 1.3586713286713286e-06, "loss": 0.3401, "step": 38290 }, { "epoch": 33.19, "learning_rate": 1.357972027972028e-06, "loss": 0.3555, "step": 38300 }, { "epoch": 33.2, "learning_rate": 1.3572727272727272e-06, "loss": 0.3101, "step": 38310 }, { "epoch": 33.21, "learning_rate": 1.3565734265734265e-06, "loss": 0.3485, "step": 38320 }, { "epoch": 33.21, "learning_rate": 1.3558741258741258e-06, "loss": 0.4575, "step": 38330 }, { "epoch": 33.22, "learning_rate": 1.3551748251748253e-06, "loss": 0.4007, "step": 38340 }, { "epoch": 33.23, "learning_rate": 1.3544755244755244e-06, "loss": 0.3453, "step": 38350 }, { "epoch": 33.24, "learning_rate": 1.3537762237762239e-06, "loss": 0.387, "step": 38360 }, { "epoch": 33.25, "learning_rate": 1.353076923076923e-06, "loss": 0.3606, "step": 38370 }, { "epoch": 33.26, "learning_rate": 1.3523776223776222e-06, "loss": 0.3628, "step": 38380 }, { "epoch": 33.27, "learning_rate": 1.3516783216783217e-06, "loss": 0.345, "step": 38390 }, { "epoch": 33.28, "learning_rate": 1.3509790209790208e-06, "loss": 0.431, "step": 38400 }, { "epoch": 33.28, "learning_rate": 1.3502797202797203e-06, "loss": 0.373, "step": 38410 }, { "epoch": 33.29, "learning_rate": 1.3495804195804196e-06, "loss": 0.3685, "step": 38420 }, { "epoch": 33.3, "learning_rate": 1.3488811188811188e-06, "loss": 0.3631, "step": 38430 }, { "epoch": 33.31, "learning_rate": 1.3481818181818181e-06, "loss": 0.3509, "step": 38440 }, { "epoch": 33.32, "learning_rate": 1.3474825174825174e-06, "loss": 0.3536, "step": 38450 }, { "epoch": 33.33, "learning_rate": 1.3467832167832167e-06, "loss": 0.3496, "step": 38460 }, { "epoch": 33.34, "learning_rate": 1.346083916083916e-06, "loss": 0.3579, "step": 38470 }, { "epoch": 33.34, "learning_rate": 1.3453846153846153e-06, "loss": 0.3917, "step": 38480 }, { "epoch": 33.35, "learning_rate": 1.3446853146853146e-06, "loss": 0.3634, "step": 38490 }, { "epoch": 33.36, "learning_rate": 1.343986013986014e-06, "loss": 0.3654, "step": 38500 }, { "epoch": 33.37, "learning_rate": 1.3432867132867131e-06, "loss": 0.3681, "step": 38510 }, { "epoch": 33.38, "learning_rate": 1.3425874125874126e-06, "loss": 0.4137, "step": 38520 }, { "epoch": 33.39, "learning_rate": 1.3418881118881117e-06, "loss": 0.3998, "step": 38530 }, { "epoch": 33.4, "learning_rate": 1.3411888111888112e-06, "loss": 0.376, "step": 38540 }, { "epoch": 33.41, "learning_rate": 1.3404895104895105e-06, "loss": 0.3325, "step": 38550 }, { "epoch": 33.41, "learning_rate": 1.3397902097902096e-06, "loss": 0.3865, "step": 38560 }, { "epoch": 33.42, "learning_rate": 1.339090909090909e-06, "loss": 0.4339, "step": 38570 }, { "epoch": 33.43, "learning_rate": 1.3383916083916083e-06, "loss": 0.4056, "step": 38580 }, { "epoch": 33.44, "learning_rate": 1.3376923076923076e-06, "loss": 0.3689, "step": 38590 }, { "epoch": 33.45, "learning_rate": 1.336993006993007e-06, "loss": 0.3898, "step": 38600 }, { "epoch": 33.46, "learning_rate": 1.3362937062937064e-06, "loss": 0.3544, "step": 38610 }, { "epoch": 33.47, "learning_rate": 1.3355944055944055e-06, "loss": 0.3979, "step": 38620 }, { "epoch": 33.47, "learning_rate": 1.334895104895105e-06, "loss": 0.3858, "step": 38630 }, { "epoch": 33.48, "learning_rate": 1.334195804195804e-06, "loss": 0.4398, "step": 38640 }, { "epoch": 33.49, "learning_rate": 1.3334965034965033e-06, "loss": 0.3577, "step": 38650 }, { "epoch": 33.5, "learning_rate": 1.3327972027972028e-06, "loss": 0.3575, "step": 38660 }, { "epoch": 33.51, "learning_rate": 1.332097902097902e-06, "loss": 0.3101, "step": 38670 }, { "epoch": 33.52, "learning_rate": 1.3313986013986014e-06, "loss": 0.4451, "step": 38680 }, { "epoch": 33.53, "learning_rate": 1.3306993006993007e-06, "loss": 0.2943, "step": 38690 }, { "epoch": 33.54, "learning_rate": 1.33e-06, "loss": 0.3424, "step": 38700 }, { "epoch": 33.54, "learning_rate": 1.3293006993006993e-06, "loss": 0.3279, "step": 38710 }, { "epoch": 33.55, "learning_rate": 1.3286013986013985e-06, "loss": 0.3437, "step": 38720 }, { "epoch": 33.56, "learning_rate": 1.3279020979020978e-06, "loss": 0.36, "step": 38730 }, { "epoch": 33.57, "learning_rate": 1.3272027972027971e-06, "loss": 0.3833, "step": 38740 }, { "epoch": 33.58, "learning_rate": 1.3265034965034964e-06, "loss": 0.3473, "step": 38750 }, { "epoch": 33.59, "learning_rate": 1.3258041958041957e-06, "loss": 0.346, "step": 38760 }, { "epoch": 33.6, "learning_rate": 1.3251048951048952e-06, "loss": 0.3609, "step": 38770 }, { "epoch": 33.6, "learning_rate": 1.3244055944055943e-06, "loss": 0.3858, "step": 38780 }, { "epoch": 33.61, "learning_rate": 1.3237062937062937e-06, "loss": 0.3623, "step": 38790 }, { "epoch": 33.62, "learning_rate": 1.3230069930069928e-06, "loss": 0.3254, "step": 38800 }, { "epoch": 33.63, "learning_rate": 1.3223076923076923e-06, "loss": 0.3263, "step": 38810 }, { "epoch": 33.64, "learning_rate": 1.3216083916083916e-06, "loss": 0.3892, "step": 38820 }, { "epoch": 33.65, "learning_rate": 1.3209090909090907e-06, "loss": 0.3618, "step": 38830 }, { "epoch": 33.66, "learning_rate": 1.3202097902097902e-06, "loss": 0.3106, "step": 38840 }, { "epoch": 33.67, "learning_rate": 1.3195104895104895e-06, "loss": 0.3613, "step": 38850 }, { "epoch": 33.67, "learning_rate": 1.3188111888111887e-06, "loss": 0.3396, "step": 38860 }, { "epoch": 33.68, "learning_rate": 1.318111888111888e-06, "loss": 0.356, "step": 38870 }, { "epoch": 33.69, "learning_rate": 1.3174125874125875e-06, "loss": 0.4044, "step": 38880 }, { "epoch": 33.7, "learning_rate": 1.3167132867132866e-06, "loss": 0.3763, "step": 38890 }, { "epoch": 33.71, "learning_rate": 1.316013986013986e-06, "loss": 0.3754, "step": 38900 }, { "epoch": 33.72, "learning_rate": 1.3153146853146852e-06, "loss": 0.3176, "step": 38910 }, { "epoch": 33.73, "learning_rate": 1.3146153846153845e-06, "loss": 0.3711, "step": 38920 }, { "epoch": 33.73, "learning_rate": 1.313916083916084e-06, "loss": 0.3626, "step": 38930 }, { "epoch": 33.74, "learning_rate": 1.313216783216783e-06, "loss": 0.3064, "step": 38940 }, { "epoch": 33.75, "learning_rate": 1.3125174825174825e-06, "loss": 0.4134, "step": 38950 }, { "epoch": 33.76, "learning_rate": 1.3118181818181818e-06, "loss": 0.3612, "step": 38960 }, { "epoch": 33.77, "learning_rate": 1.311118881118881e-06, "loss": 0.4237, "step": 38970 }, { "epoch": 33.78, "learning_rate": 1.3104195804195804e-06, "loss": 0.3579, "step": 38980 }, { "epoch": 33.79, "learning_rate": 1.3097202797202797e-06, "loss": 0.3854, "step": 38990 }, { "epoch": 33.8, "learning_rate": 1.309020979020979e-06, "loss": 0.3347, "step": 39000 }, { "epoch": 33.8, "learning_rate": 1.3083216783216782e-06, "loss": 0.3272, "step": 39010 }, { "epoch": 33.81, "learning_rate": 1.3076223776223775e-06, "loss": 0.387, "step": 39020 }, { "epoch": 33.82, "learning_rate": 1.3069230769230768e-06, "loss": 0.4064, "step": 39030 }, { "epoch": 33.83, "learning_rate": 1.3062237762237763e-06, "loss": 0.3116, "step": 39040 }, { "epoch": 33.84, "learning_rate": 1.3055244755244754e-06, "loss": 0.3533, "step": 39050 }, { "epoch": 33.85, "learning_rate": 1.3048251748251749e-06, "loss": 0.3612, "step": 39060 }, { "epoch": 33.86, "learning_rate": 1.304125874125874e-06, "loss": 0.388, "step": 39070 }, { "epoch": 33.86, "learning_rate": 1.3034265734265734e-06, "loss": 0.4011, "step": 39080 }, { "epoch": 33.87, "learning_rate": 1.3027272727272727e-06, "loss": 0.3565, "step": 39090 }, { "epoch": 33.88, "learning_rate": 1.3020279720279718e-06, "loss": 0.3031, "step": 39100 }, { "epoch": 33.89, "learning_rate": 1.3013286713286713e-06, "loss": 0.3112, "step": 39110 }, { "epoch": 33.9, "learning_rate": 1.3006293706293706e-06, "loss": 0.3636, "step": 39120 }, { "epoch": 33.91, "learning_rate": 1.2999300699300699e-06, "loss": 0.3724, "step": 39130 }, { "epoch": 33.92, "learning_rate": 1.2992307692307692e-06, "loss": 0.3513, "step": 39140 }, { "epoch": 33.93, "learning_rate": 1.2985314685314687e-06, "loss": 0.4349, "step": 39150 }, { "epoch": 33.93, "learning_rate": 1.2978321678321677e-06, "loss": 0.3918, "step": 39160 }, { "epoch": 33.94, "learning_rate": 1.2971328671328672e-06, "loss": 0.4047, "step": 39170 }, { "epoch": 33.95, "learning_rate": 1.2964335664335663e-06, "loss": 0.3356, "step": 39180 }, { "epoch": 33.96, "learning_rate": 1.2957342657342656e-06, "loss": 0.4049, "step": 39190 }, { "epoch": 33.97, "learning_rate": 1.295034965034965e-06, "loss": 0.3867, "step": 39200 }, { "epoch": 33.98, "learning_rate": 1.2943356643356642e-06, "loss": 0.3492, "step": 39210 }, { "epoch": 33.99, "learning_rate": 1.2936363636363636e-06, "loss": 0.4248, "step": 39220 }, { "epoch": 33.99, "learning_rate": 1.292937062937063e-06, "loss": 0.3691, "step": 39230 }, { "epoch": 34.0, "eval_loss": 0.5551154017448425, "eval_runtime": 137.8613, "eval_samples_per_second": 3.859, "eval_steps_per_second": 1.929, "eval_wer": 0.24278459857298965, "step": 39236 }, { "epoch": 34.0, "learning_rate": 1.2922377622377622e-06, "loss": 0.4403, "step": 39240 }, { "epoch": 34.01, "learning_rate": 1.2915384615384615e-06, "loss": 0.3549, "step": 39250 }, { "epoch": 34.02, "learning_rate": 1.2908391608391608e-06, "loss": 0.3839, "step": 39260 }, { "epoch": 34.03, "learning_rate": 1.29013986013986e-06, "loss": 0.351, "step": 39270 }, { "epoch": 34.04, "learning_rate": 1.2894405594405594e-06, "loss": 0.3648, "step": 39280 }, { "epoch": 34.05, "learning_rate": 1.2887412587412586e-06, "loss": 0.3786, "step": 39290 }, { "epoch": 34.06, "learning_rate": 1.288041958041958e-06, "loss": 0.3918, "step": 39300 }, { "epoch": 34.06, "learning_rate": 1.2873426573426574e-06, "loss": 0.3271, "step": 39310 }, { "epoch": 34.07, "learning_rate": 1.2866433566433565e-06, "loss": 0.3704, "step": 39320 }, { "epoch": 34.08, "learning_rate": 1.285944055944056e-06, "loss": 0.3887, "step": 39330 }, { "epoch": 34.09, "learning_rate": 1.285244755244755e-06, "loss": 0.3977, "step": 39340 }, { "epoch": 34.1, "learning_rate": 1.2845454545454544e-06, "loss": 0.3211, "step": 39350 }, { "epoch": 34.11, "learning_rate": 1.2838461538461539e-06, "loss": 0.4011, "step": 39360 }, { "epoch": 34.12, "learning_rate": 1.283146853146853e-06, "loss": 0.4222, "step": 39370 }, { "epoch": 34.12, "learning_rate": 1.2824475524475524e-06, "loss": 0.4083, "step": 39380 }, { "epoch": 34.13, "learning_rate": 1.2817482517482517e-06, "loss": 0.3787, "step": 39390 }, { "epoch": 34.14, "learning_rate": 1.281048951048951e-06, "loss": 0.4088, "step": 39400 }, { "epoch": 34.15, "learning_rate": 1.2803496503496503e-06, "loss": 0.3065, "step": 39410 }, { "epoch": 34.16, "learning_rate": 1.2796503496503498e-06, "loss": 0.3769, "step": 39420 }, { "epoch": 34.17, "learning_rate": 1.2789510489510488e-06, "loss": 0.4346, "step": 39430 }, { "epoch": 34.18, "learning_rate": 1.2782517482517481e-06, "loss": 0.2899, "step": 39440 }, { "epoch": 34.19, "learning_rate": 1.2775524475524474e-06, "loss": 0.3924, "step": 39450 }, { "epoch": 34.19, "learning_rate": 1.2768531468531467e-06, "loss": 0.3546, "step": 39460 }, { "epoch": 34.2, "learning_rate": 1.2761538461538462e-06, "loss": 0.3824, "step": 39470 }, { "epoch": 34.21, "learning_rate": 1.2754545454545453e-06, "loss": 0.3687, "step": 39480 }, { "epoch": 34.22, "learning_rate": 1.2747552447552448e-06, "loss": 0.3505, "step": 39490 }, { "epoch": 34.23, "learning_rate": 1.274055944055944e-06, "loss": 0.3921, "step": 39500 }, { "epoch": 34.24, "learning_rate": 1.2733566433566433e-06, "loss": 0.3381, "step": 39510 }, { "epoch": 34.25, "learning_rate": 1.2726573426573426e-06, "loss": 0.3819, "step": 39520 }, { "epoch": 34.25, "learning_rate": 1.2719580419580417e-06, "loss": 0.3564, "step": 39530 }, { "epoch": 34.26, "learning_rate": 1.2712587412587412e-06, "loss": 0.3359, "step": 39540 }, { "epoch": 34.27, "learning_rate": 1.2705594405594405e-06, "loss": 0.3467, "step": 39550 }, { "epoch": 34.28, "learning_rate": 1.2698601398601398e-06, "loss": 0.3431, "step": 39560 }, { "epoch": 34.29, "learning_rate": 1.269160839160839e-06, "loss": 0.3082, "step": 39570 }, { "epoch": 34.3, "learning_rate": 1.2684615384615385e-06, "loss": 0.4237, "step": 39580 }, { "epoch": 34.31, "learning_rate": 1.2677622377622376e-06, "loss": 0.3363, "step": 39590 }, { "epoch": 34.32, "learning_rate": 1.2670629370629371e-06, "loss": 0.3542, "step": 39600 }, { "epoch": 34.32, "learning_rate": 1.2663636363636364e-06, "loss": 0.3788, "step": 39610 }, { "epoch": 34.33, "learning_rate": 1.2656643356643355e-06, "loss": 0.3864, "step": 39620 }, { "epoch": 34.34, "learning_rate": 1.264965034965035e-06, "loss": 0.4107, "step": 39630 }, { "epoch": 34.35, "learning_rate": 1.264265734265734e-06, "loss": 0.3733, "step": 39640 }, { "epoch": 34.36, "learning_rate": 1.2635664335664335e-06, "loss": 0.353, "step": 39650 }, { "epoch": 34.37, "learning_rate": 1.2628671328671328e-06, "loss": 0.4167, "step": 39660 }, { "epoch": 34.38, "learning_rate": 1.2621678321678321e-06, "loss": 0.35, "step": 39670 }, { "epoch": 34.38, "learning_rate": 1.2614685314685314e-06, "loss": 0.3884, "step": 39680 }, { "epoch": 34.39, "learning_rate": 1.260769230769231e-06, "loss": 0.308, "step": 39690 }, { "epoch": 34.4, "learning_rate": 1.26006993006993e-06, "loss": 0.3529, "step": 39700 }, { "epoch": 34.41, "learning_rate": 1.2593706293706293e-06, "loss": 0.3589, "step": 39710 }, { "epoch": 34.42, "learning_rate": 1.2586713286713285e-06, "loss": 0.3543, "step": 39720 }, { "epoch": 34.43, "learning_rate": 1.2579720279720278e-06, "loss": 0.3261, "step": 39730 }, { "epoch": 34.44, "learning_rate": 1.2572727272727273e-06, "loss": 0.3342, "step": 39740 }, { "epoch": 34.45, "learning_rate": 1.2565734265734264e-06, "loss": 0.3243, "step": 39750 }, { "epoch": 34.45, "learning_rate": 1.255874125874126e-06, "loss": 0.3558, "step": 39760 }, { "epoch": 34.46, "learning_rate": 1.2551748251748252e-06, "loss": 0.3326, "step": 39770 }, { "epoch": 34.47, "learning_rate": 1.2544755244755245e-06, "loss": 0.375, "step": 39780 }, { "epoch": 34.48, "learning_rate": 1.2537762237762238e-06, "loss": 0.4022, "step": 39790 }, { "epoch": 34.49, "learning_rate": 1.2530769230769228e-06, "loss": 0.3326, "step": 39800 }, { "epoch": 34.5, "learning_rate": 1.2523776223776223e-06, "loss": 0.3484, "step": 39810 }, { "epoch": 34.51, "learning_rate": 1.2516783216783216e-06, "loss": 0.3685, "step": 39820 }, { "epoch": 34.51, "learning_rate": 1.2509790209790209e-06, "loss": 0.3734, "step": 39830 }, { "epoch": 34.52, "learning_rate": 1.2502797202797202e-06, "loss": 0.3993, "step": 39840 }, { "epoch": 34.53, "learning_rate": 1.2495804195804197e-06, "loss": 0.3761, "step": 39850 }, { "epoch": 34.54, "learning_rate": 1.2488811188811187e-06, "loss": 0.3446, "step": 39860 }, { "epoch": 34.55, "learning_rate": 1.2481818181818182e-06, "loss": 0.3621, "step": 39870 }, { "epoch": 34.56, "learning_rate": 1.2474825174825175e-06, "loss": 0.3581, "step": 39880 }, { "epoch": 34.57, "learning_rate": 1.2467832167832166e-06, "loss": 0.3283, "step": 39890 }, { "epoch": 34.58, "learning_rate": 1.246083916083916e-06, "loss": 0.3868, "step": 39900 }, { "epoch": 34.58, "learning_rate": 1.2453846153846152e-06, "loss": 0.3612, "step": 39910 }, { "epoch": 34.59, "learning_rate": 1.2446853146853147e-06, "loss": 0.3328, "step": 39920 }, { "epoch": 34.6, "learning_rate": 1.243986013986014e-06, "loss": 0.3535, "step": 39930 }, { "epoch": 34.61, "learning_rate": 1.2432867132867132e-06, "loss": 0.3693, "step": 39940 }, { "epoch": 34.62, "learning_rate": 1.2425874125874125e-06, "loss": 0.3924, "step": 39950 }, { "epoch": 34.63, "learning_rate": 1.241888111888112e-06, "loss": 0.3339, "step": 39960 }, { "epoch": 34.64, "learning_rate": 1.241188811188811e-06, "loss": 0.3502, "step": 39970 }, { "epoch": 34.64, "learning_rate": 1.2404895104895104e-06, "loss": 0.416, "step": 39980 }, { "epoch": 34.65, "learning_rate": 1.2397902097902097e-06, "loss": 0.3613, "step": 39990 }, { "epoch": 34.66, "learning_rate": 1.239090909090909e-06, "loss": 0.3711, "step": 40000 }, { "epoch": 34.67, "learning_rate": 1.2383916083916084e-06, "loss": 0.3933, "step": 40010 }, { "epoch": 34.68, "learning_rate": 1.2376923076923075e-06, "loss": 0.3666, "step": 40020 }, { "epoch": 34.69, "learning_rate": 1.236993006993007e-06, "loss": 0.3581, "step": 40030 }, { "epoch": 34.7, "learning_rate": 1.2362937062937063e-06, "loss": 0.4526, "step": 40040 }, { "epoch": 34.71, "learning_rate": 1.2355944055944056e-06, "loss": 0.3394, "step": 40050 }, { "epoch": 34.71, "learning_rate": 1.2348951048951049e-06, "loss": 0.349, "step": 40060 }, { "epoch": 34.72, "learning_rate": 1.234195804195804e-06, "loss": 0.3608, "step": 40070 }, { "epoch": 34.73, "learning_rate": 1.2334965034965034e-06, "loss": 0.4293, "step": 40080 }, { "epoch": 34.74, "learning_rate": 1.2327972027972027e-06, "loss": 0.4366, "step": 40090 }, { "epoch": 34.75, "learning_rate": 1.232097902097902e-06, "loss": 0.3568, "step": 40100 }, { "epoch": 34.76, "learning_rate": 1.2313986013986013e-06, "loss": 0.2909, "step": 40110 }, { "epoch": 34.77, "learning_rate": 1.2306993006993008e-06, "loss": 0.3152, "step": 40120 }, { "epoch": 34.77, "learning_rate": 1.2299999999999999e-06, "loss": 0.3114, "step": 40130 }, { "epoch": 34.78, "learning_rate": 1.2293006993006994e-06, "loss": 0.3518, "step": 40140 }, { "epoch": 34.79, "learning_rate": 1.2286013986013987e-06, "loss": 0.3207, "step": 40150 }, { "epoch": 34.8, "learning_rate": 1.2279020979020977e-06, "loss": 0.348, "step": 40160 }, { "epoch": 34.81, "learning_rate": 1.2272027972027972e-06, "loss": 0.335, "step": 40170 }, { "epoch": 34.82, "learning_rate": 1.2265034965034963e-06, "loss": 0.3758, "step": 40180 }, { "epoch": 34.83, "learning_rate": 1.2258041958041958e-06, "loss": 0.3648, "step": 40190 }, { "epoch": 34.83, "learning_rate": 1.225104895104895e-06, "loss": 0.4195, "step": 40200 }, { "epoch": 34.84, "learning_rate": 1.2244055944055944e-06, "loss": 0.3287, "step": 40210 }, { "epoch": 34.85, "learning_rate": 1.2237062937062936e-06, "loss": 0.388, "step": 40220 }, { "epoch": 34.86, "learning_rate": 1.2230069930069931e-06, "loss": 0.3598, "step": 40230 }, { "epoch": 34.87, "learning_rate": 1.2223076923076922e-06, "loss": 0.3694, "step": 40240 }, { "epoch": 34.88, "learning_rate": 1.2216083916083915e-06, "loss": 0.3836, "step": 40250 }, { "epoch": 34.89, "learning_rate": 1.2209090909090908e-06, "loss": 0.3677, "step": 40260 }, { "epoch": 34.9, "learning_rate": 1.22020979020979e-06, "loss": 0.3912, "step": 40270 }, { "epoch": 34.9, "learning_rate": 1.2195104895104896e-06, "loss": 0.3673, "step": 40280 }, { "epoch": 34.91, "learning_rate": 1.2188111888111886e-06, "loss": 0.3944, "step": 40290 }, { "epoch": 34.92, "learning_rate": 1.2181118881118881e-06, "loss": 0.3404, "step": 40300 }, { "epoch": 34.93, "learning_rate": 1.2174125874125874e-06, "loss": 0.3558, "step": 40310 }, { "epoch": 34.94, "learning_rate": 1.2167132867132867e-06, "loss": 0.3658, "step": 40320 }, { "epoch": 34.95, "learning_rate": 1.216013986013986e-06, "loss": 0.3326, "step": 40330 }, { "epoch": 34.96, "learning_rate": 1.215314685314685e-06, "loss": 0.355, "step": 40340 }, { "epoch": 34.96, "learning_rate": 1.2146153846153846e-06, "loss": 0.3233, "step": 40350 }, { "epoch": 34.97, "learning_rate": 1.2139160839160839e-06, "loss": 0.3928, "step": 40360 }, { "epoch": 34.98, "learning_rate": 1.2132167832167831e-06, "loss": 0.342, "step": 40370 }, { "epoch": 34.99, "learning_rate": 1.2125174825174824e-06, "loss": 0.3841, "step": 40380 }, { "epoch": 35.0, "learning_rate": 1.211818181818182e-06, "loss": 0.3076, "step": 40390 }, { "epoch": 35.0, "eval_loss": 0.555358350276947, "eval_runtime": 136.1151, "eval_samples_per_second": 3.908, "eval_steps_per_second": 1.954, "eval_wer": 0.24631998457286108, "step": 40390 }, { "epoch": 35.01, "learning_rate": 1.211118881118881e-06, "loss": 0.3906, "step": 40400 }, { "epoch": 35.02, "learning_rate": 1.2104195804195803e-06, "loss": 0.3476, "step": 40410 }, { "epoch": 35.03, "learning_rate": 1.2097202797202798e-06, "loss": 0.3169, "step": 40420 }, { "epoch": 35.03, "learning_rate": 1.2090209790209788e-06, "loss": 0.3608, "step": 40430 }, { "epoch": 35.04, "learning_rate": 1.2083216783216783e-06, "loss": 0.3543, "step": 40440 }, { "epoch": 35.05, "learning_rate": 1.2076223776223774e-06, "loss": 0.3396, "step": 40450 }, { "epoch": 35.06, "learning_rate": 1.206923076923077e-06, "loss": 0.3822, "step": 40460 }, { "epoch": 35.07, "learning_rate": 1.2062237762237762e-06, "loss": 0.368, "step": 40470 }, { "epoch": 35.08, "learning_rate": 1.2055244755244755e-06, "loss": 0.3727, "step": 40480 }, { "epoch": 35.09, "learning_rate": 1.2048251748251748e-06, "loss": 0.4509, "step": 40490 }, { "epoch": 35.1, "learning_rate": 1.204125874125874e-06, "loss": 0.3545, "step": 40500 }, { "epoch": 35.1, "learning_rate": 1.2034265734265733e-06, "loss": 0.3603, "step": 40510 }, { "epoch": 35.11, "learning_rate": 1.2027272727272726e-06, "loss": 0.3675, "step": 40520 }, { "epoch": 35.12, "learning_rate": 1.202027972027972e-06, "loss": 0.3915, "step": 40530 }, { "epoch": 35.13, "learning_rate": 1.2013286713286712e-06, "loss": 0.3879, "step": 40540 }, { "epoch": 35.14, "learning_rate": 1.2006293706293707e-06, "loss": 0.3236, "step": 40550 }, { "epoch": 35.15, "learning_rate": 1.1999300699300698e-06, "loss": 0.3697, "step": 40560 }, { "epoch": 35.16, "learning_rate": 1.1992307692307693e-06, "loss": 0.2743, "step": 40570 }, { "epoch": 35.16, "learning_rate": 1.1985314685314686e-06, "loss": 0.3614, "step": 40580 }, { "epoch": 35.17, "learning_rate": 1.1978321678321676e-06, "loss": 0.3894, "step": 40590 }, { "epoch": 35.18, "learning_rate": 1.1971328671328671e-06, "loss": 0.3921, "step": 40600 }, { "epoch": 35.19, "learning_rate": 1.1964335664335662e-06, "loss": 0.3577, "step": 40610 }, { "epoch": 35.2, "learning_rate": 1.1957342657342657e-06, "loss": 0.3331, "step": 40620 }, { "epoch": 35.21, "learning_rate": 1.195034965034965e-06, "loss": 0.3841, "step": 40630 }, { "epoch": 35.22, "learning_rate": 1.1943356643356643e-06, "loss": 0.337, "step": 40640 }, { "epoch": 35.23, "learning_rate": 1.1936363636363635e-06, "loss": 0.3891, "step": 40650 }, { "epoch": 35.23, "learning_rate": 1.192937062937063e-06, "loss": 0.3329, "step": 40660 }, { "epoch": 35.24, "learning_rate": 1.1922377622377621e-06, "loss": 0.3652, "step": 40670 }, { "epoch": 35.25, "learning_rate": 1.1915384615384614e-06, "loss": 0.3531, "step": 40680 }, { "epoch": 35.26, "learning_rate": 1.190839160839161e-06, "loss": 0.4004, "step": 40690 }, { "epoch": 35.27, "learning_rate": 1.19013986013986e-06, "loss": 0.3696, "step": 40700 }, { "epoch": 35.28, "learning_rate": 1.1894405594405595e-06, "loss": 0.3911, "step": 40710 }, { "epoch": 35.29, "learning_rate": 1.1887412587412585e-06, "loss": 0.4062, "step": 40720 }, { "epoch": 35.29, "learning_rate": 1.188041958041958e-06, "loss": 0.4332, "step": 40730 }, { "epoch": 35.3, "learning_rate": 1.1873426573426573e-06, "loss": 0.41, "step": 40740 }, { "epoch": 35.31, "learning_rate": 1.1866433566433566e-06, "loss": 0.3732, "step": 40750 }, { "epoch": 35.32, "learning_rate": 1.185944055944056e-06, "loss": 0.3851, "step": 40760 }, { "epoch": 35.33, "learning_rate": 1.1852447552447552e-06, "loss": 0.3678, "step": 40770 }, { "epoch": 35.34, "learning_rate": 1.1845454545454545e-06, "loss": 0.4117, "step": 40780 }, { "epoch": 35.35, "learning_rate": 1.1838461538461538e-06, "loss": 0.4182, "step": 40790 }, { "epoch": 35.36, "learning_rate": 1.183146853146853e-06, "loss": 0.4155, "step": 40800 }, { "epoch": 35.36, "learning_rate": 1.1824475524475523e-06, "loss": 0.3544, "step": 40810 }, { "epoch": 35.37, "learning_rate": 1.1817482517482518e-06, "loss": 0.3307, "step": 40820 }, { "epoch": 35.38, "learning_rate": 1.1810489510489509e-06, "loss": 0.341, "step": 40830 }, { "epoch": 35.39, "learning_rate": 1.1803496503496504e-06, "loss": 0.3709, "step": 40840 }, { "epoch": 35.4, "learning_rate": 1.1796503496503497e-06, "loss": 0.3244, "step": 40850 }, { "epoch": 35.41, "learning_rate": 1.1789510489510487e-06, "loss": 0.3738, "step": 40860 }, { "epoch": 35.42, "learning_rate": 1.1782517482517482e-06, "loss": 0.3641, "step": 40870 }, { "epoch": 35.42, "learning_rate": 1.1775524475524475e-06, "loss": 0.3363, "step": 40880 }, { "epoch": 35.43, "learning_rate": 1.1768531468531468e-06, "loss": 0.3307, "step": 40890 }, { "epoch": 35.44, "learning_rate": 1.176153846153846e-06, "loss": 0.4423, "step": 40900 }, { "epoch": 35.45, "learning_rate": 1.1754545454545454e-06, "loss": 0.3662, "step": 40910 }, { "epoch": 35.46, "learning_rate": 1.1747552447552447e-06, "loss": 0.3772, "step": 40920 }, { "epoch": 35.47, "learning_rate": 1.1740559440559442e-06, "loss": 0.415, "step": 40930 }, { "epoch": 35.48, "learning_rate": 1.1733566433566432e-06, "loss": 0.4153, "step": 40940 }, { "epoch": 35.49, "learning_rate": 1.1726573426573425e-06, "loss": 0.3248, "step": 40950 }, { "epoch": 35.49, "learning_rate": 1.171958041958042e-06, "loss": 0.3395, "step": 40960 }, { "epoch": 35.5, "learning_rate": 1.171258741258741e-06, "loss": 0.3559, "step": 40970 }, { "epoch": 35.51, "learning_rate": 1.1705594405594406e-06, "loss": 0.4002, "step": 40980 }, { "epoch": 35.52, "learning_rate": 1.1698601398601397e-06, "loss": 0.299, "step": 40990 }, { "epoch": 35.53, "learning_rate": 1.1691608391608392e-06, "loss": 0.39, "step": 41000 }, { "epoch": 35.54, "learning_rate": 1.1684615384615384e-06, "loss": 0.3827, "step": 41010 }, { "epoch": 35.55, "learning_rate": 1.1677622377622377e-06, "loss": 0.318, "step": 41020 }, { "epoch": 35.55, "learning_rate": 1.167062937062937e-06, "loss": 0.3562, "step": 41030 }, { "epoch": 35.56, "learning_rate": 1.1663636363636363e-06, "loss": 0.3558, "step": 41040 }, { "epoch": 35.57, "learning_rate": 1.1656643356643356e-06, "loss": 0.3021, "step": 41050 }, { "epoch": 35.58, "learning_rate": 1.1649650349650349e-06, "loss": 0.3554, "step": 41060 }, { "epoch": 35.59, "learning_rate": 1.1642657342657344e-06, "loss": 0.3894, "step": 41070 }, { "epoch": 35.6, "learning_rate": 1.1635664335664334e-06, "loss": 0.3829, "step": 41080 }, { "epoch": 35.61, "learning_rate": 1.162867132867133e-06, "loss": 0.3827, "step": 41090 }, { "epoch": 35.61, "learning_rate": 1.162167832167832e-06, "loss": 0.3726, "step": 41100 }, { "epoch": 35.62, "learning_rate": 1.1614685314685315e-06, "loss": 0.3703, "step": 41110 }, { "epoch": 35.63, "learning_rate": 1.1607692307692308e-06, "loss": 0.3142, "step": 41120 }, { "epoch": 35.64, "learning_rate": 1.1600699300699299e-06, "loss": 0.3549, "step": 41130 }, { "epoch": 35.65, "learning_rate": 1.1593706293706294e-06, "loss": 0.3436, "step": 41140 }, { "epoch": 35.66, "learning_rate": 1.1586713286713287e-06, "loss": 0.3383, "step": 41150 }, { "epoch": 35.67, "learning_rate": 1.157972027972028e-06, "loss": 0.3643, "step": 41160 }, { "epoch": 35.68, "learning_rate": 1.1572727272727272e-06, "loss": 0.3612, "step": 41170 }, { "epoch": 35.68, "learning_rate": 1.1565734265734265e-06, "loss": 0.3992, "step": 41180 }, { "epoch": 35.69, "learning_rate": 1.1558741258741258e-06, "loss": 0.428, "step": 41190 }, { "epoch": 35.7, "learning_rate": 1.1551748251748253e-06, "loss": 0.3955, "step": 41200 }, { "epoch": 35.71, "learning_rate": 1.1544755244755244e-06, "loss": 0.3796, "step": 41210 }, { "epoch": 35.72, "learning_rate": 1.1537762237762236e-06, "loss": 0.3313, "step": 41220 }, { "epoch": 35.73, "learning_rate": 1.1530769230769231e-06, "loss": 0.3473, "step": 41230 }, { "epoch": 35.74, "learning_rate": 1.1523776223776222e-06, "loss": 0.4113, "step": 41240 }, { "epoch": 35.74, "learning_rate": 1.1516783216783217e-06, "loss": 0.3303, "step": 41250 }, { "epoch": 35.75, "learning_rate": 1.1509790209790208e-06, "loss": 0.3426, "step": 41260 }, { "epoch": 35.76, "learning_rate": 1.1502797202797203e-06, "loss": 0.3911, "step": 41270 }, { "epoch": 35.77, "learning_rate": 1.1495804195804196e-06, "loss": 0.3745, "step": 41280 }, { "epoch": 35.78, "learning_rate": 1.1488811188811189e-06, "loss": 0.3718, "step": 41290 }, { "epoch": 35.79, "learning_rate": 1.1481818181818181e-06, "loss": 0.3834, "step": 41300 }, { "epoch": 35.8, "learning_rate": 1.1474825174825174e-06, "loss": 0.3581, "step": 41310 }, { "epoch": 35.81, "learning_rate": 1.1467832167832167e-06, "loss": 0.3344, "step": 41320 }, { "epoch": 35.81, "learning_rate": 1.146083916083916e-06, "loss": 0.3605, "step": 41330 }, { "epoch": 35.82, "learning_rate": 1.1453846153846155e-06, "loss": 0.3628, "step": 41340 }, { "epoch": 35.83, "learning_rate": 1.1446853146853146e-06, "loss": 0.3644, "step": 41350 }, { "epoch": 35.84, "learning_rate": 1.143986013986014e-06, "loss": 0.4126, "step": 41360 }, { "epoch": 35.85, "learning_rate": 1.1432867132867131e-06, "loss": 0.3505, "step": 41370 }, { "epoch": 35.86, "learning_rate": 1.1425874125874124e-06, "loss": 0.3332, "step": 41380 }, { "epoch": 35.87, "learning_rate": 1.141888111888112e-06, "loss": 0.3638, "step": 41390 }, { "epoch": 35.87, "learning_rate": 1.141188811188811e-06, "loss": 0.3721, "step": 41400 }, { "epoch": 35.88, "learning_rate": 1.1404895104895105e-06, "loss": 0.3965, "step": 41410 }, { "epoch": 35.89, "learning_rate": 1.1397902097902098e-06, "loss": 0.3817, "step": 41420 }, { "epoch": 35.9, "learning_rate": 1.139090909090909e-06, "loss": 0.3677, "step": 41430 }, { "epoch": 35.91, "learning_rate": 1.1383916083916083e-06, "loss": 0.3984, "step": 41440 }, { "epoch": 35.92, "learning_rate": 1.1376923076923076e-06, "loss": 0.3994, "step": 41450 }, { "epoch": 35.93, "learning_rate": 1.136993006993007e-06, "loss": 0.4064, "step": 41460 }, { "epoch": 35.94, "learning_rate": 1.1362937062937062e-06, "loss": 0.3398, "step": 41470 }, { "epoch": 35.94, "learning_rate": 1.1355944055944055e-06, "loss": 0.3784, "step": 41480 }, { "epoch": 35.95, "learning_rate": 1.1348951048951048e-06, "loss": 0.3623, "step": 41490 }, { "epoch": 35.96, "learning_rate": 1.1341958041958043e-06, "loss": 0.3722, "step": 41500 }, { "epoch": 35.97, "learning_rate": 1.1334965034965033e-06, "loss": 0.3532, "step": 41510 }, { "epoch": 35.98, "learning_rate": 1.1327972027972028e-06, "loss": 0.363, "step": 41520 }, { "epoch": 35.99, "learning_rate": 1.132097902097902e-06, "loss": 0.3761, "step": 41530 }, { "epoch": 36.0, "learning_rate": 1.1313986013986014e-06, "loss": 0.3886, "step": 41540 }, { "epoch": 36.0, "eval_loss": 0.558751106262207, "eval_runtime": 137.2985, "eval_samples_per_second": 3.875, "eval_steps_per_second": 1.937, "eval_wer": 0.24612714533650445, "step": 41544 }, { "epoch": 36.01, "learning_rate": 1.1306993006993007e-06, "loss": 0.3106, "step": 41550 }, { "epoch": 36.01, "learning_rate": 1.1299999999999998e-06, "loss": 0.3924, "step": 41560 }, { "epoch": 36.02, "learning_rate": 1.1293006993006993e-06, "loss": 0.346, "step": 41570 }, { "epoch": 36.03, "learning_rate": 1.1286013986013986e-06, "loss": 0.3785, "step": 41580 }, { "epoch": 36.04, "learning_rate": 1.1279020979020978e-06, "loss": 0.3385, "step": 41590 }, { "epoch": 36.05, "learning_rate": 1.1272027972027971e-06, "loss": 0.3389, "step": 41600 }, { "epoch": 36.06, "learning_rate": 1.1265034965034966e-06, "loss": 0.3237, "step": 41610 }, { "epoch": 36.07, "learning_rate": 1.1258041958041957e-06, "loss": 0.3436, "step": 41620 }, { "epoch": 36.07, "learning_rate": 1.1251048951048952e-06, "loss": 0.3671, "step": 41630 }, { "epoch": 36.08, "learning_rate": 1.1244055944055943e-06, "loss": 0.4029, "step": 41640 }, { "epoch": 36.09, "learning_rate": 1.1237062937062935e-06, "loss": 0.3575, "step": 41650 }, { "epoch": 36.1, "learning_rate": 1.123006993006993e-06, "loss": 0.3549, "step": 41660 }, { "epoch": 36.11, "learning_rate": 1.1223076923076921e-06, "loss": 0.3174, "step": 41670 }, { "epoch": 36.12, "learning_rate": 1.1216083916083916e-06, "loss": 0.3726, "step": 41680 }, { "epoch": 36.13, "learning_rate": 1.120909090909091e-06, "loss": 0.3989, "step": 41690 }, { "epoch": 36.14, "learning_rate": 1.1202097902097902e-06, "loss": 0.3642, "step": 41700 }, { "epoch": 36.14, "learning_rate": 1.1195104895104895e-06, "loss": 0.3407, "step": 41710 }, { "epoch": 36.15, "learning_rate": 1.1188111888111888e-06, "loss": 0.3471, "step": 41720 }, { "epoch": 36.16, "learning_rate": 1.118111888111888e-06, "loss": 0.3973, "step": 41730 }, { "epoch": 36.17, "learning_rate": 1.1174125874125873e-06, "loss": 0.3655, "step": 41740 }, { "epoch": 36.18, "learning_rate": 1.1167132867132866e-06, "loss": 0.354, "step": 41750 }, { "epoch": 36.19, "learning_rate": 1.116013986013986e-06, "loss": 0.3486, "step": 41760 }, { "epoch": 36.2, "learning_rate": 1.1153146853146854e-06, "loss": 0.3796, "step": 41770 }, { "epoch": 36.2, "learning_rate": 1.1146153846153845e-06, "loss": 0.3631, "step": 41780 }, { "epoch": 36.21, "learning_rate": 1.113916083916084e-06, "loss": 0.3843, "step": 41790 }, { "epoch": 36.22, "learning_rate": 1.113216783216783e-06, "loss": 0.3272, "step": 41800 }, { "epoch": 36.23, "learning_rate": 1.1125174825174825e-06, "loss": 0.3259, "step": 41810 }, { "epoch": 36.24, "learning_rate": 1.1118181818181818e-06, "loss": 0.3588, "step": 41820 }, { "epoch": 36.25, "learning_rate": 1.1111188811188809e-06, "loss": 0.3609, "step": 41830 }, { "epoch": 36.26, "learning_rate": 1.1104195804195804e-06, "loss": 0.4064, "step": 41840 }, { "epoch": 36.27, "learning_rate": 1.1097902097902096e-06, "loss": 0.3674, "step": 41850 }, { "epoch": 36.27, "learning_rate": 1.1090909090909091e-06, "loss": 0.3626, "step": 41860 }, { "epoch": 36.28, "learning_rate": 1.1083916083916082e-06, "loss": 0.309, "step": 41870 }, { "epoch": 36.29, "learning_rate": 1.1076923076923077e-06, "loss": 0.3654, "step": 41880 }, { "epoch": 36.3, "learning_rate": 1.106993006993007e-06, "loss": 0.3853, "step": 41890 }, { "epoch": 36.31, "learning_rate": 1.1062937062937063e-06, "loss": 0.4294, "step": 41900 }, { "epoch": 36.32, "learning_rate": 1.1055944055944056e-06, "loss": 0.3728, "step": 41910 }, { "epoch": 36.33, "learning_rate": 1.1048951048951046e-06, "loss": 0.355, "step": 41920 }, { "epoch": 36.33, "learning_rate": 1.1041958041958041e-06, "loss": 0.3343, "step": 41930 }, { "epoch": 36.34, "learning_rate": 1.1034965034965034e-06, "loss": 0.3595, "step": 41940 }, { "epoch": 36.35, "learning_rate": 1.1027972027972027e-06, "loss": 0.3631, "step": 41950 }, { "epoch": 36.36, "learning_rate": 1.102097902097902e-06, "loss": 0.3551, "step": 41960 }, { "epoch": 36.37, "learning_rate": 1.1013986013986015e-06, "loss": 0.3313, "step": 41970 }, { "epoch": 36.38, "learning_rate": 1.1006993006993006e-06, "loss": 0.3695, "step": 41980 }, { "epoch": 36.39, "learning_rate": 1.1e-06, "loss": 0.3779, "step": 41990 }, { "epoch": 36.39, "learning_rate": 1.0993006993006993e-06, "loss": 0.3474, "step": 42000 }, { "epoch": 36.4, "learning_rate": 1.0986013986013984e-06, "loss": 0.3375, "step": 42010 }, { "epoch": 36.41, "learning_rate": 1.097902097902098e-06, "loss": 0.3587, "step": 42020 }, { "epoch": 36.42, "learning_rate": 1.097202797202797e-06, "loss": 0.366, "step": 42030 }, { "epoch": 36.43, "learning_rate": 1.0965034965034965e-06, "loss": 0.3674, "step": 42040 }, { "epoch": 36.44, "learning_rate": 1.0958041958041958e-06, "loss": 0.3443, "step": 42050 }, { "epoch": 36.45, "learning_rate": 1.095104895104895e-06, "loss": 0.3428, "step": 42060 }, { "epoch": 36.46, "learning_rate": 1.0944055944055943e-06, "loss": 0.3715, "step": 42070 }, { "epoch": 36.46, "learning_rate": 1.0937062937062938e-06, "loss": 0.3847, "step": 42080 }, { "epoch": 36.47, "learning_rate": 1.093006993006993e-06, "loss": 0.3805, "step": 42090 }, { "epoch": 36.48, "learning_rate": 1.0923076923076922e-06, "loss": 0.4727, "step": 42100 }, { "epoch": 36.49, "learning_rate": 1.0916083916083915e-06, "loss": 0.4032, "step": 42110 }, { "epoch": 36.5, "learning_rate": 1.0909090909090908e-06, "loss": 0.3729, "step": 42120 }, { "epoch": 36.51, "learning_rate": 1.0902097902097903e-06, "loss": 0.3935, "step": 42130 }, { "epoch": 36.52, "learning_rate": 1.0895104895104893e-06, "loss": 0.4142, "step": 42140 }, { "epoch": 36.52, "learning_rate": 1.0888111888111888e-06, "loss": 0.4086, "step": 42150 }, { "epoch": 36.53, "learning_rate": 1.0881118881118881e-06, "loss": 0.3511, "step": 42160 }, { "epoch": 36.54, "learning_rate": 1.0874125874125874e-06, "loss": 0.3229, "step": 42170 }, { "epoch": 36.55, "learning_rate": 1.0867132867132867e-06, "loss": 0.3741, "step": 42180 }, { "epoch": 36.56, "learning_rate": 1.0860139860139858e-06, "loss": 0.3672, "step": 42190 }, { "epoch": 36.57, "learning_rate": 1.0853146853146853e-06, "loss": 0.3957, "step": 42200 }, { "epoch": 36.58, "learning_rate": 1.0846153846153845e-06, "loss": 0.3929, "step": 42210 }, { "epoch": 36.59, "learning_rate": 1.0839160839160838e-06, "loss": 0.3221, "step": 42220 }, { "epoch": 36.59, "learning_rate": 1.0832167832167831e-06, "loss": 0.359, "step": 42230 }, { "epoch": 36.6, "learning_rate": 1.0825174825174826e-06, "loss": 0.31, "step": 42240 }, { "epoch": 36.61, "learning_rate": 1.0818181818181817e-06, "loss": 0.3487, "step": 42250 }, { "epoch": 36.62, "learning_rate": 1.0811188811188812e-06, "loss": 0.389, "step": 42260 }, { "epoch": 36.63, "learning_rate": 1.0804195804195805e-06, "loss": 0.3275, "step": 42270 }, { "epoch": 36.64, "learning_rate": 1.0797202797202795e-06, "loss": 0.3415, "step": 42280 }, { "epoch": 36.65, "learning_rate": 1.079020979020979e-06, "loss": 0.3731, "step": 42290 }, { "epoch": 36.65, "learning_rate": 1.0783216783216781e-06, "loss": 0.3501, "step": 42300 }, { "epoch": 36.66, "learning_rate": 1.0776223776223776e-06, "loss": 0.3296, "step": 42310 }, { "epoch": 36.67, "learning_rate": 1.0769230769230769e-06, "loss": 0.3729, "step": 42320 }, { "epoch": 36.68, "learning_rate": 1.0762237762237762e-06, "loss": 0.3756, "step": 42330 }, { "epoch": 36.69, "learning_rate": 1.0755244755244755e-06, "loss": 0.2828, "step": 42340 }, { "epoch": 36.7, "learning_rate": 1.074825174825175e-06, "loss": 0.3814, "step": 42350 }, { "epoch": 36.71, "learning_rate": 1.074125874125874e-06, "loss": 0.3449, "step": 42360 }, { "epoch": 36.72, "learning_rate": 1.0734265734265733e-06, "loss": 0.3393, "step": 42370 }, { "epoch": 36.72, "learning_rate": 1.0727272727272726e-06, "loss": 0.5535, "step": 42380 }, { "epoch": 36.73, "learning_rate": 1.0720279720279719e-06, "loss": 0.3223, "step": 42390 }, { "epoch": 36.74, "learning_rate": 1.0713286713286714e-06, "loss": 0.422, "step": 42400 }, { "epoch": 36.75, "learning_rate": 1.0706293706293705e-06, "loss": 0.3859, "step": 42410 }, { "epoch": 36.76, "learning_rate": 1.06993006993007e-06, "loss": 0.3511, "step": 42420 }, { "epoch": 36.77, "learning_rate": 1.0692307692307692e-06, "loss": 0.3707, "step": 42430 }, { "epoch": 36.78, "learning_rate": 1.0685314685314685e-06, "loss": 0.3629, "step": 42440 }, { "epoch": 36.78, "learning_rate": 1.0678321678321678e-06, "loss": 0.2954, "step": 42450 }, { "epoch": 36.79, "learning_rate": 1.0671328671328669e-06, "loss": 0.3542, "step": 42460 }, { "epoch": 36.8, "learning_rate": 1.0664335664335664e-06, "loss": 0.3539, "step": 42470 }, { "epoch": 36.81, "learning_rate": 1.0657342657342657e-06, "loss": 0.3929, "step": 42480 }, { "epoch": 36.82, "learning_rate": 1.065034965034965e-06, "loss": 0.4005, "step": 42490 }, { "epoch": 36.83, "learning_rate": 1.0643356643356642e-06, "loss": 0.3936, "step": 42500 }, { "epoch": 36.84, "learning_rate": 1.0636363636363637e-06, "loss": 0.3981, "step": 42510 }, { "epoch": 36.85, "learning_rate": 1.0629370629370628e-06, "loss": 0.3591, "step": 42520 }, { "epoch": 36.85, "learning_rate": 1.0622377622377623e-06, "loss": 0.3683, "step": 42530 }, { "epoch": 36.86, "learning_rate": 1.0615384615384616e-06, "loss": 0.3906, "step": 42540 }, { "epoch": 36.87, "learning_rate": 1.0608391608391607e-06, "loss": 0.3424, "step": 42550 }, { "epoch": 36.88, "learning_rate": 1.0601398601398602e-06, "loss": 0.4172, "step": 42560 }, { "epoch": 36.89, "learning_rate": 1.0594405594405592e-06, "loss": 0.2909, "step": 42570 }, { "epoch": 36.9, "learning_rate": 1.0587412587412587e-06, "loss": 0.3886, "step": 42580 }, { "epoch": 36.91, "learning_rate": 1.058041958041958e-06, "loss": 0.3914, "step": 42590 }, { "epoch": 36.91, "learning_rate": 1.0573426573426573e-06, "loss": 0.3627, "step": 42600 }, { "epoch": 36.92, "learning_rate": 1.0566433566433566e-06, "loss": 0.3297, "step": 42610 }, { "epoch": 36.93, "learning_rate": 1.055944055944056e-06, "loss": 0.4152, "step": 42620 }, { "epoch": 36.94, "learning_rate": 1.0552447552447552e-06, "loss": 0.3648, "step": 42630 }, { "epoch": 36.95, "learning_rate": 1.0545454545454544e-06, "loss": 0.3864, "step": 42640 }, { "epoch": 36.96, "learning_rate": 1.0538461538461537e-06, "loss": 0.345, "step": 42650 }, { "epoch": 36.97, "learning_rate": 1.053146853146853e-06, "loss": 0.3624, "step": 42660 }, { "epoch": 36.98, "learning_rate": 1.0524475524475525e-06, "loss": 0.3598, "step": 42670 }, { "epoch": 36.98, "learning_rate": 1.0517482517482516e-06, "loss": 0.3666, "step": 42680 }, { "epoch": 36.99, "learning_rate": 1.051048951048951e-06, "loss": 0.41, "step": 42690 }, { "epoch": 37.0, "eval_loss": 0.5600542426109314, "eval_runtime": 136.3308, "eval_samples_per_second": 3.902, "eval_steps_per_second": 1.951, "eval_wer": 0.2506910072636112, "step": 42698 }, { "epoch": 37.0, "learning_rate": 1.0503496503496504e-06, "loss": 0.3753, "step": 42700 }, { "epoch": 37.01, "learning_rate": 1.0496503496503496e-06, "loss": 0.3875, "step": 42710 }, { "epoch": 37.02, "learning_rate": 1.048951048951049e-06, "loss": 0.3963, "step": 42720 }, { "epoch": 37.03, "learning_rate": 1.0482517482517482e-06, "loss": 0.3604, "step": 42730 }, { "epoch": 37.04, "learning_rate": 1.0475524475524475e-06, "loss": 0.4096, "step": 42740 }, { "epoch": 37.05, "learning_rate": 1.0468531468531468e-06, "loss": 0.3517, "step": 42750 }, { "epoch": 37.05, "learning_rate": 1.046153846153846e-06, "loss": 0.3432, "step": 42760 }, { "epoch": 37.06, "learning_rate": 1.0454545454545454e-06, "loss": 0.4349, "step": 42770 }, { "epoch": 37.07, "learning_rate": 1.0447552447552449e-06, "loss": 0.3735, "step": 42780 }, { "epoch": 37.08, "learning_rate": 1.044055944055944e-06, "loss": 0.407, "step": 42790 }, { "epoch": 37.09, "learning_rate": 1.0433566433566434e-06, "loss": 0.3428, "step": 42800 }, { "epoch": 37.1, "learning_rate": 1.0426573426573427e-06, "loss": 0.353, "step": 42810 }, { "epoch": 37.11, "learning_rate": 1.0419580419580418e-06, "loss": 0.3502, "step": 42820 }, { "epoch": 37.11, "learning_rate": 1.0412587412587413e-06, "loss": 0.3917, "step": 42830 }, { "epoch": 37.12, "learning_rate": 1.0405594405594404e-06, "loss": 0.4072, "step": 42840 }, { "epoch": 37.13, "learning_rate": 1.0398601398601399e-06, "loss": 0.3533, "step": 42850 }, { "epoch": 37.14, "learning_rate": 1.0391608391608391e-06, "loss": 0.3397, "step": 42860 }, { "epoch": 37.15, "learning_rate": 1.0384615384615384e-06, "loss": 0.394, "step": 42870 }, { "epoch": 37.16, "learning_rate": 1.0377622377622377e-06, "loss": 0.3791, "step": 42880 }, { "epoch": 37.17, "learning_rate": 1.0370629370629372e-06, "loss": 0.3509, "step": 42890 }, { "epoch": 37.17, "learning_rate": 1.0363636363636363e-06, "loss": 0.4394, "step": 42900 }, { "epoch": 37.18, "learning_rate": 1.0356643356643356e-06, "loss": 0.357, "step": 42910 }, { "epoch": 37.19, "learning_rate": 1.034965034965035e-06, "loss": 0.305, "step": 42920 }, { "epoch": 37.2, "learning_rate": 1.0342657342657341e-06, "loss": 0.3295, "step": 42930 }, { "epoch": 37.21, "learning_rate": 1.0335664335664336e-06, "loss": 0.4157, "step": 42940 }, { "epoch": 37.22, "learning_rate": 1.0328671328671327e-06, "loss": 0.386, "step": 42950 }, { "epoch": 37.23, "learning_rate": 1.0321678321678322e-06, "loss": 0.3664, "step": 42960 }, { "epoch": 37.24, "learning_rate": 1.0314685314685315e-06, "loss": 0.3553, "step": 42970 }, { "epoch": 37.24, "learning_rate": 1.0307692307692306e-06, "loss": 0.359, "step": 42980 }, { "epoch": 37.25, "learning_rate": 1.03006993006993e-06, "loss": 0.3668, "step": 42990 }, { "epoch": 37.26, "learning_rate": 1.0293706293706293e-06, "loss": 0.84, "step": 43000 }, { "epoch": 37.27, "learning_rate": 1.0286713286713286e-06, "loss": 0.4169, "step": 43010 }, { "epoch": 37.28, "learning_rate": 1.027972027972028e-06, "loss": 0.4215, "step": 43020 }, { "epoch": 37.29, "learning_rate": 1.0272727272727272e-06, "loss": 0.3693, "step": 43030 }, { "epoch": 37.3, "learning_rate": 1.0265734265734265e-06, "loss": 0.3395, "step": 43040 }, { "epoch": 37.3, "learning_rate": 1.025874125874126e-06, "loss": 0.3611, "step": 43050 }, { "epoch": 37.31, "learning_rate": 1.025174825174825e-06, "loss": 0.3396, "step": 43060 }, { "epoch": 37.32, "learning_rate": 1.0244755244755243e-06, "loss": 0.4121, "step": 43070 }, { "epoch": 37.33, "learning_rate": 1.0237762237762238e-06, "loss": 0.3261, "step": 43080 }, { "epoch": 37.34, "learning_rate": 1.023076923076923e-06, "loss": 0.3397, "step": 43090 }, { "epoch": 37.35, "learning_rate": 1.0223776223776224e-06, "loss": 0.2939, "step": 43100 }, { "epoch": 37.36, "learning_rate": 1.0216783216783215e-06, "loss": 0.3971, "step": 43110 }, { "epoch": 37.37, "learning_rate": 1.020979020979021e-06, "loss": 0.369, "step": 43120 }, { "epoch": 37.37, "learning_rate": 1.0202797202797203e-06, "loss": 0.367, "step": 43130 }, { "epoch": 37.38, "learning_rate": 1.0195804195804195e-06, "loss": 0.3512, "step": 43140 }, { "epoch": 37.39, "learning_rate": 1.0188811188811188e-06, "loss": 0.403, "step": 43150 }, { "epoch": 37.4, "learning_rate": 1.0181818181818181e-06, "loss": 0.3309, "step": 43160 }, { "epoch": 37.41, "learning_rate": 1.0174825174825174e-06, "loss": 0.3211, "step": 43170 }, { "epoch": 37.42, "learning_rate": 1.0167832167832167e-06, "loss": 0.3635, "step": 43180 }, { "epoch": 37.43, "learning_rate": 1.0160839160839162e-06, "loss": 0.3595, "step": 43190 }, { "epoch": 37.43, "learning_rate": 1.0153846153846153e-06, "loss": 0.3189, "step": 43200 }, { "epoch": 37.44, "learning_rate": 1.0146853146853148e-06, "loss": 0.3031, "step": 43210 }, { "epoch": 37.45, "learning_rate": 1.0139860139860138e-06, "loss": 0.3341, "step": 43220 }, { "epoch": 37.46, "learning_rate": 1.0132867132867133e-06, "loss": 0.3429, "step": 43230 }, { "epoch": 37.47, "learning_rate": 1.0125874125874126e-06, "loss": 0.3394, "step": 43240 }, { "epoch": 37.48, "learning_rate": 1.0118881118881117e-06, "loss": 0.3817, "step": 43250 }, { "epoch": 37.49, "learning_rate": 1.0111888111888112e-06, "loss": 0.3684, "step": 43260 }, { "epoch": 37.5, "learning_rate": 1.0104895104895105e-06, "loss": 0.3615, "step": 43270 }, { "epoch": 37.5, "learning_rate": 1.0097902097902098e-06, "loss": 0.364, "step": 43280 }, { "epoch": 37.51, "learning_rate": 1.009090909090909e-06, "loss": 0.44, "step": 43290 }, { "epoch": 37.52, "learning_rate": 1.0083916083916083e-06, "loss": 0.3402, "step": 43300 }, { "epoch": 37.53, "learning_rate": 1.0076923076923076e-06, "loss": 0.3225, "step": 43310 }, { "epoch": 37.54, "learning_rate": 1.006993006993007e-06, "loss": 0.3241, "step": 43320 }, { "epoch": 37.55, "learning_rate": 1.0062937062937062e-06, "loss": 0.3411, "step": 43330 }, { "epoch": 37.56, "learning_rate": 1.0055944055944055e-06, "loss": 0.35, "step": 43340 }, { "epoch": 37.56, "learning_rate": 1.004895104895105e-06, "loss": 0.3763, "step": 43350 }, { "epoch": 37.57, "learning_rate": 1.004195804195804e-06, "loss": 0.3327, "step": 43360 }, { "epoch": 37.58, "learning_rate": 1.0034965034965035e-06, "loss": 0.3849, "step": 43370 }, { "epoch": 37.59, "learning_rate": 1.0027972027972026e-06, "loss": 0.3767, "step": 43380 }, { "epoch": 37.6, "learning_rate": 1.002097902097902e-06, "loss": 0.4381, "step": 43390 }, { "epoch": 37.61, "learning_rate": 1.0013986013986014e-06, "loss": 0.4041, "step": 43400 }, { "epoch": 37.62, "learning_rate": 1.0006993006993007e-06, "loss": 0.3674, "step": 43410 }, { "epoch": 37.63, "learning_rate": 1e-06, "loss": 0.3349, "step": 43420 }, { "epoch": 37.63, "learning_rate": 9.993006993006992e-07, "loss": 0.344, "step": 43430 }, { "epoch": 37.64, "learning_rate": 9.986013986013985e-07, "loss": 0.3806, "step": 43440 }, { "epoch": 37.65, "learning_rate": 9.979020979020978e-07, "loss": 0.3198, "step": 43450 }, { "epoch": 37.66, "learning_rate": 9.972027972027973e-07, "loss": 0.3704, "step": 43460 }, { "epoch": 37.67, "learning_rate": 9.965034965034964e-07, "loss": 0.3334, "step": 43470 }, { "epoch": 37.68, "learning_rate": 9.958041958041957e-07, "loss": 0.3586, "step": 43480 }, { "epoch": 37.69, "learning_rate": 9.95104895104895e-07, "loss": 0.3963, "step": 43490 }, { "epoch": 37.69, "learning_rate": 9.944055944055944e-07, "loss": 0.3769, "step": 43500 }, { "epoch": 37.7, "learning_rate": 9.937062937062937e-07, "loss": 0.3593, "step": 43510 }, { "epoch": 37.71, "learning_rate": 9.93006993006993e-07, "loss": 0.3758, "step": 43520 }, { "epoch": 37.72, "learning_rate": 9.923076923076923e-07, "loss": 0.3967, "step": 43530 }, { "epoch": 37.73, "learning_rate": 9.916083916083916e-07, "loss": 0.3647, "step": 43540 }, { "epoch": 37.74, "learning_rate": 9.909090909090909e-07, "loss": 0.3461, "step": 43550 }, { "epoch": 37.75, "learning_rate": 9.902097902097902e-07, "loss": 0.3963, "step": 43560 }, { "epoch": 37.76, "learning_rate": 9.895104895104894e-07, "loss": 0.3842, "step": 43570 }, { "epoch": 37.76, "learning_rate": 9.888111888111887e-07, "loss": 0.3668, "step": 43580 }, { "epoch": 37.77, "learning_rate": 9.88111888111888e-07, "loss": 0.3835, "step": 43590 }, { "epoch": 37.78, "learning_rate": 9.874125874125873e-07, "loss": 0.3577, "step": 43600 }, { "epoch": 37.79, "learning_rate": 9.867132867132866e-07, "loss": 0.3185, "step": 43610 }, { "epoch": 37.8, "learning_rate": 9.86013986013986e-07, "loss": 0.3138, "step": 43620 }, { "epoch": 37.81, "learning_rate": 9.853146853146854e-07, "loss": 0.3538, "step": 43630 }, { "epoch": 37.82, "learning_rate": 9.846153846153847e-07, "loss": 0.3668, "step": 43640 }, { "epoch": 37.82, "learning_rate": 9.839160839160837e-07, "loss": 0.37, "step": 43650 }, { "epoch": 37.83, "learning_rate": 9.832167832167832e-07, "loss": 0.3803, "step": 43660 }, { "epoch": 37.84, "learning_rate": 9.825174825174825e-07, "loss": 0.3459, "step": 43670 }, { "epoch": 37.85, "learning_rate": 9.818181818181818e-07, "loss": 0.4266, "step": 43680 }, { "epoch": 37.86, "learning_rate": 9.81118881118881e-07, "loss": 0.3547, "step": 43690 }, { "epoch": 37.87, "learning_rate": 9.804195804195804e-07, "loss": 0.3848, "step": 43700 }, { "epoch": 37.88, "learning_rate": 9.797202797202796e-07, "loss": 0.3814, "step": 43710 }, { "epoch": 37.89, "learning_rate": 9.79020979020979e-07, "loss": 0.3339, "step": 43720 }, { "epoch": 37.89, "learning_rate": 9.783216783216782e-07, "loss": 0.3518, "step": 43730 }, { "epoch": 37.9, "learning_rate": 9.776223776223775e-07, "loss": 0.3501, "step": 43740 }, { "epoch": 37.91, "learning_rate": 9.769230769230768e-07, "loss": 0.4146, "step": 43750 }, { "epoch": 37.92, "learning_rate": 9.76223776223776e-07, "loss": 0.3855, "step": 43760 }, { "epoch": 37.93, "learning_rate": 9.755244755244756e-07, "loss": 0.3061, "step": 43770 }, { "epoch": 37.94, "learning_rate": 9.748251748251749e-07, "loss": 0.3929, "step": 43780 }, { "epoch": 37.95, "learning_rate": 9.741258741258741e-07, "loss": 0.3627, "step": 43790 }, { "epoch": 37.95, "learning_rate": 9.734265734265734e-07, "loss": 0.3824, "step": 43800 }, { "epoch": 37.96, "learning_rate": 9.727272727272727e-07, "loss": 0.3575, "step": 43810 }, { "epoch": 37.97, "learning_rate": 9.72027972027972e-07, "loss": 0.3515, "step": 43820 }, { "epoch": 37.98, "learning_rate": 9.713286713286713e-07, "loss": 0.3463, "step": 43830 }, { "epoch": 37.99, "learning_rate": 9.706293706293706e-07, "loss": 0.3723, "step": 43840 }, { "epoch": 38.0, "learning_rate": 9.699300699300699e-07, "loss": 0.3595, "step": 43850 }, { "epoch": 38.0, "eval_loss": 0.5644901990890503, "eval_runtime": 138.0216, "eval_samples_per_second": 3.854, "eval_steps_per_second": 1.927, "eval_wer": 0.24252747959118082, "step": 43852 }, { "epoch": 38.01, "learning_rate": 9.692307692307691e-07, "loss": 0.3875, "step": 43860 }, { "epoch": 38.02, "learning_rate": 9.685314685314684e-07, "loss": 0.3265, "step": 43870 }, { "epoch": 38.02, "learning_rate": 9.678321678321677e-07, "loss": 0.3206, "step": 43880 }, { "epoch": 38.03, "learning_rate": 9.671328671328672e-07, "loss": 0.3687, "step": 43890 }, { "epoch": 38.04, "learning_rate": 9.664335664335665e-07, "loss": 0.3597, "step": 43900 }, { "epoch": 38.05, "learning_rate": 9.657342657342656e-07, "loss": 0.3749, "step": 43910 }, { "epoch": 38.06, "learning_rate": 9.650349650349648e-07, "loss": 0.4115, "step": 43920 }, { "epoch": 38.07, "learning_rate": 9.643356643356643e-07, "loss": 0.3816, "step": 43930 }, { "epoch": 38.08, "learning_rate": 9.636363636363636e-07, "loss": 0.3347, "step": 43940 }, { "epoch": 38.08, "learning_rate": 9.62937062937063e-07, "loss": 0.3663, "step": 43950 }, { "epoch": 38.09, "learning_rate": 9.622377622377622e-07, "loss": 0.3175, "step": 43960 }, { "epoch": 38.1, "learning_rate": 9.615384615384615e-07, "loss": 0.4146, "step": 43970 }, { "epoch": 38.11, "learning_rate": 9.608391608391608e-07, "loss": 0.3256, "step": 43980 }, { "epoch": 38.12, "learning_rate": 9.6013986013986e-07, "loss": 0.3867, "step": 43990 }, { "epoch": 38.13, "learning_rate": 9.594405594405593e-07, "loss": 0.3616, "step": 44000 }, { "epoch": 38.14, "learning_rate": 9.587412587412586e-07, "loss": 0.382, "step": 44010 }, { "epoch": 38.15, "learning_rate": 9.58041958041958e-07, "loss": 0.368, "step": 44020 }, { "epoch": 38.15, "learning_rate": 9.573426573426572e-07, "loss": 0.387, "step": 44030 }, { "epoch": 38.16, "learning_rate": 9.566433566433567e-07, "loss": 0.3909, "step": 44040 }, { "epoch": 38.17, "learning_rate": 9.55944055944056e-07, "loss": 0.3383, "step": 44050 }, { "epoch": 38.18, "learning_rate": 9.552447552447553e-07, "loss": 0.338, "step": 44060 }, { "epoch": 38.19, "learning_rate": 9.545454545454546e-07, "loss": 0.3665, "step": 44070 }, { "epoch": 38.2, "learning_rate": 9.538461538461538e-07, "loss": 0.3143, "step": 44080 }, { "epoch": 38.21, "learning_rate": 9.53146853146853e-07, "loss": 0.357, "step": 44090 }, { "epoch": 38.21, "learning_rate": 9.524475524475524e-07, "loss": 0.361, "step": 44100 }, { "epoch": 38.22, "learning_rate": 9.517482517482517e-07, "loss": 0.3403, "step": 44110 }, { "epoch": 38.23, "learning_rate": 9.51048951048951e-07, "loss": 0.4304, "step": 44120 }, { "epoch": 38.24, "learning_rate": 9.503496503496503e-07, "loss": 0.3789, "step": 44130 }, { "epoch": 38.25, "learning_rate": 9.496503496503497e-07, "loss": 0.4432, "step": 44140 }, { "epoch": 38.26, "learning_rate": 9.489510489510489e-07, "loss": 0.3962, "step": 44150 }, { "epoch": 38.27, "learning_rate": 9.482517482517482e-07, "loss": 0.3889, "step": 44160 }, { "epoch": 38.28, "learning_rate": 9.475524475524476e-07, "loss": 0.3886, "step": 44170 }, { "epoch": 38.28, "learning_rate": 9.468531468531468e-07, "loss": 0.3698, "step": 44180 }, { "epoch": 38.29, "learning_rate": 9.461538461538461e-07, "loss": 0.363, "step": 44190 }, { "epoch": 38.3, "learning_rate": 9.454545454545454e-07, "loss": 0.3795, "step": 44200 }, { "epoch": 38.31, "learning_rate": 9.447552447552448e-07, "loss": 0.3191, "step": 44210 }, { "epoch": 38.32, "learning_rate": 9.44055944055944e-07, "loss": 0.3204, "step": 44220 }, { "epoch": 38.33, "learning_rate": 9.433566433566433e-07, "loss": 0.3443, "step": 44230 }, { "epoch": 38.34, "learning_rate": 9.426573426573426e-07, "loss": 0.3001, "step": 44240 }, { "epoch": 38.34, "learning_rate": 9.41958041958042e-07, "loss": 0.3616, "step": 44250 }, { "epoch": 38.35, "learning_rate": 9.412587412587412e-07, "loss": 0.3068, "step": 44260 }, { "epoch": 38.36, "learning_rate": 9.405594405594405e-07, "loss": 0.3636, "step": 44270 }, { "epoch": 38.37, "learning_rate": 9.398601398601398e-07, "loss": 0.3701, "step": 44280 }, { "epoch": 38.38, "learning_rate": 9.391608391608391e-07, "loss": 0.3862, "step": 44290 }, { "epoch": 38.39, "learning_rate": 9.384615384615384e-07, "loss": 0.4033, "step": 44300 }, { "epoch": 38.4, "learning_rate": 9.377622377622377e-07, "loss": 0.3917, "step": 44310 }, { "epoch": 38.41, "learning_rate": 9.37062937062937e-07, "loss": 0.3281, "step": 44320 }, { "epoch": 38.41, "learning_rate": 9.363636363636364e-07, "loss": 0.3073, "step": 44330 }, { "epoch": 38.42, "learning_rate": 9.356643356643357e-07, "loss": 0.3964, "step": 44340 }, { "epoch": 38.43, "learning_rate": 9.349650349650349e-07, "loss": 0.3475, "step": 44350 }, { "epoch": 38.44, "learning_rate": 9.342657342657341e-07, "loss": 0.3904, "step": 44360 }, { "epoch": 38.45, "learning_rate": 9.335664335664335e-07, "loss": 0.3616, "step": 44370 }, { "epoch": 38.46, "learning_rate": 9.328671328671328e-07, "loss": 0.3734, "step": 44380 }, { "epoch": 38.47, "learning_rate": 9.321678321678321e-07, "loss": 0.3758, "step": 44390 }, { "epoch": 38.47, "learning_rate": 9.314685314685314e-07, "loss": 0.3554, "step": 44400 }, { "epoch": 38.48, "learning_rate": 9.307692307692308e-07, "loss": 0.3412, "step": 44410 }, { "epoch": 38.49, "learning_rate": 9.300699300699301e-07, "loss": 0.3786, "step": 44420 }, { "epoch": 38.5, "learning_rate": 9.293706293706293e-07, "loss": 0.329, "step": 44430 }, { "epoch": 38.51, "learning_rate": 9.286713286713286e-07, "loss": 0.3826, "step": 44440 }, { "epoch": 38.52, "learning_rate": 9.279720279720279e-07, "loss": 0.382, "step": 44450 }, { "epoch": 38.53, "learning_rate": 9.272727272727272e-07, "loss": 0.345, "step": 44460 }, { "epoch": 38.54, "learning_rate": 9.265734265734265e-07, "loss": 0.4207, "step": 44470 }, { "epoch": 38.54, "learning_rate": 9.258741258741259e-07, "loss": 0.3646, "step": 44480 }, { "epoch": 38.55, "learning_rate": 9.251748251748252e-07, "loss": 0.3903, "step": 44490 }, { "epoch": 38.56, "learning_rate": 9.244755244755244e-07, "loss": 0.3991, "step": 44500 }, { "epoch": 38.57, "learning_rate": 9.237762237762237e-07, "loss": 0.3537, "step": 44510 }, { "epoch": 38.58, "learning_rate": 9.230769230769231e-07, "loss": 0.355, "step": 44520 }, { "epoch": 38.59, "learning_rate": 9.223776223776223e-07, "loss": 0.3738, "step": 44530 }, { "epoch": 38.6, "learning_rate": 9.216783216783216e-07, "loss": 0.3995, "step": 44540 }, { "epoch": 38.6, "learning_rate": 9.209790209790209e-07, "loss": 0.3621, "step": 44550 }, { "epoch": 38.61, "learning_rate": 9.202797202797203e-07, "loss": 0.3447, "step": 44560 }, { "epoch": 38.62, "learning_rate": 9.195804195804196e-07, "loss": 0.3588, "step": 44570 }, { "epoch": 38.63, "learning_rate": 9.188811188811188e-07, "loss": 0.3549, "step": 44580 }, { "epoch": 38.64, "learning_rate": 9.181818181818181e-07, "loss": 0.3609, "step": 44590 }, { "epoch": 38.65, "learning_rate": 9.174825174825175e-07, "loss": 0.3788, "step": 44600 }, { "epoch": 38.66, "learning_rate": 9.167832167832168e-07, "loss": 0.3588, "step": 44610 }, { "epoch": 38.67, "learning_rate": 9.16083916083916e-07, "loss": 0.3362, "step": 44620 }, { "epoch": 38.67, "learning_rate": 9.153846153846153e-07, "loss": 0.3101, "step": 44630 }, { "epoch": 38.68, "learning_rate": 9.146853146853147e-07, "loss": 0.3447, "step": 44640 }, { "epoch": 38.69, "learning_rate": 9.139860139860139e-07, "loss": 0.4118, "step": 44650 }, { "epoch": 38.7, "learning_rate": 9.132867132867132e-07, "loss": 0.3416, "step": 44660 }, { "epoch": 38.71, "learning_rate": 9.125874125874126e-07, "loss": 0.324, "step": 44670 }, { "epoch": 38.72, "learning_rate": 9.118881118881119e-07, "loss": 0.2899, "step": 44680 }, { "epoch": 38.73, "learning_rate": 9.111888111888112e-07, "loss": 0.4077, "step": 44690 }, { "epoch": 38.73, "learning_rate": 9.104895104895104e-07, "loss": 0.3471, "step": 44700 }, { "epoch": 38.74, "learning_rate": 9.097902097902098e-07, "loss": 0.4073, "step": 44710 }, { "epoch": 38.75, "learning_rate": 9.09090909090909e-07, "loss": 0.3735, "step": 44720 }, { "epoch": 38.76, "learning_rate": 9.083916083916083e-07, "loss": 0.383, "step": 44730 }, { "epoch": 38.77, "learning_rate": 9.076923076923076e-07, "loss": 0.3692, "step": 44740 }, { "epoch": 38.78, "learning_rate": 9.06993006993007e-07, "loss": 0.3726, "step": 44750 }, { "epoch": 38.79, "learning_rate": 9.062937062937063e-07, "loss": 0.419, "step": 44760 }, { "epoch": 38.8, "learning_rate": 9.055944055944056e-07, "loss": 0.3219, "step": 44770 }, { "epoch": 38.8, "learning_rate": 9.048951048951049e-07, "loss": 0.333, "step": 44780 }, { "epoch": 38.81, "learning_rate": 9.041958041958041e-07, "loss": 0.3529, "step": 44790 }, { "epoch": 38.82, "learning_rate": 9.034965034965034e-07, "loss": 0.3975, "step": 44800 }, { "epoch": 38.83, "learning_rate": 9.027972027972027e-07, "loss": 0.3833, "step": 44810 }, { "epoch": 38.84, "learning_rate": 9.02097902097902e-07, "loss": 0.3765, "step": 44820 }, { "epoch": 38.85, "learning_rate": 9.013986013986014e-07, "loss": 0.3236, "step": 44830 }, { "epoch": 38.86, "learning_rate": 9.006993006993007e-07, "loss": 0.3945, "step": 44840 }, { "epoch": 38.86, "learning_rate": 9e-07, "loss": 0.3876, "step": 44850 }, { "epoch": 38.87, "learning_rate": 8.993006993006992e-07, "loss": 0.3197, "step": 44860 }, { "epoch": 38.88, "learning_rate": 8.986013986013986e-07, "loss": 0.3528, "step": 44870 }, { "epoch": 38.89, "learning_rate": 8.979020979020978e-07, "loss": 0.3329, "step": 44880 }, { "epoch": 38.9, "learning_rate": 8.972027972027971e-07, "loss": 0.378, "step": 44890 }, { "epoch": 38.91, "learning_rate": 8.965034965034964e-07, "loss": 0.3684, "step": 44900 }, { "epoch": 38.92, "learning_rate": 8.958041958041958e-07, "loss": 0.3379, "step": 44910 }, { "epoch": 38.93, "learning_rate": 8.951048951048951e-07, "loss": 0.4082, "step": 44920 }, { "epoch": 38.93, "learning_rate": 8.944055944055943e-07, "loss": 0.4096, "step": 44930 }, { "epoch": 38.94, "learning_rate": 8.937062937062937e-07, "loss": 0.3939, "step": 44940 }, { "epoch": 38.95, "learning_rate": 8.93006993006993e-07, "loss": 0.3941, "step": 44950 }, { "epoch": 38.96, "learning_rate": 8.923076923076923e-07, "loss": 0.3486, "step": 44960 }, { "epoch": 38.97, "learning_rate": 8.916083916083915e-07, "loss": 0.365, "step": 44970 }, { "epoch": 38.98, "learning_rate": 8.909090909090909e-07, "loss": 0.3748, "step": 44980 }, { "epoch": 38.99, "learning_rate": 8.902097902097902e-07, "loss": 0.3601, "step": 44990 }, { "epoch": 38.99, "learning_rate": 8.895104895104894e-07, "loss": 0.4174, "step": 45000 }, { "epoch": 39.0, "eval_loss": 0.5560790300369263, "eval_runtime": 134.861, "eval_samples_per_second": 3.945, "eval_steps_per_second": 1.972, "eval_wer": 0.2422060808639198, "step": 45006 }, { "epoch": 39.0, "learning_rate": 8.888111888111887e-07, "loss": 0.3254, "step": 45010 }, { "epoch": 39.01, "learning_rate": 8.881118881118881e-07, "loss": 0.3612, "step": 45020 }, { "epoch": 39.02, "learning_rate": 8.874125874125874e-07, "loss": 0.3244, "step": 45030 }, { "epoch": 39.03, "learning_rate": 8.867132867132867e-07, "loss": 0.3464, "step": 45040 }, { "epoch": 39.04, "learning_rate": 8.86013986013986e-07, "loss": 0.3929, "step": 45050 }, { "epoch": 39.05, "learning_rate": 8.853146853146853e-07, "loss": 0.3325, "step": 45060 }, { "epoch": 39.06, "learning_rate": 8.846153846153846e-07, "loss": 0.3727, "step": 45070 }, { "epoch": 39.06, "learning_rate": 8.839160839160838e-07, "loss": 0.3336, "step": 45080 }, { "epoch": 39.07, "learning_rate": 8.832167832167831e-07, "loss": 0.365, "step": 45090 }, { "epoch": 39.08, "learning_rate": 8.825174825174825e-07, "loss": 0.3776, "step": 45100 }, { "epoch": 39.09, "learning_rate": 8.818181818181818e-07, "loss": 0.3349, "step": 45110 }, { "epoch": 39.1, "learning_rate": 8.811188811188811e-07, "loss": 0.3766, "step": 45120 }, { "epoch": 39.11, "learning_rate": 8.804195804195805e-07, "loss": 0.3304, "step": 45130 }, { "epoch": 39.12, "learning_rate": 8.797202797202798e-07, "loss": 0.3559, "step": 45140 }, { "epoch": 39.12, "learning_rate": 8.790209790209789e-07, "loss": 0.3789, "step": 45150 }, { "epoch": 39.13, "learning_rate": 8.783216783216782e-07, "loss": 0.3489, "step": 45160 }, { "epoch": 39.14, "learning_rate": 8.776223776223776e-07, "loss": 0.3391, "step": 45170 }, { "epoch": 39.15, "learning_rate": 8.769230769230769e-07, "loss": 0.3677, "step": 45180 }, { "epoch": 39.16, "learning_rate": 8.762237762237762e-07, "loss": 0.3268, "step": 45190 }, { "epoch": 39.17, "learning_rate": 8.755244755244755e-07, "loss": 0.3579, "step": 45200 }, { "epoch": 39.18, "learning_rate": 8.748251748251749e-07, "loss": 0.3822, "step": 45210 }, { "epoch": 39.19, "learning_rate": 8.741258741258741e-07, "loss": 0.3721, "step": 45220 }, { "epoch": 39.19, "learning_rate": 8.734265734265733e-07, "loss": 0.3749, "step": 45230 }, { "epoch": 39.2, "learning_rate": 8.727272727272726e-07, "loss": 0.3774, "step": 45240 }, { "epoch": 39.21, "learning_rate": 8.72027972027972e-07, "loss": 0.4054, "step": 45250 }, { "epoch": 39.22, "learning_rate": 8.713286713286713e-07, "loss": 0.3563, "step": 45260 }, { "epoch": 39.23, "learning_rate": 8.706293706293706e-07, "loss": 0.3177, "step": 45270 }, { "epoch": 39.24, "learning_rate": 8.699300699300699e-07, "loss": 0.3767, "step": 45280 }, { "epoch": 39.25, "learning_rate": 8.692307692307692e-07, "loss": 0.3558, "step": 45290 }, { "epoch": 39.25, "learning_rate": 8.685314685314685e-07, "loss": 0.367, "step": 45300 }, { "epoch": 39.26, "learning_rate": 8.678321678321678e-07, "loss": 0.3671, "step": 45310 }, { "epoch": 39.27, "learning_rate": 8.67132867132867e-07, "loss": 0.3949, "step": 45320 }, { "epoch": 39.28, "learning_rate": 8.664335664335664e-07, "loss": 0.3387, "step": 45330 }, { "epoch": 39.29, "learning_rate": 8.657342657342657e-07, "loss": 0.3181, "step": 45340 }, { "epoch": 39.3, "learning_rate": 8.65034965034965e-07, "loss": 0.4401, "step": 45350 }, { "epoch": 39.31, "learning_rate": 8.644055944055943e-07, "loss": 1.004, "step": 45360 }, { "epoch": 39.32, "learning_rate": 8.637062937062937e-07, "loss": 0.3415, "step": 45370 }, { "epoch": 39.32, "learning_rate": 8.63006993006993e-07, "loss": 0.3209, "step": 45380 }, { "epoch": 39.33, "learning_rate": 8.623076923076923e-07, "loss": 0.3658, "step": 45390 }, { "epoch": 39.34, "learning_rate": 8.616083916083916e-07, "loss": 0.3934, "step": 45400 }, { "epoch": 39.35, "learning_rate": 8.60909090909091e-07, "loss": 0.3391, "step": 45410 }, { "epoch": 39.36, "learning_rate": 8.602097902097901e-07, "loss": 0.3803, "step": 45420 }, { "epoch": 39.37, "learning_rate": 8.595104895104894e-07, "loss": 0.3205, "step": 45430 }, { "epoch": 39.38, "learning_rate": 8.588111888111887e-07, "loss": 0.3482, "step": 45440 }, { "epoch": 39.38, "learning_rate": 8.581118881118881e-07, "loss": 0.327, "step": 45450 }, { "epoch": 39.39, "learning_rate": 8.574125874125874e-07, "loss": 0.3618, "step": 45460 }, { "epoch": 39.4, "learning_rate": 8.567132867132867e-07, "loss": 0.2993, "step": 45470 }, { "epoch": 39.41, "learning_rate": 8.56013986013986e-07, "loss": 0.3172, "step": 45480 }, { "epoch": 39.42, "learning_rate": 8.553146853146853e-07, "loss": 0.3522, "step": 45490 }, { "epoch": 39.43, "learning_rate": 8.546153846153846e-07, "loss": 0.4131, "step": 45500 }, { "epoch": 39.44, "learning_rate": 8.539160839160838e-07, "loss": 0.3244, "step": 45510 }, { "epoch": 39.45, "learning_rate": 8.532167832167831e-07, "loss": 0.4001, "step": 45520 }, { "epoch": 39.45, "learning_rate": 8.525174825174825e-07, "loss": 0.3875, "step": 45530 }, { "epoch": 39.46, "learning_rate": 8.518181818181818e-07, "loss": 0.3784, "step": 45540 }, { "epoch": 39.47, "learning_rate": 8.51118881118881e-07, "loss": 0.3371, "step": 45550 }, { "epoch": 39.48, "learning_rate": 8.504195804195804e-07, "loss": 0.3874, "step": 45560 }, { "epoch": 39.49, "learning_rate": 8.497202797202797e-07, "loss": 0.4045, "step": 45570 }, { "epoch": 39.5, "learning_rate": 8.49020979020979e-07, "loss": 0.3472, "step": 45580 }, { "epoch": 39.51, "learning_rate": 8.483216783216783e-07, "loss": 0.3323, "step": 45590 }, { "epoch": 39.51, "learning_rate": 8.476223776223776e-07, "loss": 0.3584, "step": 45600 }, { "epoch": 39.52, "learning_rate": 8.469230769230769e-07, "loss": 0.3508, "step": 45610 }, { "epoch": 39.53, "learning_rate": 8.462237762237762e-07, "loss": 0.3475, "step": 45620 }, { "epoch": 39.54, "learning_rate": 8.455244755244754e-07, "loss": 0.3261, "step": 45630 }, { "epoch": 39.55, "learning_rate": 8.448251748251748e-07, "loss": 0.3484, "step": 45640 }, { "epoch": 39.56, "learning_rate": 8.441258741258741e-07, "loss": 0.3232, "step": 45650 }, { "epoch": 39.57, "learning_rate": 8.434265734265734e-07, "loss": 0.3817, "step": 45660 }, { "epoch": 39.58, "learning_rate": 8.427272727272727e-07, "loss": 0.3977, "step": 45670 }, { "epoch": 39.58, "learning_rate": 8.420279720279721e-07, "loss": 0.3844, "step": 45680 }, { "epoch": 39.59, "learning_rate": 8.413286713286713e-07, "loss": 0.4122, "step": 45690 }, { "epoch": 39.6, "learning_rate": 8.406293706293705e-07, "loss": 0.3463, "step": 45700 }, { "epoch": 39.61, "learning_rate": 8.399300699300698e-07, "loss": 0.3676, "step": 45710 }, { "epoch": 39.62, "learning_rate": 8.392307692307692e-07, "loss": 0.3153, "step": 45720 }, { "epoch": 39.63, "learning_rate": 8.385314685314685e-07, "loss": 0.3782, "step": 45730 }, { "epoch": 39.64, "learning_rate": 8.378321678321678e-07, "loss": 0.3946, "step": 45740 }, { "epoch": 39.64, "learning_rate": 8.371328671328672e-07, "loss": 0.337, "step": 45750 }, { "epoch": 39.65, "learning_rate": 8.364335664335665e-07, "loss": 0.343, "step": 45760 }, { "epoch": 39.66, "learning_rate": 8.357342657342656e-07, "loss": 0.4086, "step": 45770 }, { "epoch": 39.67, "learning_rate": 8.350349650349649e-07, "loss": 0.3289, "step": 45780 }, { "epoch": 39.68, "learning_rate": 8.343356643356643e-07, "loss": 0.3764, "step": 45790 }, { "epoch": 39.69, "learning_rate": 8.336363636363636e-07, "loss": 0.4078, "step": 45800 }, { "epoch": 39.7, "learning_rate": 8.329370629370629e-07, "loss": 0.3649, "step": 45810 }, { "epoch": 39.71, "learning_rate": 8.322377622377622e-07, "loss": 0.3192, "step": 45820 }, { "epoch": 39.71, "learning_rate": 8.315384615384616e-07, "loss": 0.3186, "step": 45830 }, { "epoch": 39.72, "learning_rate": 8.308391608391609e-07, "loss": 0.3843, "step": 45840 }, { "epoch": 39.73, "learning_rate": 8.301398601398601e-07, "loss": 0.4289, "step": 45850 }, { "epoch": 39.74, "learning_rate": 8.294405594405593e-07, "loss": 0.3832, "step": 45860 }, { "epoch": 39.75, "learning_rate": 8.287412587412587e-07, "loss": 0.3709, "step": 45870 }, { "epoch": 39.76, "learning_rate": 8.28041958041958e-07, "loss": 0.3485, "step": 45880 }, { "epoch": 39.77, "learning_rate": 8.273426573426573e-07, "loss": 0.4107, "step": 45890 }, { "epoch": 39.77, "learning_rate": 8.266433566433566e-07, "loss": 0.3506, "step": 45900 }, { "epoch": 39.78, "learning_rate": 8.25944055944056e-07, "loss": 0.3926, "step": 45910 }, { "epoch": 39.79, "learning_rate": 8.252447552447552e-07, "loss": 0.3188, "step": 45920 }, { "epoch": 39.8, "learning_rate": 8.245454545454545e-07, "loss": 0.3841, "step": 45930 }, { "epoch": 39.81, "learning_rate": 8.238461538461538e-07, "loss": 0.33, "step": 45940 }, { "epoch": 39.82, "learning_rate": 8.231468531468531e-07, "loss": 0.4078, "step": 45950 }, { "epoch": 39.83, "learning_rate": 8.224475524475524e-07, "loss": 0.3734, "step": 45960 }, { "epoch": 39.83, "learning_rate": 8.217482517482517e-07, "loss": 0.433, "step": 45970 }, { "epoch": 39.84, "learning_rate": 8.21048951048951e-07, "loss": 0.3371, "step": 45980 }, { "epoch": 39.85, "learning_rate": 8.203496503496503e-07, "loss": 0.3286, "step": 45990 }, { "epoch": 39.86, "learning_rate": 8.196503496503496e-07, "loss": 0.3165, "step": 46000 }, { "epoch": 39.87, "learning_rate": 8.189510489510489e-07, "loss": 0.3681, "step": 46010 }, { "epoch": 39.88, "learning_rate": 8.182517482517483e-07, "loss": 0.4005, "step": 46020 }, { "epoch": 39.89, "learning_rate": 8.175524475524476e-07, "loss": 0.3461, "step": 46030 }, { "epoch": 39.9, "learning_rate": 8.168531468531468e-07, "loss": 0.3826, "step": 46040 }, { "epoch": 39.9, "learning_rate": 8.16153846153846e-07, "loss": 0.3303, "step": 46050 }, { "epoch": 39.91, "learning_rate": 8.154545454545454e-07, "loss": 0.3725, "step": 46060 }, { "epoch": 39.92, "learning_rate": 8.147552447552447e-07, "loss": 0.3333, "step": 46070 }, { "epoch": 39.93, "learning_rate": 8.14055944055944e-07, "loss": 0.3256, "step": 46080 }, { "epoch": 39.94, "learning_rate": 8.133566433566433e-07, "loss": 0.3596, "step": 46090 }, { "epoch": 39.95, "learning_rate": 8.126573426573427e-07, "loss": 0.3749, "step": 46100 }, { "epoch": 39.96, "learning_rate": 8.11958041958042e-07, "loss": 0.3801, "step": 46110 }, { "epoch": 39.96, "learning_rate": 8.112587412587413e-07, "loss": 0.3549, "step": 46120 }, { "epoch": 39.97, "learning_rate": 8.105594405594404e-07, "loss": 0.2963, "step": 46130 }, { "epoch": 39.98, "learning_rate": 8.098601398601398e-07, "loss": 0.3943, "step": 46140 }, { "epoch": 39.99, "learning_rate": 8.091608391608391e-07, "loss": 0.4128, "step": 46150 }, { "epoch": 40.0, "learning_rate": 8.084615384615384e-07, "loss": 0.3801, "step": 46160 }, { "epoch": 40.0, "eval_loss": 0.555422306060791, "eval_runtime": 135.1325, "eval_samples_per_second": 3.937, "eval_steps_per_second": 1.968, "eval_wer": 0.24265603908208525, "step": 46160 }, { "epoch": 40.01, "learning_rate": 8.077622377622377e-07, "loss": 0.3376, "step": 46170 }, { "epoch": 40.02, "learning_rate": 8.070629370629371e-07, "loss": 0.3705, "step": 46180 }, { "epoch": 40.03, "learning_rate": 8.063636363636364e-07, "loss": 0.3501, "step": 46190 }, { "epoch": 40.03, "learning_rate": 8.056643356643356e-07, "loss": 0.3822, "step": 46200 }, { "epoch": 40.04, "learning_rate": 8.049650349650349e-07, "loss": 0.4096, "step": 46210 }, { "epoch": 40.05, "learning_rate": 8.042657342657342e-07, "loss": 0.3671, "step": 46220 }, { "epoch": 40.06, "learning_rate": 8.035664335664335e-07, "loss": 0.3587, "step": 46230 }, { "epoch": 40.07, "learning_rate": 8.028671328671328e-07, "loss": 0.3556, "step": 46240 }, { "epoch": 40.08, "learning_rate": 8.021678321678321e-07, "loss": 0.3804, "step": 46250 }, { "epoch": 40.09, "learning_rate": 8.014685314685315e-07, "loss": 0.3352, "step": 46260 }, { "epoch": 40.1, "learning_rate": 8.007692307692308e-07, "loss": 0.3717, "step": 46270 }, { "epoch": 40.1, "learning_rate": 8.0006993006993e-07, "loss": 0.3979, "step": 46280 }, { "epoch": 40.11, "learning_rate": 7.993706293706294e-07, "loss": 0.339, "step": 46290 }, { "epoch": 40.12, "learning_rate": 7.986713286713286e-07, "loss": 0.3293, "step": 46300 }, { "epoch": 40.13, "learning_rate": 7.979720279720279e-07, "loss": 0.434, "step": 46310 }, { "epoch": 40.14, "learning_rate": 7.972727272727272e-07, "loss": 0.3497, "step": 46320 }, { "epoch": 40.15, "learning_rate": 7.965734265734266e-07, "loss": 0.3962, "step": 46330 }, { "epoch": 40.16, "learning_rate": 7.958741258741259e-07, "loss": 0.3041, "step": 46340 }, { "epoch": 40.16, "learning_rate": 7.951748251748251e-07, "loss": 0.3659, "step": 46350 }, { "epoch": 40.17, "learning_rate": 7.944755244755244e-07, "loss": 0.3684, "step": 46360 }, { "epoch": 40.18, "learning_rate": 7.937762237762238e-07, "loss": 0.3591, "step": 46370 }, { "epoch": 40.19, "learning_rate": 7.930769230769231e-07, "loss": 0.3384, "step": 46380 }, { "epoch": 40.2, "learning_rate": 7.923776223776223e-07, "loss": 0.3565, "step": 46390 }, { "epoch": 40.21, "learning_rate": 7.916783216783216e-07, "loss": 0.3494, "step": 46400 }, { "epoch": 40.22, "learning_rate": 7.90979020979021e-07, "loss": 0.3633, "step": 46410 }, { "epoch": 40.23, "learning_rate": 7.902797202797202e-07, "loss": 0.3559, "step": 46420 }, { "epoch": 40.23, "learning_rate": 7.895804195804195e-07, "loss": 0.3643, "step": 46430 }, { "epoch": 40.24, "learning_rate": 7.888811188811188e-07, "loss": 0.3674, "step": 46440 }, { "epoch": 40.25, "learning_rate": 7.881818181818182e-07, "loss": 0.3457, "step": 46450 }, { "epoch": 40.26, "learning_rate": 7.874825174825175e-07, "loss": 0.428, "step": 46460 }, { "epoch": 40.27, "learning_rate": 7.867832167832168e-07, "loss": 0.3056, "step": 46470 }, { "epoch": 40.28, "learning_rate": 7.86083916083916e-07, "loss": 0.3643, "step": 46480 }, { "epoch": 40.29, "learning_rate": 7.853846153846153e-07, "loss": 0.3634, "step": 46490 }, { "epoch": 40.29, "learning_rate": 7.846853146853146e-07, "loss": 0.3273, "step": 46500 }, { "epoch": 40.3, "learning_rate": 7.839860139860139e-07, "loss": 0.3266, "step": 46510 }, { "epoch": 40.31, "learning_rate": 7.832867132867133e-07, "loss": 0.386, "step": 46520 }, { "epoch": 40.32, "learning_rate": 7.825874125874126e-07, "loss": 0.3992, "step": 46530 }, { "epoch": 40.33, "learning_rate": 7.818881118881119e-07, "loss": 0.3818, "step": 46540 }, { "epoch": 40.34, "learning_rate": 7.811888111888112e-07, "loss": 0.3936, "step": 46550 }, { "epoch": 40.35, "learning_rate": 7.804895104895105e-07, "loss": 0.3577, "step": 46560 }, { "epoch": 40.36, "learning_rate": 7.797902097902097e-07, "loss": 0.3625, "step": 46570 }, { "epoch": 40.36, "learning_rate": 7.79090909090909e-07, "loss": 0.325, "step": 46580 }, { "epoch": 40.37, "learning_rate": 7.783916083916083e-07, "loss": 0.2867, "step": 46590 }, { "epoch": 40.38, "learning_rate": 7.776923076923077e-07, "loss": 0.3772, "step": 46600 }, { "epoch": 40.39, "learning_rate": 7.76993006993007e-07, "loss": 0.4338, "step": 46610 }, { "epoch": 40.4, "learning_rate": 7.762937062937063e-07, "loss": 0.2842, "step": 46620 }, { "epoch": 40.41, "learning_rate": 7.755944055944055e-07, "loss": 0.3428, "step": 46630 }, { "epoch": 40.42, "learning_rate": 7.748951048951049e-07, "loss": 0.3017, "step": 46640 }, { "epoch": 40.42, "learning_rate": 7.741958041958042e-07, "loss": 0.377, "step": 46650 }, { "epoch": 40.43, "learning_rate": 7.734965034965034e-07, "loss": 0.3507, "step": 46660 }, { "epoch": 40.44, "learning_rate": 7.727972027972027e-07, "loss": 0.4011, "step": 46670 }, { "epoch": 40.45, "learning_rate": 7.720979020979021e-07, "loss": 0.3269, "step": 46680 }, { "epoch": 40.46, "learning_rate": 7.713986013986014e-07, "loss": 0.3637, "step": 46690 }, { "epoch": 40.47, "learning_rate": 7.706993006993006e-07, "loss": 0.3921, "step": 46700 }, { "epoch": 40.48, "learning_rate": 7.699999999999999e-07, "loss": 0.3854, "step": 46710 }, { "epoch": 40.49, "learning_rate": 7.693006993006993e-07, "loss": 0.3721, "step": 46720 }, { "epoch": 40.49, "learning_rate": 7.686013986013986e-07, "loss": 0.3072, "step": 46730 }, { "epoch": 40.5, "learning_rate": 7.679020979020979e-07, "loss": 0.3823, "step": 46740 }, { "epoch": 40.51, "learning_rate": 7.672027972027971e-07, "loss": 0.428, "step": 46750 }, { "epoch": 40.52, "learning_rate": 7.665034965034965e-07, "loss": 0.391, "step": 46760 }, { "epoch": 40.53, "learning_rate": 7.658041958041958e-07, "loss": 0.388, "step": 46770 }, { "epoch": 40.54, "learning_rate": 7.65104895104895e-07, "loss": 0.3316, "step": 46780 }, { "epoch": 40.55, "learning_rate": 7.644055944055944e-07, "loss": 0.3006, "step": 46790 }, { "epoch": 40.55, "learning_rate": 7.637062937062937e-07, "loss": 0.3454, "step": 46800 }, { "epoch": 40.56, "learning_rate": 7.63006993006993e-07, "loss": 0.3911, "step": 46810 }, { "epoch": 40.57, "learning_rate": 7.623076923076923e-07, "loss": 0.4216, "step": 46820 }, { "epoch": 40.58, "learning_rate": 7.616083916083916e-07, "loss": 0.3473, "step": 46830 }, { "epoch": 40.59, "learning_rate": 7.609090909090909e-07, "loss": 0.318, "step": 46840 }, { "epoch": 40.6, "learning_rate": 7.602097902097901e-07, "loss": 0.3566, "step": 46850 }, { "epoch": 40.61, "learning_rate": 7.595104895104894e-07, "loss": 0.4275, "step": 46860 }, { "epoch": 40.61, "learning_rate": 7.588111888111888e-07, "loss": 0.3429, "step": 46870 }, { "epoch": 40.62, "learning_rate": 7.581118881118881e-07, "loss": 0.3497, "step": 46880 }, { "epoch": 40.63, "learning_rate": 7.574125874125874e-07, "loss": 0.3578, "step": 46890 }, { "epoch": 40.64, "learning_rate": 7.567132867132867e-07, "loss": 0.3595, "step": 46900 }, { "epoch": 40.65, "learning_rate": 7.560139860139861e-07, "loss": 0.3588, "step": 46910 }, { "epoch": 40.66, "learning_rate": 7.553146853146852e-07, "loss": 0.3881, "step": 46920 }, { "epoch": 40.67, "learning_rate": 7.546153846153845e-07, "loss": 0.3375, "step": 46930 }, { "epoch": 40.68, "learning_rate": 7.539160839160838e-07, "loss": 0.304, "step": 46940 }, { "epoch": 40.68, "learning_rate": 7.532167832167832e-07, "loss": 0.3907, "step": 46950 }, { "epoch": 40.69, "learning_rate": 7.525174825174825e-07, "loss": 0.3802, "step": 46960 }, { "epoch": 40.7, "learning_rate": 7.518181818181818e-07, "loss": 0.3624, "step": 46970 }, { "epoch": 40.71, "learning_rate": 7.511188811188811e-07, "loss": 0.3823, "step": 46980 }, { "epoch": 40.72, "learning_rate": 7.504195804195804e-07, "loss": 0.3714, "step": 46990 }, { "epoch": 40.73, "learning_rate": 7.497202797202797e-07, "loss": 0.3438, "step": 47000 }, { "epoch": 40.74, "learning_rate": 7.490209790209789e-07, "loss": 0.3373, "step": 47010 }, { "epoch": 40.74, "learning_rate": 7.483216783216783e-07, "loss": 0.3587, "step": 47020 }, { "epoch": 40.75, "learning_rate": 7.476223776223776e-07, "loss": 0.3786, "step": 47030 }, { "epoch": 40.76, "learning_rate": 7.469230769230769e-07, "loss": 0.3028, "step": 47040 }, { "epoch": 40.77, "learning_rate": 7.462237762237762e-07, "loss": 0.3495, "step": 47050 }, { "epoch": 40.78, "learning_rate": 7.455244755244756e-07, "loss": 0.3871, "step": 47060 }, { "epoch": 40.79, "learning_rate": 7.448251748251748e-07, "loss": 0.3675, "step": 47070 }, { "epoch": 40.8, "learning_rate": 7.441258741258741e-07, "loss": 0.3547, "step": 47080 }, { "epoch": 40.81, "learning_rate": 7.434265734265734e-07, "loss": 0.3329, "step": 47090 }, { "epoch": 40.81, "learning_rate": 7.427272727272727e-07, "loss": 0.3788, "step": 47100 }, { "epoch": 40.82, "learning_rate": 7.42027972027972e-07, "loss": 0.3157, "step": 47110 }, { "epoch": 40.83, "learning_rate": 7.413286713286713e-07, "loss": 0.3474, "step": 47120 }, { "epoch": 40.84, "learning_rate": 7.406293706293705e-07, "loss": 0.3536, "step": 47130 }, { "epoch": 40.85, "learning_rate": 7.399300699300699e-07, "loss": 0.3388, "step": 47140 }, { "epoch": 40.86, "learning_rate": 7.392307692307692e-07, "loss": 0.3879, "step": 47150 }, { "epoch": 40.87, "learning_rate": 7.385314685314685e-07, "loss": 0.4051, "step": 47160 }, { "epoch": 40.87, "learning_rate": 7.378321678321678e-07, "loss": 0.3227, "step": 47170 }, { "epoch": 40.88, "learning_rate": 7.371328671328672e-07, "loss": 0.3035, "step": 47180 }, { "epoch": 40.89, "learning_rate": 7.364335664335664e-07, "loss": 0.3333, "step": 47190 }, { "epoch": 40.9, "learning_rate": 7.357342657342656e-07, "loss": 0.3611, "step": 47200 }, { "epoch": 40.91, "learning_rate": 7.350349650349649e-07, "loss": 0.4021, "step": 47210 }, { "epoch": 40.92, "learning_rate": 7.343356643356643e-07, "loss": 0.3797, "step": 47220 }, { "epoch": 40.93, "learning_rate": 7.336363636363636e-07, "loss": 0.3672, "step": 47230 }, { "epoch": 40.94, "learning_rate": 7.329370629370629e-07, "loss": 0.3057, "step": 47240 }, { "epoch": 40.94, "learning_rate": 7.322377622377623e-07, "loss": 0.3187, "step": 47250 }, { "epoch": 40.95, "learning_rate": 7.315384615384616e-07, "loss": 0.3606, "step": 47260 }, { "epoch": 40.96, "learning_rate": 7.308391608391608e-07, "loss": 0.3516, "step": 47270 }, { "epoch": 40.97, "learning_rate": 7.3013986013986e-07, "loss": 0.3528, "step": 47280 }, { "epoch": 40.98, "learning_rate": 7.294405594405594e-07, "loss": 0.397, "step": 47290 }, { "epoch": 40.99, "learning_rate": 7.287412587412587e-07, "loss": 0.3507, "step": 47300 }, { "epoch": 41.0, "learning_rate": 7.28041958041958e-07, "loss": 0.3513, "step": 47310 }, { "epoch": 41.0, "eval_loss": 0.559901773929596, "eval_runtime": 136.925, "eval_samples_per_second": 3.885, "eval_steps_per_second": 1.943, "eval_wer": 0.24201324162756316, "step": 47314 }, { "epoch": 41.01, "learning_rate": 7.273426573426573e-07, "loss": 0.3905, "step": 47320 }, { "epoch": 41.01, "learning_rate": 7.266433566433567e-07, "loss": 0.3763, "step": 47330 }, { "epoch": 41.02, "learning_rate": 7.25944055944056e-07, "loss": 0.3119, "step": 47340 }, { "epoch": 41.03, "learning_rate": 7.252447552447552e-07, "loss": 0.3404, "step": 47350 }, { "epoch": 41.04, "learning_rate": 7.245454545454544e-07, "loss": 0.3944, "step": 47360 }, { "epoch": 41.05, "learning_rate": 7.238461538461538e-07, "loss": 0.4, "step": 47370 }, { "epoch": 41.06, "learning_rate": 7.231468531468531e-07, "loss": 0.3483, "step": 47380 }, { "epoch": 41.07, "learning_rate": 7.224475524475524e-07, "loss": 0.345, "step": 47390 }, { "epoch": 41.07, "learning_rate": 7.217482517482517e-07, "loss": 0.3332, "step": 47400 }, { "epoch": 41.08, "learning_rate": 7.210489510489511e-07, "loss": 0.3213, "step": 47410 }, { "epoch": 41.09, "learning_rate": 7.203496503496503e-07, "loss": 0.3375, "step": 47420 }, { "epoch": 41.1, "learning_rate": 7.196503496503496e-07, "loss": 0.3356, "step": 47430 }, { "epoch": 41.11, "learning_rate": 7.189510489510489e-07, "loss": 0.3306, "step": 47440 }, { "epoch": 41.12, "learning_rate": 7.182517482517482e-07, "loss": 0.4358, "step": 47450 }, { "epoch": 41.13, "learning_rate": 7.175524475524475e-07, "loss": 0.4413, "step": 47460 }, { "epoch": 41.14, "learning_rate": 7.168531468531468e-07, "loss": 0.3332, "step": 47470 }, { "epoch": 41.14, "learning_rate": 7.161538461538461e-07, "loss": 0.369, "step": 47480 }, { "epoch": 41.15, "learning_rate": 7.154545454545454e-07, "loss": 0.3748, "step": 47490 }, { "epoch": 41.16, "learning_rate": 7.147552447552447e-07, "loss": 0.3464, "step": 47500 }, { "epoch": 41.17, "learning_rate": 7.14055944055944e-07, "loss": 0.3844, "step": 47510 }, { "epoch": 41.18, "learning_rate": 7.133566433566434e-07, "loss": 0.3767, "step": 47520 }, { "epoch": 41.19, "learning_rate": 7.126573426573427e-07, "loss": 0.3676, "step": 47530 }, { "epoch": 41.2, "learning_rate": 7.119580419580419e-07, "loss": 0.3877, "step": 47540 }, { "epoch": 41.2, "learning_rate": 7.112587412587412e-07, "loss": 0.3902, "step": 47550 }, { "epoch": 41.21, "learning_rate": 7.105594405594406e-07, "loss": 0.3718, "step": 47560 }, { "epoch": 41.22, "learning_rate": 7.098601398601398e-07, "loss": 0.3501, "step": 47570 }, { "epoch": 41.23, "learning_rate": 7.091608391608391e-07, "loss": 0.3736, "step": 47580 }, { "epoch": 41.24, "learning_rate": 7.084615384615384e-07, "loss": 0.3599, "step": 47590 }, { "epoch": 41.25, "learning_rate": 7.077622377622378e-07, "loss": 0.3664, "step": 47600 }, { "epoch": 41.26, "learning_rate": 7.070629370629371e-07, "loss": 0.3893, "step": 47610 }, { "epoch": 41.27, "learning_rate": 7.063636363636364e-07, "loss": 0.3887, "step": 47620 }, { "epoch": 41.27, "learning_rate": 7.056643356643355e-07, "loss": 0.3254, "step": 47630 }, { "epoch": 41.28, "learning_rate": 7.049650349650349e-07, "loss": 0.3702, "step": 47640 }, { "epoch": 41.29, "learning_rate": 7.042657342657342e-07, "loss": 0.3874, "step": 47650 }, { "epoch": 41.3, "learning_rate": 7.035664335664335e-07, "loss": 0.3469, "step": 47660 }, { "epoch": 41.31, "learning_rate": 7.028671328671328e-07, "loss": 0.3587, "step": 47670 }, { "epoch": 41.32, "learning_rate": 7.021678321678322e-07, "loss": 0.3572, "step": 47680 }, { "epoch": 41.33, "learning_rate": 7.014685314685315e-07, "loss": 0.3382, "step": 47690 }, { "epoch": 41.33, "learning_rate": 7.007692307692308e-07, "loss": 0.3692, "step": 47700 }, { "epoch": 41.34, "learning_rate": 7.0006993006993e-07, "loss": 0.3552, "step": 47710 }, { "epoch": 41.35, "learning_rate": 6.993706293706293e-07, "loss": 0.3536, "step": 47720 }, { "epoch": 41.36, "learning_rate": 6.986713286713286e-07, "loss": 0.3274, "step": 47730 }, { "epoch": 41.37, "learning_rate": 6.979720279720279e-07, "loss": 0.368, "step": 47740 }, { "epoch": 41.38, "learning_rate": 6.972727272727273e-07, "loss": 0.4008, "step": 47750 }, { "epoch": 41.39, "learning_rate": 6.965734265734266e-07, "loss": 0.3336, "step": 47760 }, { "epoch": 41.39, "learning_rate": 6.958741258741259e-07, "loss": 0.3342, "step": 47770 }, { "epoch": 41.4, "learning_rate": 6.951748251748251e-07, "loss": 0.3587, "step": 47780 }, { "epoch": 41.41, "learning_rate": 6.944755244755245e-07, "loss": 0.371, "step": 47790 }, { "epoch": 41.42, "learning_rate": 6.937762237762237e-07, "loss": 0.3359, "step": 47800 }, { "epoch": 41.43, "learning_rate": 6.93076923076923e-07, "loss": 0.3806, "step": 47810 }, { "epoch": 41.44, "learning_rate": 6.923776223776223e-07, "loss": 0.369, "step": 47820 }, { "epoch": 41.45, "learning_rate": 6.916783216783217e-07, "loss": 0.3462, "step": 47830 }, { "epoch": 41.46, "learning_rate": 6.90979020979021e-07, "loss": 0.2829, "step": 47840 }, { "epoch": 41.46, "learning_rate": 6.902797202797202e-07, "loss": 0.3493, "step": 47850 }, { "epoch": 41.47, "learning_rate": 6.895804195804195e-07, "loss": 0.3654, "step": 47860 }, { "epoch": 41.48, "learning_rate": 6.888811188811189e-07, "loss": 0.3211, "step": 47870 }, { "epoch": 41.49, "learning_rate": 6.881818181818182e-07, "loss": 0.3532, "step": 47880 }, { "epoch": 41.5, "learning_rate": 6.874825174825174e-07, "loss": 0.3522, "step": 47890 }, { "epoch": 41.51, "learning_rate": 6.867832167832167e-07, "loss": 0.3524, "step": 47900 }, { "epoch": 41.52, "learning_rate": 6.860839160839161e-07, "loss": 0.3416, "step": 47910 }, { "epoch": 41.52, "learning_rate": 6.853846153846153e-07, "loss": 0.3726, "step": 47920 }, { "epoch": 41.53, "learning_rate": 6.846853146853146e-07, "loss": 0.3733, "step": 47930 }, { "epoch": 41.54, "learning_rate": 6.839860139860139e-07, "loss": 0.3302, "step": 47940 }, { "epoch": 41.55, "learning_rate": 6.832867132867133e-07, "loss": 0.368, "step": 47950 }, { "epoch": 41.56, "learning_rate": 6.825874125874126e-07, "loss": 0.3841, "step": 47960 }, { "epoch": 41.57, "learning_rate": 6.818881118881119e-07, "loss": 0.3956, "step": 47970 }, { "epoch": 41.58, "learning_rate": 6.811888111888111e-07, "loss": 0.3752, "step": 47980 }, { "epoch": 41.59, "learning_rate": 6.804895104895104e-07, "loss": 0.3636, "step": 47990 }, { "epoch": 41.59, "learning_rate": 6.797902097902097e-07, "loss": 0.3978, "step": 48000 }, { "epoch": 41.6, "learning_rate": 6.79090909090909e-07, "loss": 0.368, "step": 48010 }, { "epoch": 41.61, "learning_rate": 6.783916083916084e-07, "loss": 0.4165, "step": 48020 }, { "epoch": 41.62, "learning_rate": 6.776923076923077e-07, "loss": 0.3761, "step": 48030 }, { "epoch": 41.63, "learning_rate": 6.76993006993007e-07, "loss": 0.3411, "step": 48040 }, { "epoch": 41.64, "learning_rate": 6.762937062937063e-07, "loss": 0.3551, "step": 48050 }, { "epoch": 41.65, "learning_rate": 6.755944055944057e-07, "loss": 0.4011, "step": 48060 }, { "epoch": 41.65, "learning_rate": 6.748951048951048e-07, "loss": 0.3244, "step": 48070 }, { "epoch": 41.66, "learning_rate": 6.741958041958041e-07, "loss": 0.3954, "step": 48080 }, { "epoch": 41.67, "learning_rate": 6.734965034965034e-07, "loss": 0.3258, "step": 48090 }, { "epoch": 41.68, "learning_rate": 6.727972027972028e-07, "loss": 0.3887, "step": 48100 }, { "epoch": 41.69, "learning_rate": 6.720979020979021e-07, "loss": 0.3747, "step": 48110 }, { "epoch": 41.7, "learning_rate": 6.713986013986014e-07, "loss": 0.4292, "step": 48120 }, { "epoch": 41.71, "learning_rate": 6.706993006993007e-07, "loss": 0.3614, "step": 48130 }, { "epoch": 41.72, "learning_rate": 6.7e-07, "loss": 0.3716, "step": 48140 }, { "epoch": 41.72, "learning_rate": 6.693006993006993e-07, "loss": 0.3525, "step": 48150 }, { "epoch": 41.73, "learning_rate": 6.686013986013985e-07, "loss": 0.379, "step": 48160 }, { "epoch": 41.74, "learning_rate": 6.679020979020978e-07, "loss": 0.3761, "step": 48170 }, { "epoch": 41.75, "learning_rate": 6.672027972027972e-07, "loss": 0.4308, "step": 48180 }, { "epoch": 41.76, "learning_rate": 6.665034965034965e-07, "loss": 0.3468, "step": 48190 }, { "epoch": 41.77, "learning_rate": 6.658041958041958e-07, "loss": 0.3229, "step": 48200 }, { "epoch": 41.78, "learning_rate": 6.65104895104895e-07, "loss": 0.3045, "step": 48210 }, { "epoch": 41.78, "learning_rate": 6.644055944055944e-07, "loss": 0.3951, "step": 48220 }, { "epoch": 41.79, "learning_rate": 6.637062937062937e-07, "loss": 0.352, "step": 48230 }, { "epoch": 41.8, "learning_rate": 6.63006993006993e-07, "loss": 0.2722, "step": 48240 }, { "epoch": 41.81, "learning_rate": 6.623076923076923e-07, "loss": 0.3191, "step": 48250 }, { "epoch": 41.82, "learning_rate": 6.616083916083916e-07, "loss": 0.3697, "step": 48260 }, { "epoch": 41.83, "learning_rate": 6.609090909090909e-07, "loss": 0.3631, "step": 48270 }, { "epoch": 41.84, "learning_rate": 6.602097902097901e-07, "loss": 0.3518, "step": 48280 }, { "epoch": 41.85, "learning_rate": 6.595104895104895e-07, "loss": 0.2858, "step": 48290 }, { "epoch": 41.85, "learning_rate": 6.588111888111888e-07, "loss": 0.3709, "step": 48300 }, { "epoch": 41.86, "learning_rate": 6.581118881118881e-07, "loss": 0.3929, "step": 48310 }, { "epoch": 41.87, "learning_rate": 6.574125874125874e-07, "loss": 0.3, "step": 48320 }, { "epoch": 41.88, "learning_rate": 6.567132867132867e-07, "loss": 0.3737, "step": 48330 }, { "epoch": 41.89, "learning_rate": 6.56013986013986e-07, "loss": 0.3676, "step": 48340 }, { "epoch": 41.9, "learning_rate": 6.553146853146852e-07, "loss": 0.373, "step": 48350 }, { "epoch": 41.91, "learning_rate": 6.546153846153845e-07, "loss": 0.3846, "step": 48360 }, { "epoch": 41.91, "learning_rate": 6.539160839160839e-07, "loss": 0.3561, "step": 48370 }, { "epoch": 41.92, "learning_rate": 6.532167832167832e-07, "loss": 0.3453, "step": 48380 }, { "epoch": 41.93, "learning_rate": 6.525174825174825e-07, "loss": 0.3311, "step": 48390 }, { "epoch": 41.94, "learning_rate": 6.518181818181818e-07, "loss": 0.3983, "step": 48400 }, { "epoch": 41.95, "learning_rate": 6.511188811188812e-07, "loss": 0.3875, "step": 48410 }, { "epoch": 41.96, "learning_rate": 6.504195804195803e-07, "loss": 0.3334, "step": 48420 }, { "epoch": 41.97, "learning_rate": 6.497202797202796e-07, "loss": 0.4028, "step": 48430 }, { "epoch": 41.98, "learning_rate": 6.490209790209789e-07, "loss": 0.3421, "step": 48440 }, { "epoch": 41.98, "learning_rate": 6.483216783216783e-07, "loss": 0.3155, "step": 48450 }, { "epoch": 41.99, "learning_rate": 6.476223776223776e-07, "loss": 0.3739, "step": 48460 }, { "epoch": 42.0, "eval_loss": 0.5668932199478149, "eval_runtime": 136.0754, "eval_samples_per_second": 3.91, "eval_steps_per_second": 1.955, "eval_wer": 0.24175612264575433, "step": 48468 }, { "epoch": 42.0, "learning_rate": 6.469230769230769e-07, "loss": 0.3767, "step": 48470 }, { "epoch": 42.01, "learning_rate": 6.462237762237763e-07, "loss": 0.389, "step": 48480 }, { "epoch": 42.02, "learning_rate": 6.455244755244756e-07, "loss": 0.3434, "step": 48490 }, { "epoch": 42.03, "learning_rate": 6.448251748251748e-07, "loss": 0.3547, "step": 48500 }, { "epoch": 42.04, "learning_rate": 6.44125874125874e-07, "loss": 0.3653, "step": 48510 }, { "epoch": 42.05, "learning_rate": 6.434265734265734e-07, "loss": 0.357, "step": 48520 }, { "epoch": 42.05, "learning_rate": 6.427272727272727e-07, "loss": 0.3694, "step": 48530 }, { "epoch": 42.06, "learning_rate": 6.42027972027972e-07, "loss": 0.3616, "step": 48540 }, { "epoch": 42.07, "learning_rate": 6.413286713286713e-07, "loss": 0.3419, "step": 48550 }, { "epoch": 42.08, "learning_rate": 6.406293706293707e-07, "loss": 0.385, "step": 48560 }, { "epoch": 42.09, "learning_rate": 6.399300699300699e-07, "loss": 0.3177, "step": 48570 }, { "epoch": 42.1, "learning_rate": 6.392307692307692e-07, "loss": 0.3408, "step": 48580 }, { "epoch": 42.11, "learning_rate": 6.385314685314685e-07, "loss": 0.3393, "step": 48590 }, { "epoch": 42.11, "learning_rate": 6.378321678321678e-07, "loss": 0.3989, "step": 48600 }, { "epoch": 42.12, "learning_rate": 6.371328671328671e-07, "loss": 0.3204, "step": 48610 }, { "epoch": 42.13, "learning_rate": 6.364335664335664e-07, "loss": 0.3511, "step": 48620 }, { "epoch": 42.14, "learning_rate": 6.357342657342657e-07, "loss": 0.3581, "step": 48630 }, { "epoch": 42.15, "learning_rate": 6.35034965034965e-07, "loss": 0.3515, "step": 48640 }, { "epoch": 42.16, "learning_rate": 6.343356643356643e-07, "loss": 0.3076, "step": 48650 }, { "epoch": 42.17, "learning_rate": 6.336363636363636e-07, "loss": 0.3228, "step": 48660 }, { "epoch": 42.17, "learning_rate": 6.329370629370629e-07, "loss": 0.3846, "step": 48670 }, { "epoch": 42.18, "learning_rate": 6.322377622377623e-07, "loss": 0.3596, "step": 48680 }, { "epoch": 42.19, "learning_rate": 6.315384615384615e-07, "loss": 0.2774, "step": 48690 }, { "epoch": 42.2, "learning_rate": 6.308391608391608e-07, "loss": 0.299, "step": 48700 }, { "epoch": 42.21, "learning_rate": 6.3013986013986e-07, "loss": 0.3831, "step": 48710 }, { "epoch": 42.22, "learning_rate": 6.294405594405594e-07, "loss": 0.3012, "step": 48720 }, { "epoch": 42.23, "learning_rate": 6.287412587412587e-07, "loss": 0.4169, "step": 48730 }, { "epoch": 42.24, "learning_rate": 6.28041958041958e-07, "loss": 0.3375, "step": 48740 }, { "epoch": 42.24, "learning_rate": 6.273426573426574e-07, "loss": 0.3376, "step": 48750 }, { "epoch": 42.25, "learning_rate": 6.266433566433567e-07, "loss": 0.3196, "step": 48760 }, { "epoch": 42.26, "learning_rate": 6.25944055944056e-07, "loss": 0.353, "step": 48770 }, { "epoch": 42.27, "learning_rate": 6.252447552447551e-07, "loss": 0.359, "step": 48780 }, { "epoch": 42.28, "learning_rate": 6.245454545454545e-07, "loss": 0.3557, "step": 48790 }, { "epoch": 42.29, "learning_rate": 6.238461538461538e-07, "loss": 0.3828, "step": 48800 }, { "epoch": 42.3, "learning_rate": 6.231468531468531e-07, "loss": 0.4027, "step": 48810 }, { "epoch": 42.3, "learning_rate": 6.224475524475524e-07, "loss": 0.3855, "step": 48820 }, { "epoch": 42.31, "learning_rate": 6.217482517482518e-07, "loss": 0.3452, "step": 48830 }, { "epoch": 42.32, "learning_rate": 6.210489510489511e-07, "loss": 0.4077, "step": 48840 }, { "epoch": 42.33, "learning_rate": 6.203496503496504e-07, "loss": 0.3513, "step": 48850 }, { "epoch": 42.34, "learning_rate": 6.196503496503495e-07, "loss": 0.4098, "step": 48860 }, { "epoch": 42.35, "learning_rate": 6.189510489510489e-07, "loss": 0.3481, "step": 48870 }, { "epoch": 42.36, "learning_rate": 6.182517482517482e-07, "loss": 0.3485, "step": 48880 }, { "epoch": 42.37, "learning_rate": 6.175524475524475e-07, "loss": 0.322, "step": 48890 }, { "epoch": 42.37, "learning_rate": 6.168531468531468e-07, "loss": 0.3485, "step": 48900 }, { "epoch": 42.38, "learning_rate": 6.161538461538462e-07, "loss": 0.3846, "step": 48910 }, { "epoch": 42.39, "learning_rate": 6.154545454545455e-07, "loss": 0.3714, "step": 48920 }, { "epoch": 42.4, "learning_rate": 6.147552447552447e-07, "loss": 0.3733, "step": 48930 }, { "epoch": 42.41, "learning_rate": 6.14055944055944e-07, "loss": 0.3456, "step": 48940 }, { "epoch": 42.42, "learning_rate": 6.133566433566433e-07, "loss": 0.3564, "step": 48950 }, { "epoch": 42.43, "learning_rate": 6.126573426573426e-07, "loss": 0.3668, "step": 48960 }, { "epoch": 42.43, "learning_rate": 6.119580419580419e-07, "loss": 0.3504, "step": 48970 }, { "epoch": 42.44, "learning_rate": 6.112587412587413e-07, "loss": 0.3736, "step": 48980 }, { "epoch": 42.45, "learning_rate": 6.105594405594406e-07, "loss": 0.4041, "step": 48990 }, { "epoch": 42.46, "learning_rate": 6.098601398601398e-07, "loss": 0.4201, "step": 49000 }, { "epoch": 42.47, "learning_rate": 6.091608391608391e-07, "loss": 0.3436, "step": 49010 }, { "epoch": 42.48, "learning_rate": 6.084615384615385e-07, "loss": 0.3663, "step": 49020 }, { "epoch": 42.49, "learning_rate": 6.077622377622378e-07, "loss": 0.3723, "step": 49030 }, { "epoch": 42.5, "learning_rate": 6.07062937062937e-07, "loss": 0.3465, "step": 49040 }, { "epoch": 42.5, "learning_rate": 6.063636363636363e-07, "loss": 0.3464, "step": 49050 }, { "epoch": 42.51, "learning_rate": 6.056643356643357e-07, "loss": 0.3682, "step": 49060 }, { "epoch": 42.52, "learning_rate": 6.049650349650349e-07, "loss": 0.3549, "step": 49070 }, { "epoch": 42.53, "learning_rate": 6.042657342657342e-07, "loss": 0.397, "step": 49080 }, { "epoch": 42.54, "learning_rate": 6.035664335664335e-07, "loss": 0.3514, "step": 49090 }, { "epoch": 42.55, "learning_rate": 6.028671328671329e-07, "loss": 0.3532, "step": 49100 }, { "epoch": 42.56, "learning_rate": 6.021678321678322e-07, "loss": 0.3897, "step": 49110 }, { "epoch": 42.56, "learning_rate": 6.014685314685315e-07, "loss": 0.3663, "step": 49120 }, { "epoch": 42.57, "learning_rate": 6.007692307692307e-07, "loss": 0.3393, "step": 49130 }, { "epoch": 42.58, "learning_rate": 6.0006993006993e-07, "loss": 0.3473, "step": 49140 }, { "epoch": 42.59, "learning_rate": 5.993706293706293e-07, "loss": 0.3699, "step": 49150 }, { "epoch": 42.6, "learning_rate": 5.986713286713286e-07, "loss": 0.4025, "step": 49160 }, { "epoch": 42.61, "learning_rate": 5.979720279720279e-07, "loss": 0.3543, "step": 49170 }, { "epoch": 42.62, "learning_rate": 5.972727272727273e-07, "loss": 0.3318, "step": 49180 }, { "epoch": 42.63, "learning_rate": 5.965734265734266e-07, "loss": 0.3419, "step": 49190 }, { "epoch": 42.63, "learning_rate": 5.958741258741259e-07, "loss": 0.3452, "step": 49200 }, { "epoch": 42.64, "learning_rate": 5.951748251748253e-07, "loss": 0.385, "step": 49210 }, { "epoch": 42.65, "learning_rate": 5.944755244755244e-07, "loss": 0.4066, "step": 49220 }, { "epoch": 42.66, "learning_rate": 5.937762237762237e-07, "loss": 0.3566, "step": 49230 }, { "epoch": 42.67, "learning_rate": 5.93076923076923e-07, "loss": 0.3442, "step": 49240 }, { "epoch": 42.68, "learning_rate": 5.923776223776224e-07, "loss": 0.3464, "step": 49250 }, { "epoch": 42.69, "learning_rate": 5.916783216783217e-07, "loss": 0.3406, "step": 49260 }, { "epoch": 42.69, "learning_rate": 5.90979020979021e-07, "loss": 0.3679, "step": 49270 }, { "epoch": 42.7, "learning_rate": 5.902797202797202e-07, "loss": 0.3481, "step": 49280 }, { "epoch": 42.71, "learning_rate": 5.895804195804196e-07, "loss": 0.3361, "step": 49290 }, { "epoch": 42.72, "learning_rate": 5.888811188811188e-07, "loss": 0.3668, "step": 49300 }, { "epoch": 42.73, "learning_rate": 5.881818181818181e-07, "loss": 0.3632, "step": 49310 }, { "epoch": 42.74, "learning_rate": 5.874825174825174e-07, "loss": 0.391, "step": 49320 }, { "epoch": 42.75, "learning_rate": 5.867832167832168e-07, "loss": 0.3493, "step": 49330 }, { "epoch": 42.76, "learning_rate": 5.860839160839161e-07, "loss": 0.3616, "step": 49340 }, { "epoch": 42.76, "learning_rate": 5.853846153846154e-07, "loss": 0.4051, "step": 49350 }, { "epoch": 42.77, "learning_rate": 5.846853146853146e-07, "loss": 0.3538, "step": 49360 }, { "epoch": 42.78, "learning_rate": 5.83986013986014e-07, "loss": 0.4155, "step": 49370 }, { "epoch": 42.79, "learning_rate": 5.832867132867133e-07, "loss": 0.3261, "step": 49380 }, { "epoch": 42.8, "learning_rate": 5.825874125874125e-07, "loss": 0.3531, "step": 49390 }, { "epoch": 42.81, "learning_rate": 5.818881118881118e-07, "loss": 0.3218, "step": 49400 }, { "epoch": 42.82, "learning_rate": 5.811888111888112e-07, "loss": 0.3846, "step": 49410 }, { "epoch": 42.82, "learning_rate": 5.804895104895105e-07, "loss": 0.3391, "step": 49420 }, { "epoch": 42.83, "learning_rate": 5.797902097902097e-07, "loss": 0.345, "step": 49430 }, { "epoch": 42.84, "learning_rate": 5.79090909090909e-07, "loss": 0.3244, "step": 49440 }, { "epoch": 42.85, "learning_rate": 5.783916083916084e-07, "loss": 0.386, "step": 49450 }, { "epoch": 42.86, "learning_rate": 5.776923076923077e-07, "loss": 0.4148, "step": 49460 }, { "epoch": 42.87, "learning_rate": 5.76993006993007e-07, "loss": 0.3254, "step": 49470 }, { "epoch": 42.88, "learning_rate": 5.762937062937062e-07, "loss": 0.3659, "step": 49480 }, { "epoch": 42.89, "learning_rate": 5.755944055944056e-07, "loss": 0.3793, "step": 49490 }, { "epoch": 42.89, "learning_rate": 5.748951048951048e-07, "loss": 0.3521, "step": 49500 }, { "epoch": 42.9, "learning_rate": 5.741958041958041e-07, "loss": 0.3591, "step": 49510 }, { "epoch": 42.91, "learning_rate": 5.734965034965035e-07, "loss": 0.3978, "step": 49520 }, { "epoch": 42.92, "learning_rate": 5.727972027972028e-07, "loss": 0.3468, "step": 49530 }, { "epoch": 42.93, "learning_rate": 5.720979020979021e-07, "loss": 0.381, "step": 49540 }, { "epoch": 42.94, "learning_rate": 5.713986013986014e-07, "loss": 0.3439, "step": 49550 }, { "epoch": 42.95, "learning_rate": 5.706993006993008e-07, "loss": 0.3546, "step": 49560 }, { "epoch": 42.95, "learning_rate": 5.699999999999999e-07, "loss": 0.3392, "step": 49570 }, { "epoch": 42.96, "learning_rate": 5.693006993006992e-07, "loss": 0.3253, "step": 49580 }, { "epoch": 42.97, "learning_rate": 5.686013986013985e-07, "loss": 0.3876, "step": 49590 }, { "epoch": 42.98, "learning_rate": 5.679020979020979e-07, "loss": 0.3507, "step": 49600 }, { "epoch": 42.99, "learning_rate": 5.672027972027972e-07, "loss": 0.3843, "step": 49610 }, { "epoch": 43.0, "learning_rate": 5.665034965034965e-07, "loss": 0.3702, "step": 49620 }, { "epoch": 43.0, "eval_loss": 0.5646147727966309, "eval_runtime": 138.0762, "eval_samples_per_second": 3.853, "eval_steps_per_second": 1.926, "eval_wer": 0.24413447322748602, "step": 49622 }, { "epoch": 43.01, "learning_rate": 5.658041958041958e-07, "loss": 0.4483, "step": 49630 }, { "epoch": 43.02, "learning_rate": 5.651048951048952e-07, "loss": 0.3129, "step": 49640 }, { "epoch": 43.02, "learning_rate": 5.644055944055944e-07, "loss": 0.3615, "step": 49650 }, { "epoch": 43.03, "learning_rate": 5.637062937062936e-07, "loss": 0.4337, "step": 49660 }, { "epoch": 43.04, "learning_rate": 5.630069930069929e-07, "loss": 0.3558, "step": 49670 }, { "epoch": 43.05, "learning_rate": 5.623076923076923e-07, "loss": 0.3202, "step": 49680 }, { "epoch": 43.06, "learning_rate": 5.616083916083916e-07, "loss": 0.3395, "step": 49690 }, { "epoch": 43.07, "learning_rate": 5.609090909090909e-07, "loss": 0.3591, "step": 49700 }, { "epoch": 43.08, "learning_rate": 5.602097902097903e-07, "loss": 0.4359, "step": 49710 }, { "epoch": 43.08, "learning_rate": 5.595104895104895e-07, "loss": 0.3346, "step": 49720 }, { "epoch": 43.09, "learning_rate": 5.588111888111888e-07, "loss": 0.3803, "step": 49730 }, { "epoch": 43.1, "learning_rate": 5.581118881118881e-07, "loss": 0.3718, "step": 49740 }, { "epoch": 43.11, "learning_rate": 5.574125874125874e-07, "loss": 0.335, "step": 49750 }, { "epoch": 43.12, "learning_rate": 5.567132867132867e-07, "loss": 0.3856, "step": 49760 }, { "epoch": 43.13, "learning_rate": 5.56083916083916e-07, "loss": 0.3488, "step": 49770 }, { "epoch": 43.14, "learning_rate": 5.553846153846153e-07, "loss": 0.3367, "step": 49780 }, { "epoch": 43.15, "learning_rate": 5.546853146853146e-07, "loss": 0.3346, "step": 49790 }, { "epoch": 43.15, "learning_rate": 5.53986013986014e-07, "loss": 0.3368, "step": 49800 }, { "epoch": 43.16, "learning_rate": 5.532867132867133e-07, "loss": 0.3931, "step": 49810 }, { "epoch": 43.17, "learning_rate": 5.525874125874126e-07, "loss": 0.3877, "step": 49820 }, { "epoch": 43.18, "learning_rate": 5.51888111888112e-07, "loss": 0.3382, "step": 49830 }, { "epoch": 43.19, "learning_rate": 5.511888111888111e-07, "loss": 0.3488, "step": 49840 }, { "epoch": 43.2, "learning_rate": 5.504895104895104e-07, "loss": 0.3033, "step": 49850 }, { "epoch": 43.21, "learning_rate": 5.497902097902097e-07, "loss": 0.3465, "step": 49860 }, { "epoch": 43.21, "learning_rate": 5.490909090909091e-07, "loss": 0.3864, "step": 49870 }, { "epoch": 43.22, "learning_rate": 5.483916083916084e-07, "loss": 0.3856, "step": 49880 }, { "epoch": 43.23, "learning_rate": 5.476923076923077e-07, "loss": 0.3992, "step": 49890 }, { "epoch": 43.24, "learning_rate": 5.46993006993007e-07, "loss": 0.351, "step": 49900 }, { "epoch": 43.25, "learning_rate": 5.462937062937063e-07, "loss": 0.3492, "step": 49910 }, { "epoch": 43.26, "learning_rate": 5.455944055944056e-07, "loss": 0.3662, "step": 49920 }, { "epoch": 43.27, "learning_rate": 5.448951048951048e-07, "loss": 0.3553, "step": 49930 }, { "epoch": 43.28, "learning_rate": 5.441958041958041e-07, "loss": 0.403, "step": 49940 }, { "epoch": 43.28, "learning_rate": 5.434965034965035e-07, "loss": 0.3562, "step": 49950 }, { "epoch": 43.29, "learning_rate": 5.427972027972028e-07, "loss": 0.3855, "step": 49960 }, { "epoch": 43.3, "learning_rate": 5.420979020979021e-07, "loss": 0.3589, "step": 49970 }, { "epoch": 43.31, "learning_rate": 5.413986013986013e-07, "loss": 0.3787, "step": 49980 }, { "epoch": 43.32, "learning_rate": 5.406993006993007e-07, "loss": 0.3631, "step": 49990 }, { "epoch": 43.33, "learning_rate": 5.4e-07, "loss": 0.3099, "step": 50000 }, { "epoch": 43.34, "learning_rate": 5.393006993006993e-07, "loss": 0.349, "step": 50010 }, { "epoch": 43.34, "learning_rate": 5.386013986013985e-07, "loss": 0.4186, "step": 50020 }, { "epoch": 43.35, "learning_rate": 5.379020979020979e-07, "loss": 0.349, "step": 50030 }, { "epoch": 43.36, "learning_rate": 5.372027972027972e-07, "loss": 0.377, "step": 50040 }, { "epoch": 43.37, "learning_rate": 5.365034965034964e-07, "loss": 0.3425, "step": 50050 }, { "epoch": 43.38, "learning_rate": 5.358041958041957e-07, "loss": 0.3438, "step": 50060 }, { "epoch": 43.39, "learning_rate": 5.351048951048951e-07, "loss": 0.385, "step": 50070 }, { "epoch": 43.4, "learning_rate": 5.344055944055944e-07, "loss": 0.3116, "step": 50080 }, { "epoch": 43.41, "learning_rate": 5.337062937062937e-07, "loss": 0.3366, "step": 50090 }, { "epoch": 43.41, "learning_rate": 5.330069930069931e-07, "loss": 0.347, "step": 50100 }, { "epoch": 43.42, "learning_rate": 5.323076923076923e-07, "loss": 0.359, "step": 50110 }, { "epoch": 43.43, "learning_rate": 5.316083916083915e-07, "loss": 0.3482, "step": 50120 }, { "epoch": 43.44, "learning_rate": 5.309090909090908e-07, "loss": 0.4245, "step": 50130 }, { "epoch": 43.45, "learning_rate": 5.302097902097902e-07, "loss": 0.4013, "step": 50140 }, { "epoch": 43.46, "learning_rate": 5.295104895104895e-07, "loss": 0.3183, "step": 50150 }, { "epoch": 43.47, "learning_rate": 5.288111888111888e-07, "loss": 0.3847, "step": 50160 }, { "epoch": 43.47, "learning_rate": 5.281118881118881e-07, "loss": 0.3408, "step": 50170 }, { "epoch": 43.48, "learning_rate": 5.274125874125875e-07, "loss": 0.3204, "step": 50180 }, { "epoch": 43.49, "learning_rate": 5.267132867132868e-07, "loss": 0.3748, "step": 50190 }, { "epoch": 43.5, "learning_rate": 5.260139860139859e-07, "loss": 0.3272, "step": 50200 }, { "epoch": 43.51, "learning_rate": 5.253146853146852e-07, "loss": 0.3443, "step": 50210 }, { "epoch": 43.52, "learning_rate": 5.246153846153846e-07, "loss": 0.334, "step": 50220 }, { "epoch": 43.53, "learning_rate": 5.239160839160839e-07, "loss": 0.3717, "step": 50230 }, { "epoch": 43.54, "learning_rate": 5.232167832167832e-07, "loss": 0.3835, "step": 50240 }, { "epoch": 43.54, "learning_rate": 5.225174825174825e-07, "loss": 0.3446, "step": 50250 }, { "epoch": 43.55, "learning_rate": 5.218181818181819e-07, "loss": 0.3764, "step": 50260 }, { "epoch": 43.56, "learning_rate": 5.211188811188811e-07, "loss": 0.3715, "step": 50270 }, { "epoch": 43.57, "learning_rate": 5.204195804195804e-07, "loss": 0.3868, "step": 50280 }, { "epoch": 43.58, "learning_rate": 5.197202797202796e-07, "loss": 0.3194, "step": 50290 }, { "epoch": 43.59, "learning_rate": 5.19020979020979e-07, "loss": 0.3496, "step": 50300 }, { "epoch": 43.6, "learning_rate": 5.183216783216783e-07, "loss": 0.3352, "step": 50310 }, { "epoch": 43.6, "learning_rate": 5.176223776223776e-07, "loss": 0.3579, "step": 50320 }, { "epoch": 43.61, "learning_rate": 5.16923076923077e-07, "loss": 0.3405, "step": 50330 }, { "epoch": 43.62, "learning_rate": 5.162237762237762e-07, "loss": 0.3587, "step": 50340 }, { "epoch": 43.63, "learning_rate": 5.155244755244755e-07, "loss": 0.3614, "step": 50350 }, { "epoch": 43.64, "learning_rate": 5.148251748251748e-07, "loss": 0.3478, "step": 50360 }, { "epoch": 43.65, "learning_rate": 5.141258741258741e-07, "loss": 0.3754, "step": 50370 }, { "epoch": 43.66, "learning_rate": 5.134265734265734e-07, "loss": 0.3146, "step": 50380 }, { "epoch": 43.67, "learning_rate": 5.127272727272727e-07, "loss": 0.3599, "step": 50390 }, { "epoch": 43.67, "learning_rate": 5.12027972027972e-07, "loss": 0.3302, "step": 50400 }, { "epoch": 43.68, "learning_rate": 5.113286713286713e-07, "loss": 0.3394, "step": 50410 }, { "epoch": 43.69, "learning_rate": 5.106293706293706e-07, "loss": 0.3385, "step": 50420 }, { "epoch": 43.7, "learning_rate": 5.099300699300699e-07, "loss": 0.3213, "step": 50430 }, { "epoch": 43.71, "learning_rate": 5.092307692307692e-07, "loss": 0.3575, "step": 50440 }, { "epoch": 43.72, "learning_rate": 5.085314685314686e-07, "loss": 0.3492, "step": 50450 }, { "epoch": 43.73, "learning_rate": 5.078321678321678e-07, "loss": 0.3904, "step": 50460 }, { "epoch": 43.73, "learning_rate": 5.071328671328671e-07, "loss": 0.388, "step": 50470 }, { "epoch": 43.74, "learning_rate": 5.064335664335663e-07, "loss": 0.4397, "step": 50480 }, { "epoch": 43.75, "learning_rate": 5.057342657342657e-07, "loss": 0.3186, "step": 50490 }, { "epoch": 43.76, "learning_rate": 5.05034965034965e-07, "loss": 0.3315, "step": 50500 }, { "epoch": 43.77, "learning_rate": 5.043356643356643e-07, "loss": 0.3556, "step": 50510 }, { "epoch": 43.78, "learning_rate": 5.036363636363636e-07, "loss": 0.4012, "step": 50520 }, { "epoch": 43.79, "learning_rate": 5.02937062937063e-07, "loss": 0.3227, "step": 50530 }, { "epoch": 43.8, "learning_rate": 5.022377622377623e-07, "loss": 0.3532, "step": 50540 }, { "epoch": 43.8, "learning_rate": 5.015384615384614e-07, "loss": 0.3468, "step": 50550 }, { "epoch": 43.81, "learning_rate": 5.008391608391607e-07, "loss": 0.3401, "step": 50560 }, { "epoch": 43.82, "learning_rate": 5.001398601398601e-07, "loss": 0.3841, "step": 50570 }, { "epoch": 43.83, "learning_rate": 4.995104895104895e-07, "loss": 0.3204, "step": 50580 }, { "epoch": 43.84, "learning_rate": 4.988111888111888e-07, "loss": 0.3945, "step": 50590 }, { "epoch": 43.85, "learning_rate": 4.98111888111888e-07, "loss": 0.3158, "step": 50600 }, { "epoch": 43.86, "learning_rate": 4.974125874125874e-07, "loss": 0.3709, "step": 50610 }, { "epoch": 43.86, "learning_rate": 4.967132867132867e-07, "loss": 0.3594, "step": 50620 }, { "epoch": 43.87, "learning_rate": 4.96013986013986e-07, "loss": 0.2674, "step": 50630 }, { "epoch": 43.88, "learning_rate": 4.953146853146853e-07, "loss": 0.3399, "step": 50640 }, { "epoch": 43.89, "learning_rate": 4.946153846153846e-07, "loss": 0.3651, "step": 50650 }, { "epoch": 43.9, "learning_rate": 4.939160839160839e-07, "loss": 0.3881, "step": 50660 }, { "epoch": 43.91, "learning_rate": 4.932167832167831e-07, "loss": 0.3616, "step": 50670 }, { "epoch": 43.92, "learning_rate": 4.925174825174824e-07, "loss": 0.3515, "step": 50680 }, { "epoch": 43.93, "learning_rate": 4.918181818181818e-07, "loss": 0.383, "step": 50690 }, { "epoch": 43.93, "learning_rate": 4.911188811188811e-07, "loss": 0.3215, "step": 50700 }, { "epoch": 43.94, "learning_rate": 4.904195804195804e-07, "loss": 0.3708, "step": 50710 }, { "epoch": 43.95, "learning_rate": 4.897202797202797e-07, "loss": 0.4286, "step": 50720 }, { "epoch": 43.96, "learning_rate": 4.89020979020979e-07, "loss": 0.4208, "step": 50730 }, { "epoch": 43.97, "learning_rate": 4.883216783216784e-07, "loss": 0.3737, "step": 50740 }, { "epoch": 43.98, "learning_rate": 4.876223776223776e-07, "loss": 0.299, "step": 50750 }, { "epoch": 43.99, "learning_rate": 4.869230769230769e-07, "loss": 0.4187, "step": 50760 }, { "epoch": 43.99, "learning_rate": 4.862237762237762e-07, "loss": 0.3444, "step": 50770 }, { "epoch": 44.0, "eval_loss": 0.565770149230957, "eval_runtime": 137.6557, "eval_samples_per_second": 3.865, "eval_steps_per_second": 1.932, "eval_wer": 0.24130616442758887, "step": 50776 }, { "epoch": 44.0, "learning_rate": 4.855244755244755e-07, "loss": 0.325, "step": 50780 }, { "epoch": 44.01, "learning_rate": 4.848251748251748e-07, "loss": 0.3413, "step": 50790 }, { "epoch": 44.02, "learning_rate": 4.841258741258741e-07, "loss": 0.3148, "step": 50800 }, { "epoch": 44.03, "learning_rate": 4.834265734265734e-07, "loss": 0.4056, "step": 50810 }, { "epoch": 44.04, "learning_rate": 4.827272727272727e-07, "loss": 0.3773, "step": 50820 }, { "epoch": 44.05, "learning_rate": 4.82027972027972e-07, "loss": 0.3485, "step": 50830 }, { "epoch": 44.06, "learning_rate": 4.813286713286713e-07, "loss": 0.3589, "step": 50840 }, { "epoch": 44.06, "learning_rate": 4.806293706293706e-07, "loss": 0.3755, "step": 50850 }, { "epoch": 44.07, "learning_rate": 4.799300699300699e-07, "loss": 0.3676, "step": 50860 }, { "epoch": 44.08, "learning_rate": 4.792307692307692e-07, "loss": 0.3682, "step": 50870 }, { "epoch": 44.09, "learning_rate": 4.785314685314686e-07, "loss": 0.3834, "step": 50880 }, { "epoch": 44.1, "learning_rate": 4.778321678321677e-07, "loss": 0.4024, "step": 50890 }, { "epoch": 44.11, "learning_rate": 4.771328671328671e-07, "loss": 0.3543, "step": 50900 }, { "epoch": 44.12, "learning_rate": 4.764335664335664e-07, "loss": 0.3748, "step": 50910 }, { "epoch": 44.12, "learning_rate": 4.757342657342657e-07, "loss": 0.3427, "step": 50920 }, { "epoch": 44.13, "learning_rate": 4.7503496503496504e-07, "loss": 0.3596, "step": 50930 }, { "epoch": 44.14, "learning_rate": 4.7433566433566427e-07, "loss": 0.3468, "step": 50940 }, { "epoch": 44.15, "learning_rate": 4.736363636363636e-07, "loss": 0.3084, "step": 50950 }, { "epoch": 44.16, "learning_rate": 4.7293706293706295e-07, "loss": 0.3412, "step": 50960 }, { "epoch": 44.17, "learning_rate": 4.7223776223776223e-07, "loss": 0.3512, "step": 50970 }, { "epoch": 44.18, "learning_rate": 4.715384615384615e-07, "loss": 0.3601, "step": 50980 }, { "epoch": 44.19, "learning_rate": 4.708391608391608e-07, "loss": 0.4109, "step": 50990 }, { "epoch": 44.19, "learning_rate": 4.7013986013986014e-07, "loss": 0.3168, "step": 51000 }, { "epoch": 44.2, "learning_rate": 4.6944055944055943e-07, "loss": 0.3551, "step": 51010 }, { "epoch": 44.21, "learning_rate": 4.687412587412587e-07, "loss": 0.3557, "step": 51020 }, { "epoch": 44.22, "learning_rate": 4.68041958041958e-07, "loss": 0.3283, "step": 51030 }, { "epoch": 44.23, "learning_rate": 4.6734265734265734e-07, "loss": 0.3595, "step": 51040 }, { "epoch": 44.24, "learning_rate": 4.666433566433566e-07, "loss": 0.3826, "step": 51050 }, { "epoch": 44.25, "learning_rate": 4.6594405594405596e-07, "loss": 0.3451, "step": 51060 }, { "epoch": 44.25, "learning_rate": 4.652447552447552e-07, "loss": 0.3752, "step": 51070 }, { "epoch": 44.26, "learning_rate": 4.6454545454545453e-07, "loss": 0.3869, "step": 51080 }, { "epoch": 44.27, "learning_rate": 4.638461538461538e-07, "loss": 0.3548, "step": 51090 }, { "epoch": 44.28, "learning_rate": 4.6314685314685315e-07, "loss": 0.3236, "step": 51100 }, { "epoch": 44.29, "learning_rate": 4.624475524475524e-07, "loss": 0.3261, "step": 51110 }, { "epoch": 44.3, "learning_rate": 4.617482517482517e-07, "loss": 0.342, "step": 51120 }, { "epoch": 44.31, "learning_rate": 4.61048951048951e-07, "loss": 0.3196, "step": 51130 }, { "epoch": 44.32, "learning_rate": 4.6034965034965035e-07, "loss": 0.319, "step": 51140 }, { "epoch": 44.32, "learning_rate": 4.5965034965034963e-07, "loss": 0.3924, "step": 51150 }, { "epoch": 44.33, "learning_rate": 4.589510489510489e-07, "loss": 0.3715, "step": 51160 }, { "epoch": 44.34, "learning_rate": 4.582517482517482e-07, "loss": 0.3719, "step": 51170 }, { "epoch": 44.35, "learning_rate": 4.5755244755244754e-07, "loss": 0.3456, "step": 51180 }, { "epoch": 44.36, "learning_rate": 4.568531468531469e-07, "loss": 0.3956, "step": 51190 }, { "epoch": 44.37, "learning_rate": 4.561538461538461e-07, "loss": 0.3757, "step": 51200 }, { "epoch": 44.38, "learning_rate": 4.5545454545454545e-07, "loss": 0.3573, "step": 51210 }, { "epoch": 44.38, "learning_rate": 4.5475524475524473e-07, "loss": 0.362, "step": 51220 }, { "epoch": 44.39, "learning_rate": 4.5405594405594407e-07, "loss": 0.4066, "step": 51230 }, { "epoch": 44.4, "learning_rate": 4.533566433566433e-07, "loss": 0.386, "step": 51240 }, { "epoch": 44.41, "learning_rate": 4.5265734265734264e-07, "loss": 0.3183, "step": 51250 }, { "epoch": 44.42, "learning_rate": 4.5195804195804193e-07, "loss": 0.3254, "step": 51260 }, { "epoch": 44.43, "learning_rate": 4.5125874125874127e-07, "loss": 0.3963, "step": 51270 }, { "epoch": 44.44, "learning_rate": 4.5055944055944055e-07, "loss": 0.2913, "step": 51280 }, { "epoch": 44.45, "learning_rate": 4.4986013986013984e-07, "loss": 0.3316, "step": 51290 }, { "epoch": 44.45, "learning_rate": 4.491608391608391e-07, "loss": 0.3397, "step": 51300 }, { "epoch": 44.46, "learning_rate": 4.4846153846153846e-07, "loss": 0.3333, "step": 51310 }, { "epoch": 44.47, "learning_rate": 4.4776223776223775e-07, "loss": 0.4175, "step": 51320 }, { "epoch": 44.48, "learning_rate": 4.4706293706293703e-07, "loss": 0.3613, "step": 51330 }, { "epoch": 44.49, "learning_rate": 4.463636363636363e-07, "loss": 0.3953, "step": 51340 }, { "epoch": 44.5, "learning_rate": 4.4566433566433565e-07, "loss": 0.3269, "step": 51350 }, { "epoch": 44.51, "learning_rate": 4.4496503496503494e-07, "loss": 0.3545, "step": 51360 }, { "epoch": 44.51, "learning_rate": 4.442657342657343e-07, "loss": 0.4028, "step": 51370 }, { "epoch": 44.52, "learning_rate": 4.435664335664335e-07, "loss": 0.4086, "step": 51380 }, { "epoch": 44.53, "learning_rate": 4.4286713286713285e-07, "loss": 0.3323, "step": 51390 }, { "epoch": 44.54, "learning_rate": 4.4216783216783213e-07, "loss": 0.3906, "step": 51400 }, { "epoch": 44.55, "learning_rate": 4.4146853146853147e-07, "loss": 0.3551, "step": 51410 }, { "epoch": 44.56, "learning_rate": 4.407692307692307e-07, "loss": 0.3603, "step": 51420 }, { "epoch": 44.57, "learning_rate": 4.4006993006993004e-07, "loss": 0.2797, "step": 51430 }, { "epoch": 44.58, "learning_rate": 4.393706293706294e-07, "loss": 0.3186, "step": 51440 }, { "epoch": 44.58, "learning_rate": 4.3867132867132866e-07, "loss": 0.3282, "step": 51450 }, { "epoch": 44.59, "learning_rate": 4.37972027972028e-07, "loss": 0.3359, "step": 51460 }, { "epoch": 44.6, "learning_rate": 4.3727272727272723e-07, "loss": 0.3761, "step": 51470 }, { "epoch": 44.61, "learning_rate": 4.3657342657342657e-07, "loss": 0.3203, "step": 51480 }, { "epoch": 44.62, "learning_rate": 4.3587412587412586e-07, "loss": 0.366, "step": 51490 }, { "epoch": 44.63, "learning_rate": 4.351748251748252e-07, "loss": 0.28, "step": 51500 }, { "epoch": 44.64, "learning_rate": 4.3447552447552443e-07, "loss": 0.3208, "step": 51510 }, { "epoch": 44.64, "learning_rate": 4.3377622377622377e-07, "loss": 0.3376, "step": 51520 }, { "epoch": 44.65, "learning_rate": 4.3307692307692305e-07, "loss": 0.3777, "step": 51530 }, { "epoch": 44.66, "learning_rate": 4.323776223776224e-07, "loss": 0.3316, "step": 51540 }, { "epoch": 44.67, "learning_rate": 4.316783216783216e-07, "loss": 0.3205, "step": 51550 }, { "epoch": 44.68, "learning_rate": 4.3097902097902096e-07, "loss": 0.3252, "step": 51560 }, { "epoch": 44.69, "learning_rate": 4.3027972027972025e-07, "loss": 0.3657, "step": 51570 }, { "epoch": 44.7, "learning_rate": 4.295804195804196e-07, "loss": 0.361, "step": 51580 }, { "epoch": 44.71, "learning_rate": 4.2888111888111887e-07, "loss": 0.4195, "step": 51590 }, { "epoch": 44.71, "learning_rate": 4.2818181818181815e-07, "loss": 0.306, "step": 51600 }, { "epoch": 44.72, "learning_rate": 4.2748251748251744e-07, "loss": 0.3697, "step": 51610 }, { "epoch": 44.73, "learning_rate": 4.267832167832168e-07, "loss": 0.3762, "step": 51620 }, { "epoch": 44.74, "learning_rate": 4.2608391608391606e-07, "loss": 0.4058, "step": 51630 }, { "epoch": 44.75, "learning_rate": 4.2538461538461535e-07, "loss": 0.3401, "step": 51640 }, { "epoch": 44.76, "learning_rate": 4.2468531468531463e-07, "loss": 0.3201, "step": 51650 }, { "epoch": 44.77, "learning_rate": 4.2398601398601397e-07, "loss": 0.3638, "step": 51660 }, { "epoch": 44.77, "learning_rate": 4.2328671328671326e-07, "loss": 0.3522, "step": 51670 }, { "epoch": 44.78, "learning_rate": 4.225874125874126e-07, "loss": 0.361, "step": 51680 }, { "epoch": 44.79, "learning_rate": 4.218881118881119e-07, "loss": 0.3551, "step": 51690 }, { "epoch": 44.8, "learning_rate": 4.2118881118881116e-07, "loss": 0.3629, "step": 51700 }, { "epoch": 44.81, "learning_rate": 4.204895104895105e-07, "loss": 0.3809, "step": 51710 }, { "epoch": 44.82, "learning_rate": 4.197902097902098e-07, "loss": 0.4204, "step": 51720 }, { "epoch": 44.83, "learning_rate": 4.1909090909090907e-07, "loss": 0.3504, "step": 51730 }, { "epoch": 44.83, "learning_rate": 4.1839160839160836e-07, "loss": 0.321, "step": 51740 }, { "epoch": 44.84, "learning_rate": 4.176923076923077e-07, "loss": 0.3443, "step": 51750 }, { "epoch": 44.85, "learning_rate": 4.16993006993007e-07, "loss": 0.3294, "step": 51760 }, { "epoch": 44.86, "learning_rate": 4.1629370629370627e-07, "loss": 0.3754, "step": 51770 }, { "epoch": 44.87, "learning_rate": 4.1559440559440555e-07, "loss": 0.359, "step": 51780 }, { "epoch": 44.88, "learning_rate": 4.148951048951049e-07, "loss": 0.3334, "step": 51790 }, { "epoch": 44.89, "learning_rate": 4.141958041958042e-07, "loss": 0.3306, "step": 51800 }, { "epoch": 44.9, "learning_rate": 4.134965034965035e-07, "loss": 0.3905, "step": 51810 }, { "epoch": 44.9, "learning_rate": 4.1279720279720275e-07, "loss": 0.3473, "step": 51820 }, { "epoch": 44.91, "learning_rate": 4.120979020979021e-07, "loss": 0.3089, "step": 51830 }, { "epoch": 44.92, "learning_rate": 4.1139860139860137e-07, "loss": 0.3684, "step": 51840 }, { "epoch": 44.93, "learning_rate": 4.106993006993007e-07, "loss": 0.343, "step": 51850 }, { "epoch": 44.94, "learning_rate": 4.0999999999999994e-07, "loss": 0.3692, "step": 51860 }, { "epoch": 44.95, "learning_rate": 4.093006993006993e-07, "loss": 0.388, "step": 51870 }, { "epoch": 44.96, "learning_rate": 4.0860139860139856e-07, "loss": 0.3411, "step": 51880 }, { "epoch": 44.96, "learning_rate": 4.079020979020979e-07, "loss": 0.3736, "step": 51890 }, { "epoch": 44.97, "learning_rate": 4.072027972027972e-07, "loss": 0.3311, "step": 51900 }, { "epoch": 44.98, "learning_rate": 4.0650349650349647e-07, "loss": 0.368, "step": 51910 }, { "epoch": 44.99, "learning_rate": 4.0580419580419576e-07, "loss": 0.3885, "step": 51920 }, { "epoch": 45.0, "learning_rate": 4.051048951048951e-07, "loss": 0.3152, "step": 51930 }, { "epoch": 45.0, "eval_loss": 0.5559401512145996, "eval_runtime": 138.3022, "eval_samples_per_second": 3.847, "eval_steps_per_second": 1.923, "eval_wer": 0.24021340875490133, "step": 51930 }, { "epoch": 45.01, "learning_rate": 4.0440559440559443e-07, "loss": 0.3634, "step": 51940 }, { "epoch": 45.02, "learning_rate": 4.0370629370629366e-07, "loss": 0.3808, "step": 51950 }, { "epoch": 45.03, "learning_rate": 4.03006993006993e-07, "loss": 0.2829, "step": 51960 }, { "epoch": 45.03, "learning_rate": 4.023076923076923e-07, "loss": 0.3541, "step": 51970 }, { "epoch": 45.04, "learning_rate": 4.016083916083916e-07, "loss": 0.2983, "step": 51980 }, { "epoch": 45.05, "learning_rate": 4.0090909090909086e-07, "loss": 0.3205, "step": 51990 }, { "epoch": 45.06, "learning_rate": 4.002097902097902e-07, "loss": 0.3651, "step": 52000 }, { "epoch": 45.07, "learning_rate": 3.995104895104895e-07, "loss": 0.3451, "step": 52010 }, { "epoch": 45.08, "learning_rate": 3.988111888111888e-07, "loss": 0.3793, "step": 52020 }, { "epoch": 45.09, "learning_rate": 3.981118881118881e-07, "loss": 0.3988, "step": 52030 }, { "epoch": 45.1, "learning_rate": 3.974125874125874e-07, "loss": 0.3919, "step": 52040 }, { "epoch": 45.1, "learning_rate": 3.967132867132867e-07, "loss": 0.3249, "step": 52050 }, { "epoch": 45.11, "learning_rate": 3.96013986013986e-07, "loss": 0.3432, "step": 52060 }, { "epoch": 45.12, "learning_rate": 3.953146853146853e-07, "loss": 0.3442, "step": 52070 }, { "epoch": 45.13, "learning_rate": 3.946153846153846e-07, "loss": 0.3305, "step": 52080 }, { "epoch": 45.14, "learning_rate": 3.9391608391608387e-07, "loss": 0.3412, "step": 52090 }, { "epoch": 45.15, "learning_rate": 3.932167832167832e-07, "loss": 0.3864, "step": 52100 }, { "epoch": 45.16, "learning_rate": 3.925174825174825e-07, "loss": 0.3563, "step": 52110 }, { "epoch": 45.16, "learning_rate": 3.9181818181818183e-07, "loss": 0.3579, "step": 52120 }, { "epoch": 45.17, "learning_rate": 3.9111888111888106e-07, "loss": 0.416, "step": 52130 }, { "epoch": 45.18, "learning_rate": 3.904195804195804e-07, "loss": 0.3637, "step": 52140 }, { "epoch": 45.19, "learning_rate": 3.897202797202797e-07, "loss": 0.3377, "step": 52150 }, { "epoch": 45.2, "learning_rate": 3.89020979020979e-07, "loss": 0.3395, "step": 52160 }, { "epoch": 45.21, "learning_rate": 3.8832167832167826e-07, "loss": 0.3114, "step": 52170 }, { "epoch": 45.22, "learning_rate": 3.876223776223776e-07, "loss": 0.3728, "step": 52180 }, { "epoch": 45.23, "learning_rate": 3.8692307692307693e-07, "loss": 0.348, "step": 52190 }, { "epoch": 45.23, "learning_rate": 3.862237762237762e-07, "loss": 0.3457, "step": 52200 }, { "epoch": 45.24, "learning_rate": 3.8552447552447556e-07, "loss": 0.3347, "step": 52210 }, { "epoch": 45.25, "learning_rate": 3.848251748251748e-07, "loss": 0.3706, "step": 52220 }, { "epoch": 45.26, "learning_rate": 3.841258741258741e-07, "loss": 0.3942, "step": 52230 }, { "epoch": 45.27, "learning_rate": 3.834265734265734e-07, "loss": 0.3266, "step": 52240 }, { "epoch": 45.28, "learning_rate": 3.8272727272727275e-07, "loss": 0.3274, "step": 52250 }, { "epoch": 45.29, "learning_rate": 3.82027972027972e-07, "loss": 0.2802, "step": 52260 }, { "epoch": 45.29, "learning_rate": 3.813286713286713e-07, "loss": 0.3797, "step": 52270 }, { "epoch": 45.3, "learning_rate": 3.806293706293706e-07, "loss": 0.3517, "step": 52280 }, { "epoch": 45.31, "learning_rate": 3.7993006993006994e-07, "loss": 0.3494, "step": 52290 }, { "epoch": 45.32, "learning_rate": 3.792307692307692e-07, "loss": 0.3575, "step": 52300 }, { "epoch": 45.33, "learning_rate": 3.785314685314685e-07, "loss": 0.3258, "step": 52310 }, { "epoch": 45.34, "learning_rate": 3.778321678321678e-07, "loss": 0.361, "step": 52320 }, { "epoch": 45.35, "learning_rate": 3.7713286713286714e-07, "loss": 0.3957, "step": 52330 }, { "epoch": 45.36, "learning_rate": 3.764335664335664e-07, "loss": 0.3734, "step": 52340 }, { "epoch": 45.36, "learning_rate": 3.757342657342657e-07, "loss": 0.3217, "step": 52350 }, { "epoch": 45.37, "learning_rate": 3.75034965034965e-07, "loss": 0.352, "step": 52360 }, { "epoch": 45.38, "learning_rate": 3.7433566433566433e-07, "loss": 0.3292, "step": 52370 }, { "epoch": 45.39, "learning_rate": 3.736363636363636e-07, "loss": 0.3959, "step": 52380 }, { "epoch": 45.4, "learning_rate": 3.729370629370629e-07, "loss": 0.3335, "step": 52390 }, { "epoch": 45.41, "learning_rate": 3.722377622377622e-07, "loss": 0.3569, "step": 52400 }, { "epoch": 45.42, "learning_rate": 3.715384615384615e-07, "loss": 0.3919, "step": 52410 }, { "epoch": 45.42, "learning_rate": 3.7083916083916086e-07, "loss": 0.3862, "step": 52420 }, { "epoch": 45.43, "learning_rate": 3.7013986013986015e-07, "loss": 0.3332, "step": 52430 }, { "epoch": 45.44, "learning_rate": 3.6944055944055943e-07, "loss": 0.348, "step": 52440 }, { "epoch": 45.45, "learning_rate": 3.687412587412587e-07, "loss": 0.3456, "step": 52450 }, { "epoch": 45.46, "learning_rate": 3.6804195804195806e-07, "loss": 0.3297, "step": 52460 }, { "epoch": 45.47, "learning_rate": 3.6734265734265734e-07, "loss": 0.4109, "step": 52470 }, { "epoch": 45.48, "learning_rate": 3.666433566433566e-07, "loss": 0.3729, "step": 52480 }, { "epoch": 45.49, "learning_rate": 3.659440559440559e-07, "loss": 0.3014, "step": 52490 }, { "epoch": 45.49, "learning_rate": 3.6524475524475525e-07, "loss": 0.4247, "step": 52500 }, { "epoch": 45.5, "learning_rate": 3.6454545454545453e-07, "loss": 0.3382, "step": 52510 }, { "epoch": 45.51, "learning_rate": 3.638461538461538e-07, "loss": 0.3732, "step": 52520 }, { "epoch": 45.52, "learning_rate": 3.631468531468531e-07, "loss": 0.3224, "step": 52530 }, { "epoch": 45.53, "learning_rate": 3.6244755244755244e-07, "loss": 0.3809, "step": 52540 }, { "epoch": 45.54, "learning_rate": 3.6174825174825173e-07, "loss": 0.3758, "step": 52550 }, { "epoch": 45.55, "learning_rate": 3.6104895104895107e-07, "loss": 0.3511, "step": 52560 }, { "epoch": 45.55, "learning_rate": 3.603496503496503e-07, "loss": 0.3247, "step": 52570 }, { "epoch": 45.56, "learning_rate": 3.5965034965034964e-07, "loss": 0.4197, "step": 52580 }, { "epoch": 45.57, "learning_rate": 3.589510489510489e-07, "loss": 0.3722, "step": 52590 }, { "epoch": 45.58, "learning_rate": 3.5825174825174826e-07, "loss": 0.3467, "step": 52600 }, { "epoch": 45.59, "learning_rate": 3.575524475524475e-07, "loss": 0.2931, "step": 52610 }, { "epoch": 45.6, "learning_rate": 3.5685314685314683e-07, "loss": 0.391, "step": 52620 }, { "epoch": 45.61, "learning_rate": 3.561538461538461e-07, "loss": 0.3567, "step": 52630 }, { "epoch": 45.61, "learning_rate": 3.5545454545454545e-07, "loss": 0.3436, "step": 52640 }, { "epoch": 45.62, "learning_rate": 3.5475524475524474e-07, "loss": 0.3486, "step": 52650 }, { "epoch": 45.63, "learning_rate": 3.54055944055944e-07, "loss": 0.3513, "step": 52660 }, { "epoch": 45.64, "learning_rate": 3.533566433566433e-07, "loss": 0.3871, "step": 52670 }, { "epoch": 45.65, "learning_rate": 3.5265734265734265e-07, "loss": 0.3758, "step": 52680 }, { "epoch": 45.66, "learning_rate": 3.51958041958042e-07, "loss": 0.3677, "step": 52690 }, { "epoch": 45.67, "learning_rate": 3.512587412587412e-07, "loss": 0.3368, "step": 52700 }, { "epoch": 45.68, "learning_rate": 3.5055944055944056e-07, "loss": 0.3457, "step": 52710 }, { "epoch": 45.68, "learning_rate": 3.4986013986013984e-07, "loss": 0.3342, "step": 52720 }, { "epoch": 45.69, "learning_rate": 3.491608391608392e-07, "loss": 0.3456, "step": 52730 }, { "epoch": 45.7, "learning_rate": 3.4846153846153846e-07, "loss": 0.3281, "step": 52740 }, { "epoch": 45.71, "learning_rate": 3.4776223776223775e-07, "loss": 0.3023, "step": 52750 }, { "epoch": 45.72, "learning_rate": 3.4706293706293703e-07, "loss": 0.4121, "step": 52760 }, { "epoch": 45.73, "learning_rate": 3.4636363636363637e-07, "loss": 0.3656, "step": 52770 }, { "epoch": 45.74, "learning_rate": 3.4566433566433566e-07, "loss": 0.3331, "step": 52780 }, { "epoch": 45.74, "learning_rate": 3.4496503496503494e-07, "loss": 0.3769, "step": 52790 }, { "epoch": 45.75, "learning_rate": 3.4426573426573423e-07, "loss": 0.3901, "step": 52800 }, { "epoch": 45.76, "learning_rate": 3.4356643356643357e-07, "loss": 0.3108, "step": 52810 }, { "epoch": 45.77, "learning_rate": 3.4286713286713285e-07, "loss": 0.3604, "step": 52820 }, { "epoch": 45.78, "learning_rate": 3.4216783216783214e-07, "loss": 0.335, "step": 52830 }, { "epoch": 45.79, "learning_rate": 3.414685314685314e-07, "loss": 0.349, "step": 52840 }, { "epoch": 45.8, "learning_rate": 3.4076923076923076e-07, "loss": 0.3362, "step": 52850 }, { "epoch": 45.81, "learning_rate": 3.4006993006993005e-07, "loss": 0.3089, "step": 52860 }, { "epoch": 45.81, "learning_rate": 3.393706293706294e-07, "loss": 0.3587, "step": 52870 }, { "epoch": 45.82, "learning_rate": 3.386713286713286e-07, "loss": 0.3461, "step": 52880 }, { "epoch": 45.83, "learning_rate": 3.3797202797202795e-07, "loss": 0.3051, "step": 52890 }, { "epoch": 45.84, "learning_rate": 3.3727272727272724e-07, "loss": 0.3519, "step": 52900 }, { "epoch": 45.85, "learning_rate": 3.365734265734266e-07, "loss": 0.3095, "step": 52910 }, { "epoch": 45.86, "learning_rate": 3.358741258741258e-07, "loss": 0.3646, "step": 52920 }, { "epoch": 45.87, "learning_rate": 3.3517482517482515e-07, "loss": 0.3363, "step": 52930 }, { "epoch": 45.87, "learning_rate": 3.344755244755245e-07, "loss": 0.3295, "step": 52940 }, { "epoch": 45.88, "learning_rate": 3.3377622377622377e-07, "loss": 0.3362, "step": 52950 }, { "epoch": 45.89, "learning_rate": 3.330769230769231e-07, "loss": 0.4204, "step": 52960 }, { "epoch": 45.9, "learning_rate": 3.3237762237762234e-07, "loss": 0.3752, "step": 52970 }, { "epoch": 45.91, "learning_rate": 3.316783216783217e-07, "loss": 0.3524, "step": 52980 }, { "epoch": 45.92, "learning_rate": 3.3097902097902096e-07, "loss": 0.3185, "step": 52990 }, { "epoch": 45.93, "learning_rate": 3.302797202797203e-07, "loss": 0.3749, "step": 53000 }, { "epoch": 45.94, "learning_rate": 3.2958041958041954e-07, "loss": 0.3107, "step": 53010 }, { "epoch": 45.94, "learning_rate": 3.2888111888111887e-07, "loss": 0.3935, "step": 53020 }, { "epoch": 45.95, "learning_rate": 3.2818181818181816e-07, "loss": 0.3288, "step": 53030 }, { "epoch": 45.96, "learning_rate": 3.274825174825175e-07, "loss": 0.3549, "step": 53040 }, { "epoch": 45.97, "learning_rate": 3.2678321678321673e-07, "loss": 0.3727, "step": 53050 }, { "epoch": 45.98, "learning_rate": 3.2608391608391607e-07, "loss": 0.3913, "step": 53060 }, { "epoch": 45.99, "learning_rate": 3.2538461538461535e-07, "loss": 0.3895, "step": 53070 }, { "epoch": 46.0, "learning_rate": 3.246853146853147e-07, "loss": 0.4, "step": 53080 }, { "epoch": 46.0, "eval_loss": 0.5598962903022766, "eval_runtime": 136.728, "eval_samples_per_second": 3.891, "eval_steps_per_second": 1.945, "eval_wer": 0.24291315806389407, "step": 53084 }, { "epoch": 46.01, "learning_rate": 3.23986013986014e-07, "loss": 0.338, "step": 53090 }, { "epoch": 46.01, "learning_rate": 3.2328671328671326e-07, "loss": 0.3319, "step": 53100 }, { "epoch": 46.02, "learning_rate": 3.2258741258741255e-07, "loss": 0.361, "step": 53110 }, { "epoch": 46.03, "learning_rate": 3.218881118881119e-07, "loss": 0.3428, "step": 53120 }, { "epoch": 46.04, "learning_rate": 3.2118881118881117e-07, "loss": 0.3781, "step": 53130 }, { "epoch": 46.05, "learning_rate": 3.2048951048951045e-07, "loss": 0.3949, "step": 53140 }, { "epoch": 46.06, "learning_rate": 3.1979020979020974e-07, "loss": 0.3512, "step": 53150 }, { "epoch": 46.07, "learning_rate": 3.190909090909091e-07, "loss": 0.3601, "step": 53160 }, { "epoch": 46.07, "learning_rate": 3.183916083916084e-07, "loss": 0.3801, "step": 53170 }, { "epoch": 46.08, "learning_rate": 3.176923076923077e-07, "loss": 0.3381, "step": 53180 }, { "epoch": 46.09, "learning_rate": 3.16993006993007e-07, "loss": 0.3352, "step": 53190 }, { "epoch": 46.1, "learning_rate": 3.1629370629370627e-07, "loss": 0.3853, "step": 53200 }, { "epoch": 46.11, "learning_rate": 3.155944055944056e-07, "loss": 0.3489, "step": 53210 }, { "epoch": 46.12, "learning_rate": 3.148951048951049e-07, "loss": 0.3868, "step": 53220 }, { "epoch": 46.13, "learning_rate": 3.141958041958042e-07, "loss": 0.293, "step": 53230 }, { "epoch": 46.14, "learning_rate": 3.1349650349650346e-07, "loss": 0.3221, "step": 53240 }, { "epoch": 46.14, "learning_rate": 3.127972027972028e-07, "loss": 0.3962, "step": 53250 }, { "epoch": 46.15, "learning_rate": 3.120979020979021e-07, "loss": 0.3337, "step": 53260 }, { "epoch": 46.16, "learning_rate": 3.1139860139860137e-07, "loss": 0.3624, "step": 53270 }, { "epoch": 46.17, "learning_rate": 3.1069930069930066e-07, "loss": 0.3983, "step": 53280 }, { "epoch": 46.18, "learning_rate": 3.1e-07, "loss": 0.3618, "step": 53290 }, { "epoch": 46.19, "learning_rate": 3.093006993006993e-07, "loss": 0.3796, "step": 53300 }, { "epoch": 46.2, "learning_rate": 3.086013986013986e-07, "loss": 0.3536, "step": 53310 }, { "epoch": 46.2, "learning_rate": 3.0790209790209785e-07, "loss": 0.362, "step": 53320 }, { "epoch": 46.21, "learning_rate": 3.072027972027972e-07, "loss": 0.3184, "step": 53330 }, { "epoch": 46.22, "learning_rate": 3.065034965034965e-07, "loss": 0.3803, "step": 53340 }, { "epoch": 46.23, "learning_rate": 3.058041958041958e-07, "loss": 0.3361, "step": 53350 }, { "epoch": 46.24, "learning_rate": 3.0510489510489505e-07, "loss": 0.3337, "step": 53360 }, { "epoch": 46.25, "learning_rate": 3.044055944055944e-07, "loss": 0.3476, "step": 53370 }, { "epoch": 46.26, "learning_rate": 3.0370629370629367e-07, "loss": 0.3582, "step": 53380 }, { "epoch": 46.27, "learning_rate": 3.03006993006993e-07, "loss": 0.3691, "step": 53390 }, { "epoch": 46.27, "learning_rate": 3.0230769230769235e-07, "loss": 0.3526, "step": 53400 }, { "epoch": 46.28, "learning_rate": 3.016083916083916e-07, "loss": 0.3684, "step": 53410 }, { "epoch": 46.29, "learning_rate": 3.009090909090909e-07, "loss": 0.4539, "step": 53420 }, { "epoch": 46.3, "learning_rate": 3.002097902097902e-07, "loss": 0.3908, "step": 53430 }, { "epoch": 46.31, "learning_rate": 2.9951048951048954e-07, "loss": 0.3204, "step": 53440 }, { "epoch": 46.32, "learning_rate": 2.9881118881118877e-07, "loss": 0.3961, "step": 53450 }, { "epoch": 46.33, "learning_rate": 2.981118881118881e-07, "loss": 0.335, "step": 53460 }, { "epoch": 46.33, "learning_rate": 2.974125874125874e-07, "loss": 0.374, "step": 53470 }, { "epoch": 46.34, "learning_rate": 2.9671328671328673e-07, "loss": 0.449, "step": 53480 }, { "epoch": 46.35, "learning_rate": 2.96013986013986e-07, "loss": 0.3361, "step": 53490 }, { "epoch": 46.36, "learning_rate": 2.953146853146853e-07, "loss": 0.3499, "step": 53500 }, { "epoch": 46.37, "learning_rate": 2.946153846153846e-07, "loss": 0.3204, "step": 53510 }, { "epoch": 46.38, "learning_rate": 2.939160839160839e-07, "loss": 0.3682, "step": 53520 }, { "epoch": 46.39, "learning_rate": 2.932167832167832e-07, "loss": 0.3741, "step": 53530 }, { "epoch": 46.39, "learning_rate": 2.925174825174825e-07, "loss": 0.3433, "step": 53540 }, { "epoch": 46.4, "learning_rate": 2.918181818181818e-07, "loss": 0.3687, "step": 53550 }, { "epoch": 46.41, "learning_rate": 2.911188811188811e-07, "loss": 0.319, "step": 53560 }, { "epoch": 46.42, "learning_rate": 2.904195804195804e-07, "loss": 0.3686, "step": 53570 }, { "epoch": 46.43, "learning_rate": 2.897202797202797e-07, "loss": 0.3313, "step": 53580 }, { "epoch": 46.44, "learning_rate": 2.89020979020979e-07, "loss": 0.3729, "step": 53590 }, { "epoch": 46.45, "learning_rate": 2.883216783216783e-07, "loss": 0.4025, "step": 53600 }, { "epoch": 46.46, "learning_rate": 2.876223776223776e-07, "loss": 0.2871, "step": 53610 }, { "epoch": 46.46, "learning_rate": 2.8692307692307694e-07, "loss": 0.3758, "step": 53620 }, { "epoch": 46.47, "learning_rate": 2.8622377622377617e-07, "loss": 0.3482, "step": 53630 }, { "epoch": 46.48, "learning_rate": 2.855244755244755e-07, "loss": 0.3169, "step": 53640 }, { "epoch": 46.49, "learning_rate": 2.848251748251748e-07, "loss": 0.3718, "step": 53650 }, { "epoch": 46.5, "learning_rate": 2.8412587412587413e-07, "loss": 0.2951, "step": 53660 }, { "epoch": 46.51, "learning_rate": 2.834265734265734e-07, "loss": 0.3914, "step": 53670 }, { "epoch": 46.52, "learning_rate": 2.827272727272727e-07, "loss": 0.3822, "step": 53680 }, { "epoch": 46.52, "learning_rate": 2.8202797202797204e-07, "loss": 0.3789, "step": 53690 }, { "epoch": 46.53, "learning_rate": 2.813286713286713e-07, "loss": 0.3486, "step": 53700 }, { "epoch": 46.54, "learning_rate": 2.8062937062937066e-07, "loss": 0.3458, "step": 53710 }, { "epoch": 46.55, "learning_rate": 2.799300699300699e-07, "loss": 0.3958, "step": 53720 }, { "epoch": 46.56, "learning_rate": 2.7923076923076923e-07, "loss": 0.3574, "step": 53730 }, { "epoch": 46.57, "learning_rate": 2.785314685314685e-07, "loss": 0.3624, "step": 53740 }, { "epoch": 46.58, "learning_rate": 2.7783216783216786e-07, "loss": 0.3705, "step": 53750 }, { "epoch": 46.59, "learning_rate": 2.771328671328671e-07, "loss": 0.3209, "step": 53760 }, { "epoch": 46.59, "learning_rate": 2.764335664335664e-07, "loss": 0.3529, "step": 53770 }, { "epoch": 46.6, "learning_rate": 2.757342657342657e-07, "loss": 0.3359, "step": 53780 }, { "epoch": 46.61, "learning_rate": 2.7503496503496505e-07, "loss": 0.3595, "step": 53790 }, { "epoch": 46.62, "learning_rate": 2.743356643356643e-07, "loss": 0.3597, "step": 53800 }, { "epoch": 46.63, "learning_rate": 2.736363636363636e-07, "loss": 0.3038, "step": 53810 }, { "epoch": 46.64, "learning_rate": 2.729370629370629e-07, "loss": 0.3261, "step": 53820 }, { "epoch": 46.65, "learning_rate": 2.7223776223776224e-07, "loss": 0.3323, "step": 53830 }, { "epoch": 46.65, "learning_rate": 2.7153846153846153e-07, "loss": 0.3983, "step": 53840 }, { "epoch": 46.66, "learning_rate": 2.708391608391608e-07, "loss": 0.373, "step": 53850 }, { "epoch": 46.67, "learning_rate": 2.701398601398601e-07, "loss": 0.3463, "step": 53860 }, { "epoch": 46.68, "learning_rate": 2.6944055944055944e-07, "loss": 0.3492, "step": 53870 }, { "epoch": 46.69, "learning_rate": 2.687412587412587e-07, "loss": 0.3555, "step": 53880 }, { "epoch": 46.7, "learning_rate": 2.68041958041958e-07, "loss": 0.3306, "step": 53890 }, { "epoch": 46.71, "learning_rate": 2.673426573426573e-07, "loss": 0.3866, "step": 53900 }, { "epoch": 46.72, "learning_rate": 2.6664335664335663e-07, "loss": 0.4149, "step": 53910 }, { "epoch": 46.72, "learning_rate": 2.6594405594405597e-07, "loss": 0.4307, "step": 53920 }, { "epoch": 46.73, "learning_rate": 2.6524475524475525e-07, "loss": 0.3798, "step": 53930 }, { "epoch": 46.74, "learning_rate": 2.6454545454545454e-07, "loss": 0.385, "step": 53940 }, { "epoch": 46.75, "learning_rate": 2.638461538461538e-07, "loss": 0.3675, "step": 53950 }, { "epoch": 46.76, "learning_rate": 2.6314685314685316e-07, "loss": 0.3411, "step": 53960 }, { "epoch": 46.77, "learning_rate": 2.6244755244755245e-07, "loss": 0.3486, "step": 53970 }, { "epoch": 46.78, "learning_rate": 2.6174825174825173e-07, "loss": 0.2884, "step": 53980 }, { "epoch": 46.78, "learning_rate": 2.61048951048951e-07, "loss": 0.3276, "step": 53990 }, { "epoch": 46.79, "learning_rate": 2.6034965034965036e-07, "loss": 0.3774, "step": 54000 }, { "epoch": 46.8, "learning_rate": 2.5965034965034964e-07, "loss": 0.3754, "step": 54010 }, { "epoch": 46.81, "learning_rate": 2.58951048951049e-07, "loss": 0.3675, "step": 54020 }, { "epoch": 46.82, "learning_rate": 2.582517482517482e-07, "loss": 0.3309, "step": 54030 }, { "epoch": 46.83, "learning_rate": 2.5755244755244755e-07, "loss": 0.3408, "step": 54040 }, { "epoch": 46.84, "learning_rate": 2.5685314685314684e-07, "loss": 0.334, "step": 54050 }, { "epoch": 46.85, "learning_rate": 2.5615384615384617e-07, "loss": 0.3203, "step": 54060 }, { "epoch": 46.85, "learning_rate": 2.554545454545454e-07, "loss": 0.3555, "step": 54070 }, { "epoch": 46.86, "learning_rate": 2.5475524475524474e-07, "loss": 0.366, "step": 54080 }, { "epoch": 46.87, "learning_rate": 2.5405594405594403e-07, "loss": 0.3755, "step": 54090 }, { "epoch": 46.88, "learning_rate": 2.5335664335664337e-07, "loss": 0.3058, "step": 54100 }, { "epoch": 46.89, "learning_rate": 2.526573426573426e-07, "loss": 0.3177, "step": 54110 }, { "epoch": 46.9, "learning_rate": 2.5195804195804194e-07, "loss": 0.3584, "step": 54120 }, { "epoch": 46.91, "learning_rate": 2.512587412587412e-07, "loss": 0.3873, "step": 54130 }, { "epoch": 46.91, "learning_rate": 2.5055944055944056e-07, "loss": 0.3423, "step": 54140 }, { "epoch": 46.92, "learning_rate": 2.4986013986013985e-07, "loss": 0.3947, "step": 54150 }, { "epoch": 46.93, "learning_rate": 2.491608391608392e-07, "loss": 0.288, "step": 54160 }, { "epoch": 46.94, "learning_rate": 2.4846153846153847e-07, "loss": 0.3879, "step": 54170 }, { "epoch": 46.95, "learning_rate": 2.4776223776223775e-07, "loss": 0.3688, "step": 54180 }, { "epoch": 46.96, "learning_rate": 2.4706293706293704e-07, "loss": 0.2977, "step": 54190 }, { "epoch": 46.97, "learning_rate": 2.463636363636364e-07, "loss": 0.3618, "step": 54200 }, { "epoch": 46.98, "learning_rate": 2.4566433566433566e-07, "loss": 0.3247, "step": 54210 }, { "epoch": 46.98, "learning_rate": 2.4496503496503495e-07, "loss": 0.3606, "step": 54220 }, { "epoch": 46.99, "learning_rate": 2.4426573426573423e-07, "loss": 0.4154, "step": 54230 }, { "epoch": 47.0, "eval_loss": 0.5568397641181946, "eval_runtime": 137.629, "eval_samples_per_second": 3.865, "eval_steps_per_second": 1.933, "eval_wer": 0.24304171755479848, "step": 54238 }, { "epoch": 47.0, "learning_rate": 2.4356643356643357e-07, "loss": 0.3797, "step": 54240 }, { "epoch": 47.01, "learning_rate": 2.4286713286713286e-07, "loss": 0.3366, "step": 54250 }, { "epoch": 47.02, "learning_rate": 2.4216783216783214e-07, "loss": 0.3544, "step": 54260 }, { "epoch": 47.03, "learning_rate": 2.414685314685315e-07, "loss": 0.3364, "step": 54270 }, { "epoch": 47.04, "learning_rate": 2.4076923076923076e-07, "loss": 0.3394, "step": 54280 }, { "epoch": 47.05, "learning_rate": 2.4006993006993005e-07, "loss": 0.3604, "step": 54290 }, { "epoch": 47.05, "learning_rate": 2.3937062937062934e-07, "loss": 0.3669, "step": 54300 }, { "epoch": 47.06, "learning_rate": 2.3867132867132867e-07, "loss": 0.2888, "step": 54310 }, { "epoch": 47.07, "learning_rate": 2.3797202797202796e-07, "loss": 0.3718, "step": 54320 }, { "epoch": 47.08, "learning_rate": 2.3727272727272727e-07, "loss": 0.3313, "step": 54330 }, { "epoch": 47.09, "learning_rate": 2.3657342657342656e-07, "loss": 0.3984, "step": 54340 }, { "epoch": 47.1, "learning_rate": 2.3587412587412587e-07, "loss": 0.3705, "step": 54350 }, { "epoch": 47.11, "learning_rate": 2.3517482517482518e-07, "loss": 0.3335, "step": 54360 }, { "epoch": 47.11, "learning_rate": 2.3447552447552446e-07, "loss": 0.3551, "step": 54370 }, { "epoch": 47.12, "learning_rate": 2.3377622377622378e-07, "loss": 0.3671, "step": 54380 }, { "epoch": 47.13, "learning_rate": 2.3307692307692306e-07, "loss": 0.3905, "step": 54390 }, { "epoch": 47.14, "learning_rate": 2.3237762237762237e-07, "loss": 0.3684, "step": 54400 }, { "epoch": 47.15, "learning_rate": 2.3167832167832166e-07, "loss": 0.3137, "step": 54410 }, { "epoch": 47.16, "learning_rate": 2.3097902097902097e-07, "loss": 0.2697, "step": 54420 }, { "epoch": 47.17, "learning_rate": 2.3027972027972025e-07, "loss": 0.381, "step": 54430 }, { "epoch": 47.17, "learning_rate": 2.2958041958041957e-07, "loss": 0.366, "step": 54440 }, { "epoch": 47.18, "learning_rate": 2.2888111888111888e-07, "loss": 0.3381, "step": 54450 }, { "epoch": 47.19, "learning_rate": 2.2818181818181816e-07, "loss": 0.3675, "step": 54460 }, { "epoch": 47.2, "learning_rate": 2.2748251748251747e-07, "loss": 0.4371, "step": 54470 }, { "epoch": 47.21, "learning_rate": 2.2678321678321676e-07, "loss": 0.3368, "step": 54480 }, { "epoch": 47.22, "learning_rate": 2.2608391608391607e-07, "loss": 0.3477, "step": 54490 }, { "epoch": 47.23, "learning_rate": 2.2538461538461536e-07, "loss": 0.3952, "step": 54500 }, { "epoch": 47.24, "learning_rate": 2.2468531468531467e-07, "loss": 0.382, "step": 54510 }, { "epoch": 47.24, "learning_rate": 2.2398601398601395e-07, "loss": 0.3393, "step": 54520 }, { "epoch": 47.25, "learning_rate": 2.232867132867133e-07, "loss": 0.377, "step": 54530 }, { "epoch": 47.26, "learning_rate": 2.2258741258741258e-07, "loss": 0.3356, "step": 54540 }, { "epoch": 47.27, "learning_rate": 2.218881118881119e-07, "loss": 0.3276, "step": 54550 }, { "epoch": 47.28, "learning_rate": 2.211888111888112e-07, "loss": 0.3384, "step": 54560 }, { "epoch": 47.29, "learning_rate": 2.2048951048951049e-07, "loss": 0.3336, "step": 54570 }, { "epoch": 47.3, "learning_rate": 2.197902097902098e-07, "loss": 0.3849, "step": 54580 }, { "epoch": 47.3, "learning_rate": 2.1909090909090908e-07, "loss": 0.3696, "step": 54590 }, { "epoch": 47.31, "learning_rate": 2.183916083916084e-07, "loss": 0.3393, "step": 54600 }, { "epoch": 47.32, "learning_rate": 2.1769230769230768e-07, "loss": 0.3248, "step": 54610 }, { "epoch": 47.33, "learning_rate": 2.16993006993007e-07, "loss": 0.3582, "step": 54620 }, { "epoch": 47.34, "learning_rate": 2.1629370629370628e-07, "loss": 0.3992, "step": 54630 }, { "epoch": 47.35, "learning_rate": 2.155944055944056e-07, "loss": 0.3919, "step": 54640 }, { "epoch": 47.36, "learning_rate": 2.1489510489510487e-07, "loss": 0.3243, "step": 54650 }, { "epoch": 47.37, "learning_rate": 2.1419580419580418e-07, "loss": 0.3565, "step": 54660 }, { "epoch": 47.37, "learning_rate": 2.134965034965035e-07, "loss": 0.3303, "step": 54670 }, { "epoch": 47.38, "learning_rate": 2.1279720279720278e-07, "loss": 0.379, "step": 54680 }, { "epoch": 47.39, "learning_rate": 2.120979020979021e-07, "loss": 0.3638, "step": 54690 }, { "epoch": 47.4, "learning_rate": 2.1139860139860138e-07, "loss": 0.3546, "step": 54700 }, { "epoch": 47.41, "learning_rate": 2.106993006993007e-07, "loss": 0.3522, "step": 54710 }, { "epoch": 47.42, "learning_rate": 2.0999999999999997e-07, "loss": 0.3087, "step": 54720 }, { "epoch": 47.43, "learning_rate": 2.0930069930069929e-07, "loss": 0.3587, "step": 54730 }, { "epoch": 47.43, "learning_rate": 2.0860139860139857e-07, "loss": 0.3933, "step": 54740 }, { "epoch": 47.44, "learning_rate": 2.0790209790209788e-07, "loss": 0.3762, "step": 54750 }, { "epoch": 47.45, "learning_rate": 2.0720279720279717e-07, "loss": 0.2997, "step": 54760 }, { "epoch": 47.46, "learning_rate": 2.065034965034965e-07, "loss": 0.3557, "step": 54770 }, { "epoch": 47.47, "learning_rate": 2.0580419580419582e-07, "loss": 0.3875, "step": 54780 }, { "epoch": 47.48, "learning_rate": 2.051048951048951e-07, "loss": 0.3961, "step": 54790 }, { "epoch": 47.49, "learning_rate": 2.0440559440559441e-07, "loss": 0.3651, "step": 54800 }, { "epoch": 47.5, "learning_rate": 2.037062937062937e-07, "loss": 0.3966, "step": 54810 }, { "epoch": 47.5, "learning_rate": 2.03006993006993e-07, "loss": 0.3651, "step": 54820 }, { "epoch": 47.51, "learning_rate": 2.023076923076923e-07, "loss": 0.3566, "step": 54830 }, { "epoch": 47.52, "learning_rate": 2.016083916083916e-07, "loss": 0.3443, "step": 54840 }, { "epoch": 47.53, "learning_rate": 2.009090909090909e-07, "loss": 0.3262, "step": 54850 }, { "epoch": 47.54, "learning_rate": 2.002097902097902e-07, "loss": 0.3129, "step": 54860 }, { "epoch": 47.55, "learning_rate": 1.995104895104895e-07, "loss": 0.3609, "step": 54870 }, { "epoch": 47.56, "learning_rate": 1.988111888111888e-07, "loss": 0.2917, "step": 54880 }, { "epoch": 47.56, "learning_rate": 1.9811188811188811e-07, "loss": 0.391, "step": 54890 }, { "epoch": 47.57, "learning_rate": 1.974125874125874e-07, "loss": 0.3483, "step": 54900 }, { "epoch": 47.58, "learning_rate": 1.967132867132867e-07, "loss": 0.3754, "step": 54910 }, { "epoch": 47.59, "learning_rate": 1.96013986013986e-07, "loss": 0.3642, "step": 54920 }, { "epoch": 47.6, "learning_rate": 1.953146853146853e-07, "loss": 0.3519, "step": 54930 }, { "epoch": 47.61, "learning_rate": 1.946153846153846e-07, "loss": 0.4031, "step": 54940 }, { "epoch": 47.62, "learning_rate": 1.939160839160839e-07, "loss": 0.3196, "step": 54950 }, { "epoch": 47.63, "learning_rate": 1.932167832167832e-07, "loss": 0.3574, "step": 54960 }, { "epoch": 47.63, "learning_rate": 1.925174825174825e-07, "loss": 0.342, "step": 54970 }, { "epoch": 47.64, "learning_rate": 1.9181818181818179e-07, "loss": 0.3426, "step": 54980 }, { "epoch": 47.65, "learning_rate": 1.911188811188811e-07, "loss": 0.3166, "step": 54990 }, { "epoch": 47.66, "learning_rate": 1.904195804195804e-07, "loss": 0.3258, "step": 55000 }, { "epoch": 47.67, "learning_rate": 1.897202797202797e-07, "loss": 0.3332, "step": 55010 }, { "epoch": 47.68, "learning_rate": 1.8902097902097903e-07, "loss": 0.3769, "step": 55020 }, { "epoch": 47.69, "learning_rate": 1.8832167832167832e-07, "loss": 0.4165, "step": 55030 }, { "epoch": 47.69, "learning_rate": 1.8769230769230767e-07, "loss": 0.3893, "step": 55040 }, { "epoch": 47.7, "learning_rate": 1.8699300699300699e-07, "loss": 0.3782, "step": 55050 }, { "epoch": 47.71, "learning_rate": 1.8629370629370627e-07, "loss": 0.3125, "step": 55060 }, { "epoch": 47.72, "learning_rate": 1.8559440559440558e-07, "loss": 0.3644, "step": 55070 }, { "epoch": 47.73, "learning_rate": 1.8489510489510487e-07, "loss": 0.339, "step": 55080 }, { "epoch": 47.74, "learning_rate": 1.8419580419580418e-07, "loss": 0.3563, "step": 55090 }, { "epoch": 47.75, "learning_rate": 1.834965034965035e-07, "loss": 0.3465, "step": 55100 }, { "epoch": 47.76, "learning_rate": 1.8279720279720278e-07, "loss": 0.3255, "step": 55110 }, { "epoch": 47.76, "learning_rate": 1.820979020979021e-07, "loss": 0.3639, "step": 55120 }, { "epoch": 47.77, "learning_rate": 1.8139860139860137e-07, "loss": 0.3893, "step": 55130 }, { "epoch": 47.78, "learning_rate": 1.806993006993007e-07, "loss": 0.3311, "step": 55140 }, { "epoch": 47.79, "learning_rate": 1.8e-07, "loss": 0.3554, "step": 55150 }, { "epoch": 47.8, "learning_rate": 1.793006993006993e-07, "loss": 0.3587, "step": 55160 }, { "epoch": 47.81, "learning_rate": 1.786013986013986e-07, "loss": 0.301, "step": 55170 }, { "epoch": 47.82, "learning_rate": 1.779020979020979e-07, "loss": 0.3313, "step": 55180 }, { "epoch": 47.82, "learning_rate": 1.772027972027972e-07, "loss": 0.3896, "step": 55190 }, { "epoch": 47.83, "learning_rate": 1.765034965034965e-07, "loss": 0.3046, "step": 55200 }, { "epoch": 47.84, "learning_rate": 1.7580419580419581e-07, "loss": 0.3305, "step": 55210 }, { "epoch": 47.85, "learning_rate": 1.751048951048951e-07, "loss": 0.3427, "step": 55220 }, { "epoch": 47.86, "learning_rate": 1.744055944055944e-07, "loss": 0.3899, "step": 55230 }, { "epoch": 47.87, "learning_rate": 1.737062937062937e-07, "loss": 0.3873, "step": 55240 }, { "epoch": 47.88, "learning_rate": 1.73006993006993e-07, "loss": 0.3425, "step": 55250 }, { "epoch": 47.89, "learning_rate": 1.723076923076923e-07, "loss": 0.3016, "step": 55260 }, { "epoch": 47.89, "learning_rate": 1.716083916083916e-07, "loss": 0.3186, "step": 55270 }, { "epoch": 47.9, "learning_rate": 1.709090909090909e-07, "loss": 0.3615, "step": 55280 }, { "epoch": 47.91, "learning_rate": 1.702097902097902e-07, "loss": 0.3495, "step": 55290 }, { "epoch": 47.92, "learning_rate": 1.6951048951048949e-07, "loss": 0.317, "step": 55300 }, { "epoch": 47.93, "learning_rate": 1.688111888111888e-07, "loss": 0.4341, "step": 55310 }, { "epoch": 47.94, "learning_rate": 1.681118881118881e-07, "loss": 0.3467, "step": 55320 }, { "epoch": 47.95, "learning_rate": 1.674125874125874e-07, "loss": 0.3802, "step": 55330 }, { "epoch": 47.95, "learning_rate": 1.667132867132867e-07, "loss": 0.3541, "step": 55340 }, { "epoch": 47.96, "learning_rate": 1.66013986013986e-07, "loss": 0.3015, "step": 55350 }, { "epoch": 47.97, "learning_rate": 1.653146853146853e-07, "loss": 0.3601, "step": 55360 }, { "epoch": 47.98, "learning_rate": 1.646153846153846e-07, "loss": 0.3906, "step": 55370 }, { "epoch": 47.99, "learning_rate": 1.6391608391608393e-07, "loss": 0.3486, "step": 55380 }, { "epoch": 48.0, "learning_rate": 1.632167832167832e-07, "loss": 0.3158, "step": 55390 }, { "epoch": 48.0, "eval_loss": 0.560836672782898, "eval_runtime": 134.7766, "eval_samples_per_second": 3.947, "eval_steps_per_second": 1.974, "eval_wer": 0.24284887831844185, "step": 55392 }, { "epoch": 48.01, "learning_rate": 1.6251748251748252e-07, "loss": 0.3843, "step": 55400 }, { "epoch": 48.02, "learning_rate": 1.618181818181818e-07, "loss": 0.4182, "step": 55410 }, { "epoch": 48.02, "learning_rate": 1.6111888111888112e-07, "loss": 0.2969, "step": 55420 }, { "epoch": 48.03, "learning_rate": 1.6041958041958043e-07, "loss": 0.3782, "step": 55430 }, { "epoch": 48.04, "learning_rate": 1.5972027972027972e-07, "loss": 0.3769, "step": 55440 }, { "epoch": 48.05, "learning_rate": 1.5902097902097903e-07, "loss": 0.3307, "step": 55450 }, { "epoch": 48.06, "learning_rate": 1.5832167832167831e-07, "loss": 0.3369, "step": 55460 }, { "epoch": 48.07, "learning_rate": 1.5762237762237763e-07, "loss": 0.3782, "step": 55470 }, { "epoch": 48.08, "learning_rate": 1.569230769230769e-07, "loss": 0.389, "step": 55480 }, { "epoch": 48.08, "learning_rate": 1.5622377622377622e-07, "loss": 0.3859, "step": 55490 }, { "epoch": 48.09, "learning_rate": 1.555244755244755e-07, "loss": 0.3444, "step": 55500 }, { "epoch": 48.1, "learning_rate": 1.5482517482517482e-07, "loss": 0.3688, "step": 55510 }, { "epoch": 48.11, "learning_rate": 1.541258741258741e-07, "loss": 0.3124, "step": 55520 }, { "epoch": 48.12, "learning_rate": 1.5342657342657342e-07, "loss": 0.303, "step": 55530 }, { "epoch": 48.13, "learning_rate": 1.5272727272727273e-07, "loss": 0.3582, "step": 55540 }, { "epoch": 48.14, "learning_rate": 1.5202797202797201e-07, "loss": 0.351, "step": 55550 }, { "epoch": 48.15, "learning_rate": 1.5132867132867132e-07, "loss": 0.41, "step": 55560 }, { "epoch": 48.15, "learning_rate": 1.506293706293706e-07, "loss": 0.3245, "step": 55570 }, { "epoch": 48.16, "learning_rate": 1.4993006993006992e-07, "loss": 0.3326, "step": 55580 }, { "epoch": 48.17, "learning_rate": 1.492307692307692e-07, "loss": 0.3845, "step": 55590 }, { "epoch": 48.18, "learning_rate": 1.4853146853146852e-07, "loss": 0.3734, "step": 55600 }, { "epoch": 48.19, "learning_rate": 1.478321678321678e-07, "loss": 0.3646, "step": 55610 }, { "epoch": 48.2, "learning_rate": 1.4713286713286712e-07, "loss": 0.3872, "step": 55620 }, { "epoch": 48.21, "learning_rate": 1.464335664335664e-07, "loss": 0.4069, "step": 55630 }, { "epoch": 48.21, "learning_rate": 1.4573426573426574e-07, "loss": 0.4001, "step": 55640 }, { "epoch": 48.22, "learning_rate": 1.4503496503496505e-07, "loss": 0.3788, "step": 55650 }, { "epoch": 48.23, "learning_rate": 1.4433566433566434e-07, "loss": 0.3732, "step": 55660 }, { "epoch": 48.24, "learning_rate": 1.4363636363636365e-07, "loss": 0.3641, "step": 55670 }, { "epoch": 48.25, "learning_rate": 1.4293706293706293e-07, "loss": 0.3531, "step": 55680 }, { "epoch": 48.26, "learning_rate": 1.4223776223776224e-07, "loss": 0.3396, "step": 55690 }, { "epoch": 48.27, "learning_rate": 1.4153846153846153e-07, "loss": 0.379, "step": 55700 }, { "epoch": 48.28, "learning_rate": 1.4083916083916084e-07, "loss": 0.3456, "step": 55710 }, { "epoch": 48.28, "learning_rate": 1.4013986013986013e-07, "loss": 0.2917, "step": 55720 }, { "epoch": 48.29, "learning_rate": 1.3944055944055944e-07, "loss": 0.3777, "step": 55730 }, { "epoch": 48.3, "learning_rate": 1.3874125874125875e-07, "loss": 0.3455, "step": 55740 }, { "epoch": 48.31, "learning_rate": 1.3804195804195803e-07, "loss": 0.3494, "step": 55750 }, { "epoch": 48.32, "learning_rate": 1.3734265734265735e-07, "loss": 0.3303, "step": 55760 }, { "epoch": 48.33, "learning_rate": 1.3664335664335663e-07, "loss": 0.3415, "step": 55770 }, { "epoch": 48.34, "learning_rate": 1.3594405594405594e-07, "loss": 0.3074, "step": 55780 }, { "epoch": 48.34, "learning_rate": 1.3524475524475523e-07, "loss": 0.4096, "step": 55790 }, { "epoch": 48.35, "learning_rate": 1.3454545454545454e-07, "loss": 0.3875, "step": 55800 }, { "epoch": 48.36, "learning_rate": 1.3384615384615383e-07, "loss": 0.344, "step": 55810 }, { "epoch": 48.37, "learning_rate": 1.3314685314685314e-07, "loss": 0.2696, "step": 55820 }, { "epoch": 48.38, "learning_rate": 1.3244755244755242e-07, "loss": 0.339, "step": 55830 }, { "epoch": 48.39, "learning_rate": 1.3174825174825173e-07, "loss": 0.354, "step": 55840 }, { "epoch": 48.4, "learning_rate": 1.3104895104895105e-07, "loss": 0.3863, "step": 55850 }, { "epoch": 48.41, "learning_rate": 1.3034965034965033e-07, "loss": 0.3484, "step": 55860 }, { "epoch": 48.41, "learning_rate": 1.2965034965034964e-07, "loss": 0.4278, "step": 55870 }, { "epoch": 48.42, "learning_rate": 1.2895104895104895e-07, "loss": 0.3246, "step": 55880 }, { "epoch": 48.43, "learning_rate": 1.2825174825174827e-07, "loss": 0.3766, "step": 55890 }, { "epoch": 48.44, "learning_rate": 1.2755244755244755e-07, "loss": 0.3238, "step": 55900 }, { "epoch": 48.45, "learning_rate": 1.2685314685314686e-07, "loss": 0.4097, "step": 55910 }, { "epoch": 48.46, "learning_rate": 1.2615384615384615e-07, "loss": 0.3207, "step": 55920 }, { "epoch": 48.47, "learning_rate": 1.2545454545454546e-07, "loss": 0.3636, "step": 55930 }, { "epoch": 48.47, "learning_rate": 1.2475524475524474e-07, "loss": 0.359, "step": 55940 }, { "epoch": 48.48, "learning_rate": 1.2405594405594406e-07, "loss": 0.3375, "step": 55950 }, { "epoch": 48.49, "learning_rate": 1.2335664335664334e-07, "loss": 0.3635, "step": 55960 }, { "epoch": 48.5, "learning_rate": 1.2265734265734265e-07, "loss": 0.2793, "step": 55970 }, { "epoch": 48.51, "learning_rate": 1.2195804195804194e-07, "loss": 0.41, "step": 55980 }, { "epoch": 48.52, "learning_rate": 1.2125874125874125e-07, "loss": 0.39, "step": 55990 }, { "epoch": 48.53, "learning_rate": 1.2055944055944053e-07, "loss": 0.3814, "step": 56000 }, { "epoch": 48.54, "learning_rate": 1.1986013986013987e-07, "loss": 0.3057, "step": 56010 }, { "epoch": 48.54, "learning_rate": 1.1916083916083916e-07, "loss": 0.3332, "step": 56020 }, { "epoch": 48.55, "learning_rate": 1.1846153846153846e-07, "loss": 0.3852, "step": 56030 }, { "epoch": 48.56, "learning_rate": 1.1776223776223775e-07, "loss": 0.4011, "step": 56040 }, { "epoch": 48.57, "learning_rate": 1.1706293706293705e-07, "loss": 0.3123, "step": 56050 }, { "epoch": 48.58, "learning_rate": 1.1636363636363636e-07, "loss": 0.3529, "step": 56060 }, { "epoch": 48.59, "learning_rate": 1.1566433566433566e-07, "loss": 0.3336, "step": 56070 }, { "epoch": 48.6, "learning_rate": 1.1496503496503496e-07, "loss": 0.3159, "step": 56080 }, { "epoch": 48.6, "learning_rate": 1.1426573426573426e-07, "loss": 0.3929, "step": 56090 }, { "epoch": 48.61, "learning_rate": 1.1356643356643356e-07, "loss": 0.3498, "step": 56100 }, { "epoch": 48.62, "learning_rate": 1.1286713286713286e-07, "loss": 0.3591, "step": 56110 }, { "epoch": 48.63, "learning_rate": 1.1216783216783217e-07, "loss": 0.3466, "step": 56120 }, { "epoch": 48.64, "learning_rate": 1.1146853146853147e-07, "loss": 0.3921, "step": 56130 }, { "epoch": 48.65, "learning_rate": 1.1076923076923077e-07, "loss": 0.42, "step": 56140 }, { "epoch": 48.66, "learning_rate": 1.1006993006993006e-07, "loss": 0.3855, "step": 56150 }, { "epoch": 48.67, "learning_rate": 1.0937062937062936e-07, "loss": 0.3384, "step": 56160 }, { "epoch": 48.67, "learning_rate": 1.0867132867132866e-07, "loss": 0.3103, "step": 56170 }, { "epoch": 48.68, "learning_rate": 1.0797202797202796e-07, "loss": 0.3521, "step": 56180 }, { "epoch": 48.69, "learning_rate": 1.0727272727272727e-07, "loss": 0.3497, "step": 56190 }, { "epoch": 48.7, "learning_rate": 1.0657342657342657e-07, "loss": 0.371, "step": 56200 }, { "epoch": 48.71, "learning_rate": 1.0587412587412587e-07, "loss": 0.324, "step": 56210 }, { "epoch": 48.72, "learning_rate": 1.0517482517482518e-07, "loss": 0.3263, "step": 56220 }, { "epoch": 48.73, "learning_rate": 1.0447552447552448e-07, "loss": 0.3513, "step": 56230 }, { "epoch": 48.73, "learning_rate": 1.0377622377622378e-07, "loss": 0.3406, "step": 56240 }, { "epoch": 48.74, "learning_rate": 1.0307692307692307e-07, "loss": 0.3813, "step": 56250 }, { "epoch": 48.75, "learning_rate": 1.0237762237762237e-07, "loss": 0.391, "step": 56260 }, { "epoch": 48.76, "learning_rate": 1.0167832167832167e-07, "loss": 0.3442, "step": 56270 }, { "epoch": 48.77, "learning_rate": 1.0097902097902097e-07, "loss": 0.375, "step": 56280 }, { "epoch": 48.78, "learning_rate": 1.0027972027972027e-07, "loss": 0.3793, "step": 56290 }, { "epoch": 48.79, "learning_rate": 9.958041958041957e-08, "loss": 0.31, "step": 56300 }, { "epoch": 48.8, "learning_rate": 9.888111888111888e-08, "loss": 0.3603, "step": 56310 }, { "epoch": 48.8, "learning_rate": 9.818181818181818e-08, "loss": 0.3785, "step": 56320 }, { "epoch": 48.81, "learning_rate": 9.748251748251749e-08, "loss": 0.3666, "step": 56330 }, { "epoch": 48.82, "learning_rate": 9.678321678321679e-08, "loss": 0.3912, "step": 56340 }, { "epoch": 48.83, "learning_rate": 9.608391608391609e-08, "loss": 0.3119, "step": 56350 }, { "epoch": 48.84, "learning_rate": 9.538461538461538e-08, "loss": 0.3483, "step": 56360 }, { "epoch": 48.85, "learning_rate": 9.468531468531468e-08, "loss": 0.3031, "step": 56370 }, { "epoch": 48.86, "learning_rate": 9.398601398601398e-08, "loss": 0.3225, "step": 56380 }, { "epoch": 48.86, "learning_rate": 9.328671328671328e-08, "loss": 0.3636, "step": 56390 }, { "epoch": 48.87, "learning_rate": 9.258741258741258e-08, "loss": 0.2924, "step": 56400 }, { "epoch": 48.88, "learning_rate": 9.188811188811188e-08, "loss": 0.333, "step": 56410 }, { "epoch": 48.89, "learning_rate": 9.118881118881117e-08, "loss": 0.3425, "step": 56420 }, { "epoch": 48.9, "learning_rate": 9.048951048951047e-08, "loss": 0.3841, "step": 56430 }, { "epoch": 48.91, "learning_rate": 8.97902097902098e-08, "loss": 0.3724, "step": 56440 }, { "epoch": 48.92, "learning_rate": 8.90909090909091e-08, "loss": 0.3315, "step": 56450 }, { "epoch": 48.93, "learning_rate": 8.83916083916084e-08, "loss": 0.3965, "step": 56460 }, { "epoch": 48.93, "learning_rate": 8.769230769230769e-08, "loss": 0.3083, "step": 56470 }, { "epoch": 48.94, "learning_rate": 8.699300699300699e-08, "loss": 0.3607, "step": 56480 }, { "epoch": 48.95, "learning_rate": 8.629370629370629e-08, "loss": 0.3723, "step": 56490 }, { "epoch": 48.96, "learning_rate": 8.559440559440559e-08, "loss": 0.388, "step": 56500 }, { "epoch": 48.97, "learning_rate": 8.489510489510489e-08, "loss": 0.3396, "step": 56510 }, { "epoch": 48.98, "learning_rate": 8.419580419580418e-08, "loss": 0.2864, "step": 56520 }, { "epoch": 48.99, "learning_rate": 8.349650349650348e-08, "loss": 0.3396, "step": 56530 }, { "epoch": 48.99, "learning_rate": 8.27972027972028e-08, "loss": 0.3577, "step": 56540 }, { "epoch": 49.0, "eval_loss": 0.5593469738960266, "eval_runtime": 135.5272, "eval_samples_per_second": 3.925, "eval_steps_per_second": 1.963, "eval_wer": 0.24117760493668444, "step": 56546 }, { "epoch": 49.0, "learning_rate": 8.209790209790209e-08, "loss": 0.3164, "step": 56550 }, { "epoch": 49.01, "learning_rate": 8.13986013986014e-08, "loss": 0.3259, "step": 56560 }, { "epoch": 49.02, "learning_rate": 8.06993006993007e-08, "loss": 0.3391, "step": 56570 }, { "epoch": 49.03, "learning_rate": 8e-08, "loss": 0.3855, "step": 56580 }, { "epoch": 49.04, "learning_rate": 7.93006993006993e-08, "loss": 0.3719, "step": 56590 }, { "epoch": 49.05, "learning_rate": 7.86013986013986e-08, "loss": 0.3446, "step": 56600 }, { "epoch": 49.06, "learning_rate": 7.79020979020979e-08, "loss": 0.291, "step": 56610 }, { "epoch": 49.06, "learning_rate": 7.72027972027972e-08, "loss": 0.3151, "step": 56620 }, { "epoch": 49.07, "learning_rate": 7.65034965034965e-08, "loss": 0.3284, "step": 56630 }, { "epoch": 49.08, "learning_rate": 7.580419580419579e-08, "loss": 0.386, "step": 56640 }, { "epoch": 49.09, "learning_rate": 7.51048951048951e-08, "loss": 0.3983, "step": 56650 }, { "epoch": 49.1, "learning_rate": 7.44055944055944e-08, "loss": 0.4279, "step": 56660 }, { "epoch": 49.11, "learning_rate": 7.37062937062937e-08, "loss": 0.3545, "step": 56670 }, { "epoch": 49.12, "learning_rate": 7.300699300699301e-08, "loss": 0.3488, "step": 56680 }, { "epoch": 49.12, "learning_rate": 7.230769230769231e-08, "loss": 0.336, "step": 56690 }, { "epoch": 49.13, "learning_rate": 7.160839160839161e-08, "loss": 0.2867, "step": 56700 }, { "epoch": 49.14, "learning_rate": 7.090909090909091e-08, "loss": 0.3295, "step": 56710 }, { "epoch": 49.15, "learning_rate": 7.02097902097902e-08, "loss": 0.3409, "step": 56720 }, { "epoch": 49.16, "learning_rate": 6.95104895104895e-08, "loss": 0.3139, "step": 56730 }, { "epoch": 49.17, "learning_rate": 6.88111888111888e-08, "loss": 0.3372, "step": 56740 }, { "epoch": 49.18, "learning_rate": 6.81118881118881e-08, "loss": 0.3601, "step": 56750 }, { "epoch": 49.19, "learning_rate": 6.741258741258741e-08, "loss": 0.4306, "step": 56760 }, { "epoch": 49.19, "learning_rate": 6.671328671328671e-08, "loss": 0.3192, "step": 56770 }, { "epoch": 49.2, "learning_rate": 6.601398601398601e-08, "loss": 0.4052, "step": 56780 }, { "epoch": 49.21, "learning_rate": 6.531468531468531e-08, "loss": 0.3666, "step": 56790 }, { "epoch": 49.22, "learning_rate": 6.461538461538462e-08, "loss": 0.3323, "step": 56800 }, { "epoch": 49.23, "learning_rate": 6.391608391608392e-08, "loss": 0.3665, "step": 56810 }, { "epoch": 49.24, "learning_rate": 6.321678321678322e-08, "loss": 0.3556, "step": 56820 }, { "epoch": 49.25, "learning_rate": 6.251748251748252e-08, "loss": 0.3442, "step": 56830 }, { "epoch": 49.25, "learning_rate": 6.181818181818181e-08, "loss": 0.3433, "step": 56840 }, { "epoch": 49.26, "learning_rate": 6.111888111888111e-08, "loss": 0.2919, "step": 56850 }, { "epoch": 49.27, "learning_rate": 6.041958041958041e-08, "loss": 0.3386, "step": 56860 }, { "epoch": 49.28, "learning_rate": 5.972027972027972e-08, "loss": 0.3452, "step": 56870 }, { "epoch": 49.29, "learning_rate": 5.9020979020979014e-08, "loss": 0.3379, "step": 56880 }, { "epoch": 49.3, "learning_rate": 5.832167832167832e-08, "loss": 0.3258, "step": 56890 }, { "epoch": 49.31, "learning_rate": 5.7622377622377624e-08, "loss": 0.4041, "step": 56900 }, { "epoch": 49.32, "learning_rate": 5.692307692307692e-08, "loss": 0.3279, "step": 56910 }, { "epoch": 49.32, "learning_rate": 5.622377622377622e-08, "loss": 0.3576, "step": 56920 }, { "epoch": 49.33, "learning_rate": 5.552447552447552e-08, "loss": 0.31, "step": 56930 }, { "epoch": 49.34, "learning_rate": 5.4825174825174824e-08, "loss": 0.3643, "step": 56940 }, { "epoch": 49.35, "learning_rate": 5.412587412587412e-08, "loss": 0.368, "step": 56950 }, { "epoch": 49.36, "learning_rate": 5.342657342657343e-08, "loss": 0.3732, "step": 56960 }, { "epoch": 49.37, "learning_rate": 5.2727272727272726e-08, "loss": 0.3594, "step": 56970 }, { "epoch": 49.38, "learning_rate": 5.2027972027972024e-08, "loss": 0.3388, "step": 56980 }, { "epoch": 49.38, "learning_rate": 5.132867132867132e-08, "loss": 0.4067, "step": 56990 }, { "epoch": 49.39, "learning_rate": 5.062937062937063e-08, "loss": 0.3645, "step": 57000 }, { "epoch": 49.4, "learning_rate": 4.9930069930069926e-08, "loss": 0.387, "step": 57010 }, { "epoch": 49.41, "learning_rate": 4.923076923076923e-08, "loss": 0.347, "step": 57020 }, { "epoch": 49.42, "learning_rate": 4.853146853146853e-08, "loss": 0.3459, "step": 57030 }, { "epoch": 49.43, "learning_rate": 4.783216783216783e-08, "loss": 0.3654, "step": 57040 }, { "epoch": 49.44, "learning_rate": 4.713286713286713e-08, "loss": 0.3412, "step": 57050 }, { "epoch": 49.45, "learning_rate": 4.643356643356643e-08, "loss": 0.3725, "step": 57060 }, { "epoch": 49.45, "learning_rate": 4.573426573426573e-08, "loss": 0.2922, "step": 57070 }, { "epoch": 49.46, "learning_rate": 4.5034965034965035e-08, "loss": 0.3583, "step": 57080 }, { "epoch": 49.47, "learning_rate": 4.4335664335664333e-08, "loss": 0.3585, "step": 57090 }, { "epoch": 49.48, "learning_rate": 4.363636363636364e-08, "loss": 0.3408, "step": 57100 }, { "epoch": 49.49, "learning_rate": 4.293706293706294e-08, "loss": 0.3853, "step": 57110 }, { "epoch": 49.5, "learning_rate": 4.2237762237762235e-08, "loss": 0.323, "step": 57120 }, { "epoch": 49.51, "learning_rate": 4.1538461538461534e-08, "loss": 0.3322, "step": 57130 }, { "epoch": 49.51, "learning_rate": 4.083916083916084e-08, "loss": 0.3715, "step": 57140 }, { "epoch": 49.52, "learning_rate": 4.013986013986014e-08, "loss": 0.3399, "step": 57150 }, { "epoch": 49.53, "learning_rate": 3.944055944055944e-08, "loss": 0.3108, "step": 57160 }, { "epoch": 49.54, "learning_rate": 3.874125874125874e-08, "loss": 0.3839, "step": 57170 }, { "epoch": 49.55, "learning_rate": 3.804195804195804e-08, "loss": 0.3441, "step": 57180 }, { "epoch": 49.56, "learning_rate": 3.734265734265734e-08, "loss": 0.3805, "step": 57190 }, { "epoch": 49.57, "learning_rate": 3.6643356643356636e-08, "loss": 0.357, "step": 57200 }, { "epoch": 49.58, "learning_rate": 3.594405594405595e-08, "loss": 0.3623, "step": 57210 }, { "epoch": 49.58, "learning_rate": 3.5244755244755246e-08, "loss": 0.3106, "step": 57220 }, { "epoch": 49.59, "learning_rate": 3.4545454545454544e-08, "loss": 0.3441, "step": 57230 }, { "epoch": 49.6, "learning_rate": 3.384615384615384e-08, "loss": 0.3801, "step": 57240 }, { "epoch": 49.61, "learning_rate": 3.314685314685314e-08, "loss": 0.4127, "step": 57250 }, { "epoch": 49.62, "learning_rate": 3.2447552447552446e-08, "loss": 0.3755, "step": 57260 }, { "epoch": 49.63, "learning_rate": 3.174825174825175e-08, "loss": 0.3613, "step": 57270 }, { "epoch": 49.64, "learning_rate": 3.104895104895105e-08, "loss": 0.3935, "step": 57280 }, { "epoch": 49.64, "learning_rate": 3.034965034965035e-08, "loss": 0.398, "step": 57290 }, { "epoch": 49.65, "learning_rate": 2.965034965034965e-08, "loss": 0.3381, "step": 57300 }, { "epoch": 49.66, "learning_rate": 2.895104895104895e-08, "loss": 0.3744, "step": 57310 }, { "epoch": 49.67, "learning_rate": 2.825174825174825e-08, "loss": 0.354, "step": 57320 }, { "epoch": 49.68, "learning_rate": 2.7552447552447552e-08, "loss": 0.3696, "step": 57330 }, { "epoch": 49.69, "learning_rate": 2.6853146853146853e-08, "loss": 0.351, "step": 57340 }, { "epoch": 49.7, "learning_rate": 2.6153846153846152e-08, "loss": 0.3758, "step": 57350 }, { "epoch": 49.71, "learning_rate": 2.5454545454545454e-08, "loss": 0.3705, "step": 57360 }, { "epoch": 49.71, "learning_rate": 2.4755244755244755e-08, "loss": 0.3173, "step": 57370 }, { "epoch": 49.72, "learning_rate": 2.4055944055944057e-08, "loss": 0.3319, "step": 57380 }, { "epoch": 49.73, "learning_rate": 2.3356643356643355e-08, "loss": 0.3558, "step": 57390 }, { "epoch": 49.74, "learning_rate": 2.2657342657342654e-08, "loss": 0.3602, "step": 57400 }, { "epoch": 49.75, "learning_rate": 2.195804195804196e-08, "loss": 0.3973, "step": 57410 }, { "epoch": 49.76, "learning_rate": 2.1258741258741257e-08, "loss": 0.3605, "step": 57420 }, { "epoch": 49.77, "learning_rate": 2.0559440559440556e-08, "loss": 0.3571, "step": 57430 }, { "epoch": 49.77, "learning_rate": 1.986013986013986e-08, "loss": 0.3679, "step": 57440 }, { "epoch": 49.78, "learning_rate": 1.916083916083916e-08, "loss": 0.3385, "step": 57450 }, { "epoch": 49.79, "learning_rate": 1.846153846153846e-08, "loss": 0.3208, "step": 57460 }, { "epoch": 49.8, "learning_rate": 1.7762237762237763e-08, "loss": 0.3961, "step": 57470 }, { "epoch": 49.81, "learning_rate": 1.706293706293706e-08, "loss": 0.4047, "step": 57480 }, { "epoch": 49.82, "learning_rate": 1.6363636363636363e-08, "loss": 0.417, "step": 57490 }, { "epoch": 49.83, "learning_rate": 1.5664335664335665e-08, "loss": 0.3229, "step": 57500 }, { "epoch": 49.83, "learning_rate": 1.4965034965034966e-08, "loss": 0.3654, "step": 57510 }, { "epoch": 49.84, "learning_rate": 1.4265734265734266e-08, "loss": 0.3457, "step": 57520 }, { "epoch": 49.85, "learning_rate": 1.3566433566433565e-08, "loss": 0.2899, "step": 57530 }, { "epoch": 49.86, "learning_rate": 1.2867132867132866e-08, "loss": 0.3838, "step": 57540 }, { "epoch": 49.87, "learning_rate": 1.2167832167832168e-08, "loss": 0.3387, "step": 57550 }, { "epoch": 49.88, "learning_rate": 1.1468531468531468e-08, "loss": 0.3008, "step": 57560 }, { "epoch": 49.89, "learning_rate": 1.0769230769230768e-08, "loss": 0.3183, "step": 57570 }, { "epoch": 49.9, "learning_rate": 1.006993006993007e-08, "loss": 0.3564, "step": 57580 }, { "epoch": 49.9, "learning_rate": 9.37062937062937e-09, "loss": 0.394, "step": 57590 }, { "epoch": 49.91, "learning_rate": 8.671328671328672e-09, "loss": 0.3434, "step": 57600 }, { "epoch": 49.92, "learning_rate": 7.972027972027972e-09, "loss": 0.3544, "step": 57610 }, { "epoch": 49.93, "learning_rate": 7.272727272727273e-09, "loss": 0.3326, "step": 57620 }, { "epoch": 49.94, "learning_rate": 6.573426573426574e-09, "loss": 0.3242, "step": 57630 }, { "epoch": 49.95, "learning_rate": 5.874125874125874e-09, "loss": 0.3569, "step": 57640 }, { "epoch": 49.96, "learning_rate": 5.174825174825175e-09, "loss": 0.3385, "step": 57650 }, { "epoch": 49.96, "learning_rate": 4.4755244755244756e-09, "loss": 0.3149, "step": 57660 }, { "epoch": 49.97, "learning_rate": 3.776223776223776e-09, "loss": 0.3932, "step": 57670 }, { "epoch": 49.98, "learning_rate": 3.076923076923077e-09, "loss": 0.3831, "step": 57680 }, { "epoch": 49.99, "learning_rate": 2.3776223776223774e-09, "loss": 0.3698, "step": 57690 }, { "epoch": 50.0, "learning_rate": 1.6783216783216783e-09, "loss": 0.3456, "step": 57700 }, { "epoch": 50.0, "eval_loss": 0.5582728385925293, "eval_runtime": 137.2226, "eval_samples_per_second": 3.877, "eval_steps_per_second": 1.938, "eval_wer": 0.24034196824580575, "step": 57700 }, { "epoch": 50.0, "step": 57700, "total_flos": 1.359460060199037e+20, "train_loss": 0.38523074480235264, "train_runtime": 114469.7461, "train_samples_per_second": 2.017, "train_steps_per_second": 0.504 } ], "max_steps": 57700, "num_train_epochs": 50, "total_flos": 1.359460060199037e+20, "trial_name": null, "trial_params": null }