{ "best_metric": 0.46595197916030884, "best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v2/checkpoint-3672", "epoch": 499.9965397923875, "global_step": 36000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.14, "learning_rate": 4.0000000000000003e-07, "loss": 0.4405, "step": 10 }, { "epoch": 0.28, "learning_rate": 7.6e-07, "loss": 0.4517, "step": 20 }, { "epoch": 0.42, "learning_rate": 1.1600000000000001e-06, "loss": 0.4412, "step": 30 }, { "epoch": 0.55, "learning_rate": 1.56e-06, "loss": 0.4446, "step": 40 }, { "epoch": 0.69, "learning_rate": 1.9600000000000003e-06, "loss": 0.4364, "step": 50 }, { "epoch": 0.83, "learning_rate": 2.3600000000000003e-06, "loss": 0.4273, "step": 60 }, { "epoch": 0.97, "learning_rate": 2.7600000000000003e-06, "loss": 0.4528, "step": 70 }, { "epoch": 1.0, "eval_loss": 0.4859951138496399, "eval_runtime": 127.812, "eval_samples_per_second": 4.162, "eval_steps_per_second": 0.524, "eval_wer": 0.22356495468277945, "step": 72 }, { "epoch": 1.11, "learning_rate": 3.1600000000000002e-06, "loss": 0.4443, "step": 80 }, { "epoch": 1.25, "learning_rate": 3.52e-06, "loss": 0.4371, "step": 90 }, { "epoch": 1.39, "learning_rate": 3.920000000000001e-06, "loss": 0.4287, "step": 100 }, { "epoch": 1.53, "learning_rate": 4.32e-06, "loss": 0.4345, "step": 110 }, { "epoch": 1.66, "learning_rate": 4.7200000000000005e-06, "loss": 0.4413, "step": 120 }, { "epoch": 1.8, "learning_rate": 5.12e-06, "loss": 0.4489, "step": 130 }, { "epoch": 1.94, "learning_rate": 5.5200000000000005e-06, "loss": 0.4403, "step": 140 }, { "epoch": 2.0, "eval_loss": 0.48137664794921875, "eval_runtime": 128.1242, "eval_samples_per_second": 4.152, "eval_steps_per_second": 0.523, "eval_wer": 0.22221508002828308, "step": 144 }, { "epoch": 2.08, "learning_rate": 5.92e-06, "loss": 0.4438, "step": 150 }, { "epoch": 2.22, "learning_rate": 6.3200000000000005e-06, "loss": 0.4393, "step": 160 }, { "epoch": 2.36, "learning_rate": 6.720000000000001e-06, "loss": 0.4379, "step": 170 }, { "epoch": 2.5, "learning_rate": 7.1200000000000004e-06, "loss": 0.4294, "step": 180 }, { "epoch": 2.64, "learning_rate": 7.520000000000001e-06, "loss": 0.4214, "step": 190 }, { "epoch": 2.78, "learning_rate": 7.92e-06, "loss": 0.44, "step": 200 }, { "epoch": 2.91, "learning_rate": 8.32e-06, "loss": 0.4309, "step": 210 }, { "epoch": 3.0, "eval_loss": 0.49520817399024963, "eval_runtime": 127.3688, "eval_samples_per_second": 4.177, "eval_steps_per_second": 0.526, "eval_wer": 0.22375779391913608, "step": 216 }, { "epoch": 3.06, "learning_rate": 8.720000000000001e-06, "loss": 0.4357, "step": 220 }, { "epoch": 3.19, "learning_rate": 9.12e-06, "loss": 0.432, "step": 230 }, { "epoch": 3.33, "learning_rate": 9.52e-06, "loss": 0.4387, "step": 240 }, { "epoch": 3.47, "learning_rate": 9.920000000000002e-06, "loss": 0.438, "step": 250 }, { "epoch": 3.61, "learning_rate": 1.0320000000000001e-05, "loss": 0.4194, "step": 260 }, { "epoch": 3.75, "learning_rate": 1.072e-05, "loss": 0.4245, "step": 270 }, { "epoch": 3.89, "learning_rate": 1.1120000000000002e-05, "loss": 0.4193, "step": 280 }, { "epoch": 4.0, "eval_loss": 0.4864279329776764, "eval_runtime": 127.4979, "eval_samples_per_second": 4.173, "eval_steps_per_second": 0.525, "eval_wer": 0.2190010927556727, "step": 288 }, { "epoch": 4.03, "learning_rate": 1.152e-05, "loss": 0.4478, "step": 290 }, { "epoch": 4.17, "learning_rate": 1.1920000000000001e-05, "loss": 0.4324, "step": 300 }, { "epoch": 4.3, "learning_rate": 1.232e-05, "loss": 0.4208, "step": 310 }, { "epoch": 4.44, "learning_rate": 1.2720000000000002e-05, "loss": 0.4339, "step": 320 }, { "epoch": 4.58, "learning_rate": 1.3120000000000001e-05, "loss": 0.4422, "step": 330 }, { "epoch": 4.72, "learning_rate": 1.3520000000000003e-05, "loss": 0.4412, "step": 340 }, { "epoch": 4.86, "learning_rate": 1.392e-05, "loss": 0.4305, "step": 350 }, { "epoch": 5.0, "learning_rate": 1.432e-05, "loss": 0.427, "step": 360 }, { "epoch": 5.0, "eval_loss": 0.507136881351471, "eval_runtime": 127.3672, "eval_samples_per_second": 4.177, "eval_steps_per_second": 0.526, "eval_wer": 0.22613614450086778, "step": 360 }, { "epoch": 5.14, "learning_rate": 1.4720000000000001e-05, "loss": 0.4332, "step": 370 }, { "epoch": 5.28, "learning_rate": 1.5120000000000001e-05, "loss": 0.4485, "step": 380 }, { "epoch": 5.42, "learning_rate": 1.552e-05, "loss": 0.4256, "step": 390 }, { "epoch": 5.55, "learning_rate": 1.5920000000000003e-05, "loss": 0.4255, "step": 400 }, { "epoch": 5.69, "learning_rate": 1.632e-05, "loss": 0.4352, "step": 410 }, { "epoch": 5.83, "learning_rate": 1.672e-05, "loss": 0.4187, "step": 420 }, { "epoch": 5.97, "learning_rate": 1.7120000000000002e-05, "loss": 0.4342, "step": 430 }, { "epoch": 6.0, "eval_loss": 0.49319037795066833, "eval_runtime": 127.3163, "eval_samples_per_second": 4.179, "eval_steps_per_second": 0.526, "eval_wer": 0.22176512181011762, "step": 432 }, { "epoch": 6.11, "learning_rate": 1.752e-05, "loss": 0.4477, "step": 440 }, { "epoch": 6.25, "learning_rate": 1.792e-05, "loss": 0.4199, "step": 450 }, { "epoch": 6.39, "learning_rate": 1.832e-05, "loss": 0.4322, "step": 460 }, { "epoch": 6.53, "learning_rate": 1.8720000000000004e-05, "loss": 0.4447, "step": 470 }, { "epoch": 6.66, "learning_rate": 1.912e-05, "loss": 0.4479, "step": 480 }, { "epoch": 6.8, "learning_rate": 1.9520000000000003e-05, "loss": 0.425, "step": 490 }, { "epoch": 6.94, "learning_rate": 1.9920000000000002e-05, "loss": 0.4205, "step": 500 }, { "epoch": 7.0, "eval_loss": 0.4868512749671936, "eval_runtime": 126.9437, "eval_samples_per_second": 4.191, "eval_steps_per_second": 0.528, "eval_wer": 0.22221508002828308, "step": 504 }, { "epoch": 7.08, "learning_rate": 2.0320000000000002e-05, "loss": 0.4458, "step": 510 }, { "epoch": 7.22, "learning_rate": 2.072e-05, "loss": 0.4351, "step": 520 }, { "epoch": 7.36, "learning_rate": 2.112e-05, "loss": 0.4306, "step": 530 }, { "epoch": 7.5, "learning_rate": 2.1520000000000004e-05, "loss": 0.4314, "step": 540 }, { "epoch": 7.64, "learning_rate": 2.1920000000000004e-05, "loss": 0.4208, "step": 550 }, { "epoch": 7.78, "learning_rate": 2.2280000000000004e-05, "loss": 0.4307, "step": 560 }, { "epoch": 7.91, "learning_rate": 2.268e-05, "loss": 0.437, "step": 570 }, { "epoch": 8.0, "eval_loss": 0.512541651725769, "eval_runtime": 127.6656, "eval_samples_per_second": 4.167, "eval_steps_per_second": 0.525, "eval_wer": 0.2224079192646397, "step": 576 }, { "epoch": 8.06, "learning_rate": 2.308e-05, "loss": 0.4428, "step": 580 }, { "epoch": 8.19, "learning_rate": 2.3480000000000002e-05, "loss": 0.441, "step": 590 }, { "epoch": 8.33, "learning_rate": 2.3880000000000002e-05, "loss": 0.4341, "step": 600 }, { "epoch": 8.47, "learning_rate": 2.428e-05, "loss": 0.4392, "step": 610 }, { "epoch": 8.61, "learning_rate": 2.468e-05, "loss": 0.4416, "step": 620 }, { "epoch": 8.75, "learning_rate": 2.508e-05, "loss": 0.4507, "step": 630 }, { "epoch": 8.89, "learning_rate": 2.5480000000000003e-05, "loss": 0.4316, "step": 640 }, { "epoch": 9.0, "eval_loss": 0.5095347762107849, "eval_runtime": 127.9451, "eval_samples_per_second": 4.158, "eval_steps_per_second": 0.524, "eval_wer": 0.22845021533714727, "step": 648 }, { "epoch": 9.03, "learning_rate": 2.5880000000000003e-05, "loss": 0.453, "step": 650 }, { "epoch": 9.17, "learning_rate": 2.6280000000000002e-05, "loss": 0.4399, "step": 660 }, { "epoch": 9.3, "learning_rate": 2.6680000000000002e-05, "loss": 0.4437, "step": 670 }, { "epoch": 9.44, "learning_rate": 2.7080000000000005e-05, "loss": 0.4527, "step": 680 }, { "epoch": 9.58, "learning_rate": 2.7480000000000005e-05, "loss": 0.4483, "step": 690 }, { "epoch": 9.72, "learning_rate": 2.788e-05, "loss": 0.4359, "step": 700 }, { "epoch": 9.86, "learning_rate": 2.828e-05, "loss": 0.4293, "step": 710 }, { "epoch": 10.0, "learning_rate": 2.868e-05, "loss": 0.4383, "step": 720 }, { "epoch": 10.0, "eval_loss": 0.5397593379020691, "eval_runtime": 128.2201, "eval_samples_per_second": 4.149, "eval_steps_per_second": 0.523, "eval_wer": 0.23462107090055923, "step": 720 }, { "epoch": 10.14, "learning_rate": 2.9080000000000003e-05, "loss": 0.4383, "step": 730 }, { "epoch": 10.28, "learning_rate": 2.9480000000000002e-05, "loss": 0.4407, "step": 740 }, { "epoch": 10.42, "learning_rate": 2.9880000000000002e-05, "loss": 0.4525, "step": 750 }, { "epoch": 10.55, "learning_rate": 3.028e-05, "loss": 0.4551, "step": 760 }, { "epoch": 10.69, "learning_rate": 3.0680000000000004e-05, "loss": 0.4531, "step": 770 }, { "epoch": 10.83, "learning_rate": 3.108e-05, "loss": 0.4346, "step": 780 }, { "epoch": 10.97, "learning_rate": 3.1480000000000004e-05, "loss": 0.4431, "step": 790 }, { "epoch": 11.0, "eval_loss": 0.5176960825920105, "eval_runtime": 127.266, "eval_samples_per_second": 4.18, "eval_steps_per_second": 0.526, "eval_wer": 0.22594330526451115, "step": 792 }, { "epoch": 11.11, "learning_rate": 3.1880000000000006e-05, "loss": 0.4501, "step": 800 }, { "epoch": 11.25, "learning_rate": 3.228e-05, "loss": 0.466, "step": 810 }, { "epoch": 11.39, "learning_rate": 3.268e-05, "loss": 0.4569, "step": 820 }, { "epoch": 11.53, "learning_rate": 3.308e-05, "loss": 0.4703, "step": 830 }, { "epoch": 11.66, "learning_rate": 3.3480000000000005e-05, "loss": 0.4497, "step": 840 }, { "epoch": 11.8, "learning_rate": 3.388e-05, "loss": 0.4574, "step": 850 }, { "epoch": 11.94, "learning_rate": 3.4280000000000004e-05, "loss": 0.4555, "step": 860 }, { "epoch": 12.0, "eval_loss": 0.5246450304985046, "eval_runtime": 126.9882, "eval_samples_per_second": 4.189, "eval_steps_per_second": 0.528, "eval_wer": 0.23346403548241948, "step": 864 }, { "epoch": 12.08, "learning_rate": 3.468e-05, "loss": 0.4411, "step": 870 }, { "epoch": 12.22, "learning_rate": 3.508e-05, "loss": 0.4268, "step": 880 }, { "epoch": 12.36, "learning_rate": 3.5480000000000006e-05, "loss": 0.4414, "step": 890 }, { "epoch": 12.5, "learning_rate": 3.588e-05, "loss": 0.4409, "step": 900 }, { "epoch": 12.64, "learning_rate": 3.6280000000000005e-05, "loss": 0.4217, "step": 910 }, { "epoch": 12.78, "learning_rate": 3.668e-05, "loss": 0.4426, "step": 920 }, { "epoch": 12.91, "learning_rate": 3.7080000000000004e-05, "loss": 0.4488, "step": 930 }, { "epoch": 13.0, "eval_loss": 0.5247890949249268, "eval_runtime": 127.5658, "eval_samples_per_second": 4.17, "eval_steps_per_second": 0.525, "eval_wer": 0.22767885839172078, "step": 936 }, { "epoch": 13.06, "learning_rate": 3.748000000000001e-05, "loss": 0.4485, "step": 940 }, { "epoch": 13.19, "learning_rate": 3.788e-05, "loss": 0.4315, "step": 950 }, { "epoch": 13.33, "learning_rate": 3.828e-05, "loss": 0.4605, "step": 960 }, { "epoch": 13.47, "learning_rate": 3.868e-05, "loss": 0.4501, "step": 970 }, { "epoch": 13.61, "learning_rate": 3.9080000000000005e-05, "loss": 0.4408, "step": 980 }, { "epoch": 13.75, "learning_rate": 3.948e-05, "loss": 0.4549, "step": 990 }, { "epoch": 13.89, "learning_rate": 3.9880000000000004e-05, "loss": 0.4449, "step": 1000 }, { "epoch": 14.0, "eval_loss": 0.5196382999420166, "eval_runtime": 127.3274, "eval_samples_per_second": 4.178, "eval_steps_per_second": 0.526, "eval_wer": 0.2254290673008935, "step": 1008 }, { "epoch": 14.03, "learning_rate": 3.9992000000000006e-05, "loss": 0.4589, "step": 1010 }, { "epoch": 14.17, "learning_rate": 3.998057142857143e-05, "loss": 0.4418, "step": 1020 }, { "epoch": 14.3, "learning_rate": 3.996914285714286e-05, "loss": 0.4525, "step": 1030 }, { "epoch": 14.44, "learning_rate": 3.9957714285714286e-05, "loss": 0.4601, "step": 1040 }, { "epoch": 14.58, "learning_rate": 3.994628571428572e-05, "loss": 0.4687, "step": 1050 }, { "epoch": 14.72, "learning_rate": 3.9934857142857147e-05, "loss": 0.4569, "step": 1060 }, { "epoch": 14.86, "learning_rate": 3.992342857142857e-05, "loss": 0.4359, "step": 1070 }, { "epoch": 15.0, "learning_rate": 3.991200000000001e-05, "loss": 0.4629, "step": 1080 }, { "epoch": 15.0, "eval_loss": 0.49327969551086426, "eval_runtime": 127.4507, "eval_samples_per_second": 4.174, "eval_steps_per_second": 0.526, "eval_wer": 0.2296715305007392, "step": 1080 }, { "epoch": 15.14, "learning_rate": 3.9900571428571434e-05, "loss": 0.4479, "step": 1090 }, { "epoch": 15.28, "learning_rate": 3.988914285714286e-05, "loss": 0.4615, "step": 1100 }, { "epoch": 15.42, "learning_rate": 3.987771428571429e-05, "loss": 0.4401, "step": 1110 }, { "epoch": 15.55, "learning_rate": 3.986628571428572e-05, "loss": 0.4426, "step": 1120 }, { "epoch": 15.69, "learning_rate": 3.985485714285715e-05, "loss": 0.4352, "step": 1130 }, { "epoch": 15.83, "learning_rate": 3.9843428571428574e-05, "loss": 0.4537, "step": 1140 }, { "epoch": 15.97, "learning_rate": 3.9832e-05, "loss": 0.4565, "step": 1150 }, { "epoch": 16.0, "eval_loss": 0.5468793511390686, "eval_runtime": 127.2416, "eval_samples_per_second": 4.181, "eval_steps_per_second": 0.527, "eval_wer": 0.2296715305007392, "step": 1152 }, { "epoch": 16.11, "learning_rate": 3.982057142857143e-05, "loss": 0.4506, "step": 1160 }, { "epoch": 16.25, "learning_rate": 3.980914285714286e-05, "loss": 0.4614, "step": 1170 }, { "epoch": 16.39, "learning_rate": 3.979771428571429e-05, "loss": 0.4474, "step": 1180 }, { "epoch": 16.53, "learning_rate": 3.978628571428572e-05, "loss": 0.4638, "step": 1190 }, { "epoch": 16.66, "learning_rate": 3.977485714285715e-05, "loss": 0.4641, "step": 1200 }, { "epoch": 16.8, "learning_rate": 3.9763428571428575e-05, "loss": 0.4379, "step": 1210 }, { "epoch": 16.94, "learning_rate": 3.9752e-05, "loss": 0.4396, "step": 1220 }, { "epoch": 17.0, "eval_loss": 0.5355833172798157, "eval_runtime": 127.2444, "eval_samples_per_second": 4.181, "eval_steps_per_second": 0.527, "eval_wer": 0.2439416339911294, "step": 1224 }, { "epoch": 17.08, "learning_rate": 3.974057142857143e-05, "loss": 0.4616, "step": 1230 }, { "epoch": 17.22, "learning_rate": 3.972914285714286e-05, "loss": 0.4272, "step": 1240 }, { "epoch": 17.36, "learning_rate": 3.971771428571429e-05, "loss": 0.4344, "step": 1250 }, { "epoch": 17.5, "learning_rate": 3.970628571428572e-05, "loss": 0.4502, "step": 1260 }, { "epoch": 17.64, "learning_rate": 3.969485714285715e-05, "loss": 0.4447, "step": 1270 }, { "epoch": 17.78, "learning_rate": 3.9683428571428576e-05, "loss": 0.4602, "step": 1280 }, { "epoch": 17.91, "learning_rate": 3.9672e-05, "loss": 0.4452, "step": 1290 }, { "epoch": 18.0, "eval_loss": 0.5297891497612, "eval_runtime": 127.1434, "eval_samples_per_second": 4.184, "eval_steps_per_second": 0.527, "eval_wer": 0.25101240599087227, "step": 1296 }, { "epoch": 18.06, "learning_rate": 3.966057142857143e-05, "loss": 0.4803, "step": 1300 }, { "epoch": 18.19, "learning_rate": 3.964914285714286e-05, "loss": 0.4774, "step": 1310 }, { "epoch": 18.33, "learning_rate": 3.963771428571429e-05, "loss": 0.4709, "step": 1320 }, { "epoch": 18.47, "learning_rate": 3.9626285714285716e-05, "loss": 0.4609, "step": 1330 }, { "epoch": 18.61, "learning_rate": 3.961485714285714e-05, "loss": 0.4762, "step": 1340 }, { "epoch": 18.75, "learning_rate": 3.960342857142857e-05, "loss": 0.4404, "step": 1350 }, { "epoch": 18.89, "learning_rate": 3.9592e-05, "loss": 0.4449, "step": 1360 }, { "epoch": 19.0, "eval_loss": 0.5024343132972717, "eval_runtime": 127.2936, "eval_samples_per_second": 4.179, "eval_steps_per_second": 0.526, "eval_wer": 0.22909301279166935, "step": 1368 }, { "epoch": 19.03, "learning_rate": 3.958057142857143e-05, "loss": 0.4584, "step": 1370 }, { "epoch": 19.17, "learning_rate": 3.956914285714286e-05, "loss": 0.444, "step": 1380 }, { "epoch": 19.3, "learning_rate": 3.955771428571429e-05, "loss": 0.4526, "step": 1390 }, { "epoch": 19.44, "learning_rate": 3.954628571428572e-05, "loss": 0.4576, "step": 1400 }, { "epoch": 19.58, "learning_rate": 3.9534857142857144e-05, "loss": 0.4584, "step": 1410 }, { "epoch": 19.72, "learning_rate": 3.952342857142857e-05, "loss": 0.4564, "step": 1420 }, { "epoch": 19.86, "learning_rate": 3.9512000000000004e-05, "loss": 0.4498, "step": 1430 }, { "epoch": 20.0, "learning_rate": 3.950057142857143e-05, "loss": 0.4437, "step": 1440 }, { "epoch": 20.0, "eval_loss": 0.5288242101669312, "eval_runtime": 127.6972, "eval_samples_per_second": 4.166, "eval_steps_per_second": 0.525, "eval_wer": 0.23738509995500418, "step": 1440 }, { "epoch": 20.14, "learning_rate": 3.9489142857142864e-05, "loss": 0.4504, "step": 1450 }, { "epoch": 20.28, "learning_rate": 3.947771428571429e-05, "loss": 0.4461, "step": 1460 }, { "epoch": 20.42, "learning_rate": 3.946628571428572e-05, "loss": 0.4425, "step": 1470 }, { "epoch": 20.55, "learning_rate": 3.9454857142857144e-05, "loss": 0.4531, "step": 1480 }, { "epoch": 20.69, "learning_rate": 3.944342857142857e-05, "loss": 0.4549, "step": 1490 }, { "epoch": 20.83, "learning_rate": 3.9432000000000005e-05, "loss": 0.4677, "step": 1500 }, { "epoch": 20.97, "learning_rate": 3.942057142857143e-05, "loss": 0.4572, "step": 1510 }, { "epoch": 21.0, "eval_loss": 0.49535703659057617, "eval_runtime": 128.3903, "eval_samples_per_second": 4.144, "eval_steps_per_second": 0.522, "eval_wer": 0.2343639519187504, "step": 1512 }, { "epoch": 21.11, "learning_rate": 3.940914285714286e-05, "loss": 0.4591, "step": 1520 }, { "epoch": 21.25, "learning_rate": 3.9397714285714285e-05, "loss": 0.4624, "step": 1530 }, { "epoch": 21.39, "learning_rate": 3.938628571428572e-05, "loss": 0.4563, "step": 1540 }, { "epoch": 21.53, "learning_rate": 3.9374857142857145e-05, "loss": 0.4526, "step": 1550 }, { "epoch": 21.66, "learning_rate": 3.936342857142857e-05, "loss": 0.4378, "step": 1560 }, { "epoch": 21.8, "learning_rate": 3.9352000000000005e-05, "loss": 0.4484, "step": 1570 }, { "epoch": 21.94, "learning_rate": 3.934057142857143e-05, "loss": 0.4633, "step": 1580 }, { "epoch": 22.0, "eval_loss": 0.5043376088142395, "eval_runtime": 128.3677, "eval_samples_per_second": 4.144, "eval_steps_per_second": 0.522, "eval_wer": 0.23609950504596003, "step": 1584 }, { "epoch": 22.08, "learning_rate": 3.932914285714286e-05, "loss": 0.4597, "step": 1590 }, { "epoch": 22.22, "learning_rate": 3.9317714285714286e-05, "loss": 0.4448, "step": 1600 }, { "epoch": 22.36, "learning_rate": 3.930628571428572e-05, "loss": 0.4483, "step": 1610 }, { "epoch": 22.5, "learning_rate": 3.9294857142857146e-05, "loss": 0.4585, "step": 1620 }, { "epoch": 22.64, "learning_rate": 3.928342857142858e-05, "loss": 0.4663, "step": 1630 }, { "epoch": 22.78, "learning_rate": 3.9272000000000006e-05, "loss": 0.4533, "step": 1640 }, { "epoch": 22.91, "learning_rate": 3.926057142857143e-05, "loss": 0.4486, "step": 1650 }, { "epoch": 23.0, "eval_loss": 0.5075653791427612, "eval_runtime": 128.3857, "eval_samples_per_second": 4.144, "eval_steps_per_second": 0.522, "eval_wer": 0.22497910908272803, "step": 1656 }, { "epoch": 23.06, "learning_rate": 3.924914285714286e-05, "loss": 0.4603, "step": 1660 }, { "epoch": 23.19, "learning_rate": 3.9237714285714286e-05, "loss": 0.4646, "step": 1670 }, { "epoch": 23.33, "learning_rate": 3.922628571428572e-05, "loss": 0.4592, "step": 1680 }, { "epoch": 23.47, "learning_rate": 3.921485714285715e-05, "loss": 0.4611, "step": 1690 }, { "epoch": 23.61, "learning_rate": 3.9203428571428573e-05, "loss": 0.4528, "step": 1700 }, { "epoch": 23.75, "learning_rate": 3.9192e-05, "loss": 0.4407, "step": 1710 }, { "epoch": 23.89, "learning_rate": 3.918057142857143e-05, "loss": 0.4386, "step": 1720 }, { "epoch": 24.0, "eval_loss": 0.5563700795173645, "eval_runtime": 128.0193, "eval_samples_per_second": 4.156, "eval_steps_per_second": 0.523, "eval_wer": 0.24921257311821046, "step": 1728 }, { "epoch": 24.03, "learning_rate": 3.916914285714286e-05, "loss": 0.47, "step": 1730 }, { "epoch": 24.17, "learning_rate": 3.915771428571429e-05, "loss": 0.4652, "step": 1740 }, { "epoch": 24.3, "learning_rate": 3.914628571428572e-05, "loss": 0.4609, "step": 1750 }, { "epoch": 24.44, "learning_rate": 3.913485714285715e-05, "loss": 0.4624, "step": 1760 }, { "epoch": 24.58, "learning_rate": 3.9123428571428574e-05, "loss": 0.4694, "step": 1770 }, { "epoch": 24.72, "learning_rate": 3.9112e-05, "loss": 0.4616, "step": 1780 }, { "epoch": 24.86, "learning_rate": 3.910057142857143e-05, "loss": 0.4535, "step": 1790 }, { "epoch": 25.0, "learning_rate": 3.908914285714286e-05, "loss": 0.4478, "step": 1800 }, { "epoch": 25.0, "eval_loss": 0.5298568606376648, "eval_runtime": 128.9105, "eval_samples_per_second": 4.127, "eval_steps_per_second": 0.52, "eval_wer": 0.22356495468277945, "step": 1800 }, { "epoch": 25.14, "learning_rate": 3.907771428571429e-05, "loss": 0.4638, "step": 1810 }, { "epoch": 25.28, "learning_rate": 3.906628571428572e-05, "loss": 0.4467, "step": 1820 }, { "epoch": 25.42, "learning_rate": 3.905485714285715e-05, "loss": 0.4605, "step": 1830 }, { "epoch": 25.55, "learning_rate": 3.9043428571428575e-05, "loss": 0.4698, "step": 1840 }, { "epoch": 25.69, "learning_rate": 3.9032e-05, "loss": 0.4768, "step": 1850 }, { "epoch": 25.83, "learning_rate": 3.902057142857143e-05, "loss": 0.4714, "step": 1860 }, { "epoch": 25.97, "learning_rate": 3.900914285714286e-05, "loss": 0.4654, "step": 1870 }, { "epoch": 26.0, "eval_loss": 0.5076239109039307, "eval_runtime": 127.8838, "eval_samples_per_second": 4.16, "eval_steps_per_second": 0.524, "eval_wer": 0.22761457864626855, "step": 1872 }, { "epoch": 26.11, "learning_rate": 3.899771428571429e-05, "loss": 0.475, "step": 1880 }, { "epoch": 26.25, "learning_rate": 3.8986285714285715e-05, "loss": 0.4616, "step": 1890 }, { "epoch": 26.39, "learning_rate": 3.897485714285714e-05, "loss": 0.4585, "step": 1900 }, { "epoch": 26.53, "learning_rate": 3.8963428571428576e-05, "loss": 0.4592, "step": 1910 }, { "epoch": 26.66, "learning_rate": 3.8952e-05, "loss": 0.4483, "step": 1920 }, { "epoch": 26.8, "learning_rate": 3.894057142857143e-05, "loss": 0.4669, "step": 1930 }, { "epoch": 26.94, "learning_rate": 3.892914285714286e-05, "loss": 0.453, "step": 1940 }, { "epoch": 27.0, "eval_loss": 0.56663978099823, "eval_runtime": 129.7369, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.23950633155492704, "step": 1944 }, { "epoch": 27.08, "learning_rate": 3.891771428571429e-05, "loss": 0.5038, "step": 1950 }, { "epoch": 27.22, "learning_rate": 3.8906285714285716e-05, "loss": 0.4487, "step": 1960 }, { "epoch": 27.36, "learning_rate": 3.889485714285714e-05, "loss": 0.4513, "step": 1970 }, { "epoch": 27.5, "learning_rate": 3.8883428571428576e-05, "loss": 0.4515, "step": 1980 }, { "epoch": 27.64, "learning_rate": 3.8872e-05, "loss": 0.4452, "step": 1990 }, { "epoch": 27.78, "learning_rate": 3.886057142857143e-05, "loss": 0.4526, "step": 2000 }, { "epoch": 27.91, "learning_rate": 3.8849142857142863e-05, "loss": 0.4474, "step": 2010 }, { "epoch": 28.0, "eval_loss": 0.502606987953186, "eval_runtime": 129.6242, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.2253647875554413, "step": 2016 }, { "epoch": 28.06, "learning_rate": 3.883771428571429e-05, "loss": 0.4631, "step": 2020 }, { "epoch": 28.19, "learning_rate": 3.882628571428572e-05, "loss": 0.4487, "step": 2030 }, { "epoch": 28.33, "learning_rate": 3.8814857142857144e-05, "loss": 0.45, "step": 2040 }, { "epoch": 28.47, "learning_rate": 3.880342857142858e-05, "loss": 0.4364, "step": 2050 }, { "epoch": 28.61, "learning_rate": 3.8792000000000004e-05, "loss": 0.4483, "step": 2060 }, { "epoch": 28.75, "learning_rate": 3.878057142857143e-05, "loss": 0.4562, "step": 2070 }, { "epoch": 28.89, "learning_rate": 3.876914285714286e-05, "loss": 0.4465, "step": 2080 }, { "epoch": 29.0, "eval_loss": 0.5216416120529175, "eval_runtime": 129.3904, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.2351995886096291, "step": 2088 }, { "epoch": 29.03, "learning_rate": 3.8757714285714284e-05, "loss": 0.4654, "step": 2090 }, { "epoch": 29.17, "learning_rate": 3.874628571428572e-05, "loss": 0.4644, "step": 2100 }, { "epoch": 29.3, "learning_rate": 3.8734857142857144e-05, "loss": 0.4585, "step": 2110 }, { "epoch": 29.44, "learning_rate": 3.872342857142858e-05, "loss": 0.4599, "step": 2120 }, { "epoch": 29.58, "learning_rate": 3.8712000000000005e-05, "loss": 0.4555, "step": 2130 }, { "epoch": 29.72, "learning_rate": 3.870057142857143e-05, "loss": 0.4592, "step": 2140 }, { "epoch": 29.86, "learning_rate": 3.868914285714286e-05, "loss": 0.4662, "step": 2150 }, { "epoch": 30.0, "learning_rate": 3.8677714285714285e-05, "loss": 0.4689, "step": 2160 }, { "epoch": 30.0, "eval_loss": 0.529291570186615, "eval_runtime": 129.3401, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.23699942148229092, "step": 2160 }, { "epoch": 30.14, "learning_rate": 3.866628571428572e-05, "loss": 0.4631, "step": 2170 }, { "epoch": 30.28, "learning_rate": 3.8654857142857145e-05, "loss": 0.4677, "step": 2180 }, { "epoch": 30.42, "learning_rate": 3.864342857142858e-05, "loss": 0.45, "step": 2190 }, { "epoch": 30.55, "learning_rate": 3.8632000000000006e-05, "loss": 0.473, "step": 2200 }, { "epoch": 30.69, "learning_rate": 3.862057142857143e-05, "loss": 0.4616, "step": 2210 }, { "epoch": 30.83, "learning_rate": 3.860914285714286e-05, "loss": 0.4584, "step": 2220 }, { "epoch": 30.97, "learning_rate": 3.8597714285714286e-05, "loss": 0.4467, "step": 2230 }, { "epoch": 31.0, "eval_loss": 0.48561057448387146, "eval_runtime": 129.1726, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.2302500482098091, "step": 2232 }, { "epoch": 31.11, "learning_rate": 3.858628571428572e-05, "loss": 0.4621, "step": 2240 }, { "epoch": 31.25, "learning_rate": 3.8574857142857146e-05, "loss": 0.4446, "step": 2250 }, { "epoch": 31.39, "learning_rate": 3.856342857142857e-05, "loss": 0.4312, "step": 2260 }, { "epoch": 31.53, "learning_rate": 3.8552e-05, "loss": 0.4455, "step": 2270 }, { "epoch": 31.66, "learning_rate": 3.854057142857143e-05, "loss": 0.4433, "step": 2280 }, { "epoch": 31.8, "learning_rate": 3.852914285714286e-05, "loss": 0.4588, "step": 2290 }, { "epoch": 31.94, "learning_rate": 3.8517714285714287e-05, "loss": 0.4379, "step": 2300 }, { "epoch": 32.0, "eval_loss": 0.5088739395141602, "eval_runtime": 128.7265, "eval_samples_per_second": 4.133, "eval_steps_per_second": 0.52, "eval_wer": 0.2239506331554927, "step": 2304 }, { "epoch": 32.08, "learning_rate": 3.850628571428572e-05, "loss": 0.4728, "step": 2310 }, { "epoch": 32.22, "learning_rate": 3.849485714285715e-05, "loss": 0.4481, "step": 2320 }, { "epoch": 32.36, "learning_rate": 3.8483428571428574e-05, "loss": 0.4674, "step": 2330 }, { "epoch": 32.5, "learning_rate": 3.8472e-05, "loss": 0.4657, "step": 2340 }, { "epoch": 32.64, "learning_rate": 3.8460571428571434e-05, "loss": 0.4367, "step": 2350 }, { "epoch": 32.78, "learning_rate": 3.844914285714286e-05, "loss": 0.4476, "step": 2360 }, { "epoch": 32.91, "learning_rate": 3.843771428571429e-05, "loss": 0.4302, "step": 2370 }, { "epoch": 33.0, "eval_loss": 0.4957752525806427, "eval_runtime": 129.2784, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.21732981937391527, "step": 2376 }, { "epoch": 33.06, "learning_rate": 3.842628571428572e-05, "loss": 0.4657, "step": 2380 }, { "epoch": 33.19, "learning_rate": 3.841485714285715e-05, "loss": 0.4482, "step": 2390 }, { "epoch": 33.33, "learning_rate": 3.8403428571428574e-05, "loss": 0.4487, "step": 2400 }, { "epoch": 33.47, "learning_rate": 3.8392e-05, "loss": 0.4512, "step": 2410 }, { "epoch": 33.61, "learning_rate": 3.8380571428571435e-05, "loss": 0.4455, "step": 2420 }, { "epoch": 33.75, "learning_rate": 3.836914285714286e-05, "loss": 0.4321, "step": 2430 }, { "epoch": 33.89, "learning_rate": 3.835771428571429e-05, "loss": 0.4417, "step": 2440 }, { "epoch": 34.0, "eval_loss": 0.5391955971717834, "eval_runtime": 128.1528, "eval_samples_per_second": 4.151, "eval_steps_per_second": 0.523, "eval_wer": 0.2336568747187761, "step": 2448 }, { "epoch": 34.03, "learning_rate": 3.8346285714285715e-05, "loss": 0.4546, "step": 2450 }, { "epoch": 34.17, "learning_rate": 3.833485714285714e-05, "loss": 0.4353, "step": 2460 }, { "epoch": 34.3, "learning_rate": 3.8323428571428575e-05, "loss": 0.4393, "step": 2470 }, { "epoch": 34.44, "learning_rate": 3.8312e-05, "loss": 0.4537, "step": 2480 }, { "epoch": 34.58, "learning_rate": 3.8300571428571435e-05, "loss": 0.4481, "step": 2490 }, { "epoch": 34.72, "learning_rate": 3.828914285714286e-05, "loss": 0.4619, "step": 2500 }, { "epoch": 34.86, "learning_rate": 3.827771428571429e-05, "loss": 0.4531, "step": 2510 }, { "epoch": 35.0, "learning_rate": 3.8266285714285716e-05, "loss": 0.4458, "step": 2520 }, { "epoch": 35.0, "eval_loss": 0.5228686928749084, "eval_runtime": 128.7042, "eval_samples_per_second": 4.134, "eval_steps_per_second": 0.521, "eval_wer": 0.2415632834093977, "step": 2520 }, { "epoch": 35.14, "learning_rate": 3.825485714285714e-05, "loss": 0.4548, "step": 2530 }, { "epoch": 35.28, "learning_rate": 3.8243428571428576e-05, "loss": 0.4496, "step": 2540 }, { "epoch": 35.42, "learning_rate": 3.8232e-05, "loss": 0.4419, "step": 2550 }, { "epoch": 35.55, "learning_rate": 3.8220571428571436e-05, "loss": 0.4573, "step": 2560 }, { "epoch": 35.69, "learning_rate": 3.820914285714286e-05, "loss": 0.4487, "step": 2570 }, { "epoch": 35.83, "learning_rate": 3.819771428571429e-05, "loss": 0.4492, "step": 2580 }, { "epoch": 35.97, "learning_rate": 3.8187428571428575e-05, "loss": 0.4415, "step": 2590 }, { "epoch": 36.0, "eval_loss": 0.5280052423477173, "eval_runtime": 128.1421, "eval_samples_per_second": 4.152, "eval_steps_per_second": 0.523, "eval_wer": 0.2344282316642026, "step": 2592 }, { "epoch": 36.11, "learning_rate": 3.8176e-05, "loss": 0.4528, "step": 2600 }, { "epoch": 36.25, "learning_rate": 3.816457142857143e-05, "loss": 0.4421, "step": 2610 }, { "epoch": 36.39, "learning_rate": 3.815314285714286e-05, "loss": 0.4358, "step": 2620 }, { "epoch": 36.53, "learning_rate": 3.814171428571429e-05, "loss": 0.4758, "step": 2630 }, { "epoch": 36.66, "learning_rate": 3.8130285714285716e-05, "loss": 0.4542, "step": 2640 }, { "epoch": 36.8, "learning_rate": 3.811885714285715e-05, "loss": 0.4526, "step": 2650 }, { "epoch": 36.94, "learning_rate": 3.8107428571428576e-05, "loss": 0.4621, "step": 2660 }, { "epoch": 37.0, "eval_loss": 0.5361986756324768, "eval_runtime": 128.1497, "eval_samples_per_second": 4.151, "eval_steps_per_second": 0.523, "eval_wer": 0.24593430610014785, "step": 2664 }, { "epoch": 37.08, "learning_rate": 3.8096e-05, "loss": 0.4725, "step": 2670 }, { "epoch": 37.22, "learning_rate": 3.808457142857143e-05, "loss": 0.4678, "step": 2680 }, { "epoch": 37.36, "learning_rate": 3.807314285714286e-05, "loss": 0.4449, "step": 2690 }, { "epoch": 37.5, "learning_rate": 3.806171428571429e-05, "loss": 0.4756, "step": 2700 }, { "epoch": 37.64, "learning_rate": 3.8050285714285716e-05, "loss": 0.4339, "step": 2710 }, { "epoch": 37.78, "learning_rate": 3.803885714285714e-05, "loss": 0.4505, "step": 2720 }, { "epoch": 37.91, "learning_rate": 3.802742857142857e-05, "loss": 0.44, "step": 2730 }, { "epoch": 38.0, "eval_loss": 0.507107138633728, "eval_runtime": 128.4192, "eval_samples_per_second": 4.143, "eval_steps_per_second": 0.522, "eval_wer": 0.22851449508259947, "step": 2736 }, { "epoch": 38.06, "learning_rate": 3.8016e-05, "loss": 0.4586, "step": 2740 }, { "epoch": 38.19, "learning_rate": 3.800457142857143e-05, "loss": 0.458, "step": 2750 }, { "epoch": 38.33, "learning_rate": 3.7993142857142864e-05, "loss": 0.4394, "step": 2760 }, { "epoch": 38.47, "learning_rate": 3.798171428571429e-05, "loss": 0.4579, "step": 2770 }, { "epoch": 38.61, "learning_rate": 3.797028571428572e-05, "loss": 0.4612, "step": 2780 }, { "epoch": 38.75, "learning_rate": 3.7958857142857144e-05, "loss": 0.4686, "step": 2790 }, { "epoch": 38.89, "learning_rate": 3.794742857142857e-05, "loss": 0.4288, "step": 2800 }, { "epoch": 39.0, "eval_loss": 0.5263686776161194, "eval_runtime": 128.3848, "eval_samples_per_second": 4.144, "eval_steps_per_second": 0.522, "eval_wer": 0.23134280388249662, "step": 2808 }, { "epoch": 39.03, "learning_rate": 3.7936000000000004e-05, "loss": 0.4668, "step": 2810 }, { "epoch": 39.17, "learning_rate": 3.792457142857143e-05, "loss": 0.4399, "step": 2820 }, { "epoch": 39.3, "learning_rate": 3.7913142857142864e-05, "loss": 0.4368, "step": 2830 }, { "epoch": 39.44, "learning_rate": 3.790171428571429e-05, "loss": 0.427, "step": 2840 }, { "epoch": 39.58, "learning_rate": 3.789028571428572e-05, "loss": 0.4517, "step": 2850 }, { "epoch": 39.72, "learning_rate": 3.7878857142857145e-05, "loss": 0.4574, "step": 2860 }, { "epoch": 39.86, "learning_rate": 3.786742857142857e-05, "loss": 0.4426, "step": 2870 }, { "epoch": 40.0, "learning_rate": 3.7856000000000005e-05, "loss": 0.4594, "step": 2880 }, { "epoch": 40.0, "eval_loss": 0.5237553119659424, "eval_runtime": 128.8038, "eval_samples_per_second": 4.13, "eval_steps_per_second": 0.52, "eval_wer": 0.23063572668252233, "step": 2880 }, { "epoch": 40.14, "learning_rate": 3.784457142857143e-05, "loss": 0.4559, "step": 2890 }, { "epoch": 40.28, "learning_rate": 3.783314285714286e-05, "loss": 0.431, "step": 2900 }, { "epoch": 40.42, "learning_rate": 3.7821714285714285e-05, "loss": 0.4336, "step": 2910 }, { "epoch": 40.55, "learning_rate": 3.781028571428572e-05, "loss": 0.4329, "step": 2920 }, { "epoch": 40.69, "learning_rate": 3.7798857142857145e-05, "loss": 0.4389, "step": 2930 }, { "epoch": 40.83, "learning_rate": 3.778742857142857e-05, "loss": 0.4484, "step": 2940 }, { "epoch": 40.97, "learning_rate": 3.7776000000000006e-05, "loss": 0.4428, "step": 2950 }, { "epoch": 41.0, "eval_loss": 0.5374780893325806, "eval_runtime": 128.1104, "eval_samples_per_second": 4.153, "eval_steps_per_second": 0.523, "eval_wer": 0.2286430545735039, "step": 2952 }, { "epoch": 41.11, "learning_rate": 3.776457142857143e-05, "loss": 0.4586, "step": 2960 }, { "epoch": 41.25, "learning_rate": 3.775314285714286e-05, "loss": 0.444, "step": 2970 }, { "epoch": 41.39, "learning_rate": 3.7741714285714286e-05, "loss": 0.4371, "step": 2980 }, { "epoch": 41.53, "learning_rate": 3.773028571428572e-05, "loss": 0.4379, "step": 2990 }, { "epoch": 41.66, "learning_rate": 3.7718857142857146e-05, "loss": 0.4524, "step": 3000 }, { "epoch": 41.8, "learning_rate": 3.770742857142857e-05, "loss": 0.4391, "step": 3010 }, { "epoch": 41.94, "learning_rate": 3.7696000000000006e-05, "loss": 0.4233, "step": 3020 }, { "epoch": 42.0, "eval_loss": 0.5214474201202393, "eval_runtime": 128.9328, "eval_samples_per_second": 4.126, "eval_steps_per_second": 0.52, "eval_wer": 0.2254290673008935, "step": 3024 }, { "epoch": 42.08, "learning_rate": 3.768457142857143e-05, "loss": 0.452, "step": 3030 }, { "epoch": 42.22, "learning_rate": 3.767314285714286e-05, "loss": 0.4282, "step": 3040 }, { "epoch": 42.36, "learning_rate": 3.7661714285714287e-05, "loss": 0.4398, "step": 3050 }, { "epoch": 42.5, "learning_rate": 3.765028571428572e-05, "loss": 0.4473, "step": 3060 }, { "epoch": 42.64, "learning_rate": 3.763885714285715e-05, "loss": 0.4193, "step": 3070 }, { "epoch": 42.78, "learning_rate": 3.7627428571428574e-05, "loss": 0.4476, "step": 3080 }, { "epoch": 42.91, "learning_rate": 3.7616e-05, "loss": 0.4462, "step": 3090 }, { "epoch": 43.0, "eval_loss": 0.5145358443260193, "eval_runtime": 128.3093, "eval_samples_per_second": 4.146, "eval_steps_per_second": 0.522, "eval_wer": 0.24503438966381694, "step": 3096 }, { "epoch": 43.06, "learning_rate": 3.760457142857143e-05, "loss": 0.4592, "step": 3100 }, { "epoch": 43.19, "learning_rate": 3.759314285714286e-05, "loss": 0.4391, "step": 3110 }, { "epoch": 43.33, "learning_rate": 3.758171428571429e-05, "loss": 0.43, "step": 3120 }, { "epoch": 43.47, "learning_rate": 3.757028571428572e-05, "loss": 0.4385, "step": 3130 }, { "epoch": 43.61, "learning_rate": 3.755885714285715e-05, "loss": 0.434, "step": 3140 }, { "epoch": 43.75, "learning_rate": 3.7547428571428574e-05, "loss": 0.4309, "step": 3150 }, { "epoch": 43.89, "learning_rate": 3.7536e-05, "loss": 0.4282, "step": 3160 }, { "epoch": 44.0, "eval_loss": 0.5519401431083679, "eval_runtime": 128.7714, "eval_samples_per_second": 4.131, "eval_steps_per_second": 0.52, "eval_wer": 0.2254290673008935, "step": 3168 }, { "epoch": 44.03, "learning_rate": 3.752457142857143e-05, "loss": 0.4476, "step": 3170 }, { "epoch": 44.17, "learning_rate": 3.751314285714286e-05, "loss": 0.4354, "step": 3180 }, { "epoch": 44.3, "learning_rate": 3.750171428571429e-05, "loss": 0.4403, "step": 3190 }, { "epoch": 44.44, "learning_rate": 3.749028571428572e-05, "loss": 0.4318, "step": 3200 }, { "epoch": 44.58, "learning_rate": 3.747885714285715e-05, "loss": 0.423, "step": 3210 }, { "epoch": 44.72, "learning_rate": 3.7467428571428575e-05, "loss": 0.4173, "step": 3220 }, { "epoch": 44.86, "learning_rate": 3.7456e-05, "loss": 0.4331, "step": 3230 }, { "epoch": 45.0, "learning_rate": 3.744457142857143e-05, "loss": 0.454, "step": 3240 }, { "epoch": 45.0, "eval_loss": 0.5401215553283691, "eval_runtime": 128.0775, "eval_samples_per_second": 4.154, "eval_steps_per_second": 0.523, "eval_wer": 0.23815645690043066, "step": 3240 }, { "epoch": 45.14, "learning_rate": 3.743314285714286e-05, "loss": 0.4417, "step": 3250 }, { "epoch": 45.28, "learning_rate": 3.742171428571429e-05, "loss": 0.4359, "step": 3260 }, { "epoch": 45.42, "learning_rate": 3.7410285714285716e-05, "loss": 0.4287, "step": 3270 }, { "epoch": 45.55, "learning_rate": 3.739885714285714e-05, "loss": 0.4482, "step": 3280 }, { "epoch": 45.69, "learning_rate": 3.738742857142857e-05, "loss": 0.442, "step": 3290 }, { "epoch": 45.83, "learning_rate": 3.7376e-05, "loss": 0.4395, "step": 3300 }, { "epoch": 45.97, "learning_rate": 3.736457142857143e-05, "loss": 0.4494, "step": 3310 }, { "epoch": 46.0, "eval_loss": 0.5116974115371704, "eval_runtime": 128.6158, "eval_samples_per_second": 4.136, "eval_steps_per_second": 0.521, "eval_wer": 0.22285787748280517, "step": 3312 }, { "epoch": 46.11, "learning_rate": 3.735314285714286e-05, "loss": 0.456, "step": 3320 }, { "epoch": 46.25, "learning_rate": 3.734171428571429e-05, "loss": 0.4355, "step": 3330 }, { "epoch": 46.39, "learning_rate": 3.7330285714285716e-05, "loss": 0.4302, "step": 3340 }, { "epoch": 46.53, "learning_rate": 3.731885714285714e-05, "loss": 0.4289, "step": 3350 }, { "epoch": 46.66, "learning_rate": 3.730742857142858e-05, "loss": 0.4247, "step": 3360 }, { "epoch": 46.8, "learning_rate": 3.7296000000000003e-05, "loss": 0.4288, "step": 3370 }, { "epoch": 46.94, "learning_rate": 3.728457142857143e-05, "loss": 0.4292, "step": 3380 }, { "epoch": 47.0, "eval_loss": 0.5295329689979553, "eval_runtime": 128.49, "eval_samples_per_second": 4.14, "eval_steps_per_second": 0.521, "eval_wer": 0.2351995886096291, "step": 3384 }, { "epoch": 47.08, "learning_rate": 3.7273142857142864e-05, "loss": 0.4404, "step": 3390 }, { "epoch": 47.22, "learning_rate": 3.726171428571429e-05, "loss": 0.434, "step": 3400 }, { "epoch": 47.36, "learning_rate": 3.725028571428572e-05, "loss": 0.4284, "step": 3410 }, { "epoch": 47.5, "learning_rate": 3.724e-05, "loss": 0.4319, "step": 3420 }, { "epoch": 47.64, "learning_rate": 3.722857142857143e-05, "loss": 0.4261, "step": 3430 }, { "epoch": 47.78, "learning_rate": 3.7217142857142856e-05, "loss": 0.4393, "step": 3440 }, { "epoch": 47.91, "learning_rate": 3.720571428571429e-05, "loss": 0.4321, "step": 3450 }, { "epoch": 48.0, "eval_loss": 0.49526622891426086, "eval_runtime": 128.3376, "eval_samples_per_second": 4.145, "eval_steps_per_second": 0.522, "eval_wer": 0.22992864948254804, "step": 3456 }, { "epoch": 48.06, "learning_rate": 3.7194285714285716e-05, "loss": 0.4502, "step": 3460 }, { "epoch": 48.19, "learning_rate": 3.718285714285715e-05, "loss": 0.4336, "step": 3470 }, { "epoch": 48.33, "learning_rate": 3.717142857142858e-05, "loss": 0.4365, "step": 3480 }, { "epoch": 48.47, "learning_rate": 3.716e-05, "loss": 0.419, "step": 3490 }, { "epoch": 48.61, "learning_rate": 3.714857142857143e-05, "loss": 0.4246, "step": 3500 }, { "epoch": 48.75, "learning_rate": 3.713714285714286e-05, "loss": 0.4388, "step": 3510 }, { "epoch": 48.89, "learning_rate": 3.712571428571429e-05, "loss": 0.4145, "step": 3520 }, { "epoch": 49.0, "eval_loss": 0.5232734680175781, "eval_runtime": 128.3313, "eval_samples_per_second": 4.146, "eval_steps_per_second": 0.522, "eval_wer": 0.2296715305007392, "step": 3528 }, { "epoch": 49.03, "learning_rate": 3.711428571428572e-05, "loss": 0.436, "step": 3530 }, { "epoch": 49.17, "learning_rate": 3.7102857142857144e-05, "loss": 0.4165, "step": 3540 }, { "epoch": 49.3, "learning_rate": 3.709142857142857e-05, "loss": 0.4344, "step": 3550 }, { "epoch": 49.44, "learning_rate": 3.7080000000000004e-05, "loss": 0.4184, "step": 3560 }, { "epoch": 49.58, "learning_rate": 3.706857142857143e-05, "loss": 0.4262, "step": 3570 }, { "epoch": 49.72, "learning_rate": 3.705714285714286e-05, "loss": 0.4295, "step": 3580 }, { "epoch": 49.86, "learning_rate": 3.704571428571429e-05, "loss": 0.4325, "step": 3590 }, { "epoch": 50.0, "learning_rate": 3.703428571428572e-05, "loss": 0.4278, "step": 3600 }, { "epoch": 50.0, "eval_loss": 0.5150754451751709, "eval_runtime": 128.3935, "eval_samples_per_second": 4.144, "eval_steps_per_second": 0.522, "eval_wer": 0.22575046602815452, "step": 3600 }, { "epoch": 50.14, "learning_rate": 3.7022857142857145e-05, "loss": 0.4323, "step": 3610 }, { "epoch": 50.28, "learning_rate": 3.701142857142857e-05, "loss": 0.4265, "step": 3620 }, { "epoch": 50.42, "learning_rate": 3.7000000000000005e-05, "loss": 0.4304, "step": 3630 }, { "epoch": 50.55, "learning_rate": 3.698857142857143e-05, "loss": 0.4436, "step": 3640 }, { "epoch": 50.69, "learning_rate": 3.697714285714286e-05, "loss": 0.4407, "step": 3650 }, { "epoch": 50.83, "learning_rate": 3.696571428571429e-05, "loss": 0.4374, "step": 3660 }, { "epoch": 50.97, "learning_rate": 3.695428571428572e-05, "loss": 0.4395, "step": 3670 }, { "epoch": 51.0, "eval_loss": 0.46595197916030884, "eval_runtime": 128.442, "eval_samples_per_second": 4.142, "eval_steps_per_second": 0.522, "eval_wer": 0.22735745966445972, "step": 3672 }, { "epoch": 51.11, "learning_rate": 3.6942857142857145e-05, "loss": 0.4447, "step": 3680 }, { "epoch": 51.25, "learning_rate": 3.693142857142857e-05, "loss": 0.4272, "step": 3690 }, { "epoch": 51.39, "learning_rate": 3.6920000000000006e-05, "loss": 0.4272, "step": 3700 }, { "epoch": 51.53, "learning_rate": 3.690857142857143e-05, "loss": 0.4384, "step": 3710 }, { "epoch": 51.66, "learning_rate": 3.689714285714286e-05, "loss": 0.4188, "step": 3720 }, { "epoch": 51.8, "learning_rate": 3.6885714285714286e-05, "loss": 0.4299, "step": 3730 }, { "epoch": 51.94, "learning_rate": 3.687428571428571e-05, "loss": 0.4298, "step": 3740 }, { "epoch": 52.0, "eval_loss": 0.508307933807373, "eval_runtime": 128.5789, "eval_samples_per_second": 4.138, "eval_steps_per_second": 0.521, "eval_wer": 0.2409204859548756, "step": 3744 }, { "epoch": 52.08, "learning_rate": 3.6862857142857146e-05, "loss": 0.4531, "step": 3750 }, { "epoch": 52.22, "learning_rate": 3.685142857142857e-05, "loss": 0.4379, "step": 3760 }, { "epoch": 52.36, "learning_rate": 3.6840000000000006e-05, "loss": 0.4403, "step": 3770 }, { "epoch": 52.5, "learning_rate": 3.682857142857143e-05, "loss": 0.4436, "step": 3780 }, { "epoch": 52.64, "learning_rate": 3.681714285714286e-05, "loss": 0.4211, "step": 3790 }, { "epoch": 52.78, "learning_rate": 3.680571428571429e-05, "loss": 0.4327, "step": 3800 }, { "epoch": 52.91, "learning_rate": 3.6794285714285713e-05, "loss": 0.4279, "step": 3810 }, { "epoch": 53.0, "eval_loss": 0.48551836609840393, "eval_runtime": 128.302, "eval_samples_per_second": 4.146, "eval_steps_per_second": 0.522, "eval_wer": 0.22189368130102205, "step": 3816 }, { "epoch": 53.06, "learning_rate": 3.678285714285715e-05, "loss": 0.4371, "step": 3820 }, { "epoch": 53.19, "learning_rate": 3.6771428571428574e-05, "loss": 0.4255, "step": 3830 }, { "epoch": 53.33, "learning_rate": 3.676000000000001e-05, "loss": 0.4446, "step": 3840 }, { "epoch": 53.47, "learning_rate": 3.6748571428571434e-05, "loss": 0.4443, "step": 3850 }, { "epoch": 53.61, "learning_rate": 3.673714285714286e-05, "loss": 0.4316, "step": 3860 }, { "epoch": 53.75, "learning_rate": 3.672571428571429e-05, "loss": 0.4261, "step": 3870 }, { "epoch": 53.89, "learning_rate": 3.6714285714285714e-05, "loss": 0.4164, "step": 3880 }, { "epoch": 54.0, "eval_loss": 0.5073791742324829, "eval_runtime": 128.8064, "eval_samples_per_second": 4.13, "eval_steps_per_second": 0.52, "eval_wer": 0.22671466220993766, "step": 3888 }, { "epoch": 54.03, "learning_rate": 3.670285714285715e-05, "loss": 0.4616, "step": 3890 }, { "epoch": 54.17, "learning_rate": 3.6691428571428574e-05, "loss": 0.4239, "step": 3900 }, { "epoch": 54.3, "learning_rate": 3.668e-05, "loss": 0.4312, "step": 3910 }, { "epoch": 54.44, "learning_rate": 3.666857142857143e-05, "loss": 0.4269, "step": 3920 }, { "epoch": 54.58, "learning_rate": 3.665714285714286e-05, "loss": 0.4269, "step": 3930 }, { "epoch": 54.72, "learning_rate": 3.664571428571429e-05, "loss": 0.4259, "step": 3940 }, { "epoch": 54.86, "learning_rate": 3.6634285714285715e-05, "loss": 0.4427, "step": 3950 }, { "epoch": 55.0, "learning_rate": 3.662285714285715e-05, "loss": 0.4386, "step": 3960 }, { "epoch": 55.0, "eval_loss": 0.5015815496444702, "eval_runtime": 128.598, "eval_samples_per_second": 4.137, "eval_steps_per_second": 0.521, "eval_wer": 0.2240791926463971, "step": 3960 }, { "epoch": 55.14, "learning_rate": 3.6611428571428575e-05, "loss": 0.4195, "step": 3970 }, { "epoch": 55.28, "learning_rate": 3.66e-05, "loss": 0.4422, "step": 3980 }, { "epoch": 55.42, "learning_rate": 3.658857142857143e-05, "loss": 0.4459, "step": 3990 }, { "epoch": 55.55, "learning_rate": 3.657714285714286e-05, "loss": 0.4407, "step": 4000 }, { "epoch": 55.69, "learning_rate": 3.656571428571429e-05, "loss": 0.4388, "step": 4010 }, { "epoch": 55.83, "learning_rate": 3.6554285714285716e-05, "loss": 0.4322, "step": 4020 }, { "epoch": 55.97, "learning_rate": 3.654285714285715e-05, "loss": 0.4497, "step": 4030 }, { "epoch": 56.0, "eval_loss": 0.5378428101539612, "eval_runtime": 128.6754, "eval_samples_per_second": 4.134, "eval_steps_per_second": 0.521, "eval_wer": 0.23050716719161793, "step": 4032 }, { "epoch": 56.11, "learning_rate": 3.6531428571428576e-05, "loss": 0.4336, "step": 4040 }, { "epoch": 56.25, "learning_rate": 3.652e-05, "loss": 0.4231, "step": 4050 }, { "epoch": 56.39, "learning_rate": 3.650857142857143e-05, "loss": 0.4199, "step": 4060 }, { "epoch": 56.53, "learning_rate": 3.649714285714286e-05, "loss": 0.4347, "step": 4070 }, { "epoch": 56.66, "learning_rate": 3.648571428571429e-05, "loss": 0.4214, "step": 4080 }, { "epoch": 56.8, "learning_rate": 3.6474285714285716e-05, "loss": 0.435, "step": 4090 }, { "epoch": 56.94, "learning_rate": 3.646285714285714e-05, "loss": 0.4267, "step": 4100 }, { "epoch": 57.0, "eval_loss": 0.5199487805366516, "eval_runtime": 128.6217, "eval_samples_per_second": 4.136, "eval_steps_per_second": 0.521, "eval_wer": 0.2343639519187504, "step": 4104 }, { "epoch": 57.08, "learning_rate": 3.645142857142857e-05, "loss": 0.4307, "step": 4110 }, { "epoch": 57.22, "learning_rate": 3.6440000000000003e-05, "loss": 0.4334, "step": 4120 }, { "epoch": 57.36, "learning_rate": 3.642857142857143e-05, "loss": 0.4329, "step": 4130 }, { "epoch": 57.5, "learning_rate": 3.6417142857142864e-05, "loss": 0.4403, "step": 4140 }, { "epoch": 57.64, "learning_rate": 3.640571428571429e-05, "loss": 0.421, "step": 4150 }, { "epoch": 57.78, "learning_rate": 3.639428571428572e-05, "loss": 0.4299, "step": 4160 }, { "epoch": 57.91, "learning_rate": 3.6382857142857144e-05, "loss": 0.4083, "step": 4170 }, { "epoch": 58.0, "eval_loss": 0.5134491324424744, "eval_runtime": 128.858, "eval_samples_per_second": 4.129, "eval_steps_per_second": 0.52, "eval_wer": 0.22485054959182363, "step": 4176 }, { "epoch": 58.06, "learning_rate": 3.637142857142857e-05, "loss": 0.4496, "step": 4180 }, { "epoch": 58.19, "learning_rate": 3.6360000000000004e-05, "loss": 0.433, "step": 4190 }, { "epoch": 58.33, "learning_rate": 3.634857142857143e-05, "loss": 0.4354, "step": 4200 }, { "epoch": 58.47, "learning_rate": 3.6337142857142865e-05, "loss": 0.436, "step": 4210 }, { "epoch": 58.61, "learning_rate": 3.632571428571429e-05, "loss": 0.4078, "step": 4220 }, { "epoch": 58.75, "learning_rate": 3.631428571428572e-05, "loss": 0.4462, "step": 4230 }, { "epoch": 58.89, "learning_rate": 3.6302857142857145e-05, "loss": 0.4163, "step": 4240 }, { "epoch": 59.0, "eval_loss": 0.49748191237449646, "eval_runtime": 128.9559, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.52, "eval_wer": 0.23159992286430545, "step": 4248 }, { "epoch": 59.03, "learning_rate": 3.629142857142857e-05, "loss": 0.4314, "step": 4250 }, { "epoch": 59.17, "learning_rate": 3.6280000000000005e-05, "loss": 0.4144, "step": 4260 }, { "epoch": 59.3, "learning_rate": 3.626857142857143e-05, "loss": 0.4294, "step": 4270 }, { "epoch": 59.44, "learning_rate": 3.625714285714286e-05, "loss": 0.4338, "step": 4280 }, { "epoch": 59.58, "learning_rate": 3.6245714285714285e-05, "loss": 0.435, "step": 4290 }, { "epoch": 59.72, "learning_rate": 3.623428571428571e-05, "loss": 0.4444, "step": 4300 }, { "epoch": 59.86, "learning_rate": 3.6222857142857146e-05, "loss": 0.4107, "step": 4310 }, { "epoch": 60.0, "learning_rate": 3.621142857142857e-05, "loss": 0.4271, "step": 4320 }, { "epoch": 60.0, "eval_loss": 0.5298433303833008, "eval_runtime": 128.9128, "eval_samples_per_second": 4.127, "eval_steps_per_second": 0.52, "eval_wer": 0.22909301279166935, "step": 4320 }, { "epoch": 60.14, "learning_rate": 3.6200000000000006e-05, "loss": 0.4352, "step": 4330 }, { "epoch": 60.28, "learning_rate": 3.618857142857143e-05, "loss": 0.4334, "step": 4340 }, { "epoch": 60.42, "learning_rate": 3.617714285714286e-05, "loss": 0.4364, "step": 4350 }, { "epoch": 60.55, "learning_rate": 3.6165714285714286e-05, "loss": 0.4324, "step": 4360 }, { "epoch": 60.69, "learning_rate": 3.615428571428571e-05, "loss": 0.4412, "step": 4370 }, { "epoch": 60.83, "learning_rate": 3.6142857142857146e-05, "loss": 0.4218, "step": 4380 }, { "epoch": 60.97, "learning_rate": 3.613142857142857e-05, "loss": 0.43, "step": 4390 }, { "epoch": 61.0, "eval_loss": 0.4991164207458496, "eval_runtime": 128.4261, "eval_samples_per_second": 4.142, "eval_steps_per_second": 0.522, "eval_wer": 0.22890017355531272, "step": 4392 }, { "epoch": 61.11, "learning_rate": 3.6120000000000007e-05, "loss": 0.4478, "step": 4400 }, { "epoch": 61.25, "learning_rate": 3.610857142857143e-05, "loss": 0.4588, "step": 4410 }, { "epoch": 61.39, "learning_rate": 3.609714285714286e-05, "loss": 0.4465, "step": 4420 }, { "epoch": 61.53, "learning_rate": 3.608571428571429e-05, "loss": 0.4377, "step": 4430 }, { "epoch": 61.66, "learning_rate": 3.6074285714285714e-05, "loss": 0.4359, "step": 4440 }, { "epoch": 61.8, "learning_rate": 3.606285714285715e-05, "loss": 0.4572, "step": 4450 }, { "epoch": 61.94, "learning_rate": 3.6051428571428574e-05, "loss": 0.437, "step": 4460 }, { "epoch": 62.0, "eval_loss": 0.5154334902763367, "eval_runtime": 128.6615, "eval_samples_per_second": 4.135, "eval_steps_per_second": 0.521, "eval_wer": 0.22980008999164364, "step": 4464 }, { "epoch": 62.08, "learning_rate": 3.604e-05, "loss": 0.4579, "step": 4470 }, { "epoch": 62.22, "learning_rate": 3.602857142857143e-05, "loss": 0.4386, "step": 4480 }, { "epoch": 62.36, "learning_rate": 3.601714285714286e-05, "loss": 0.4275, "step": 4490 }, { "epoch": 62.5, "learning_rate": 3.600571428571429e-05, "loss": 0.4233, "step": 4500 }, { "epoch": 62.64, "learning_rate": 3.599428571428572e-05, "loss": 0.4096, "step": 4510 }, { "epoch": 62.78, "learning_rate": 3.598285714285715e-05, "loss": 0.42, "step": 4520 }, { "epoch": 62.91, "learning_rate": 3.5971428571428575e-05, "loss": 0.415, "step": 4530 }, { "epoch": 63.0, "eval_loss": 0.516696572303772, "eval_runtime": 128.7617, "eval_samples_per_second": 4.132, "eval_steps_per_second": 0.52, "eval_wer": 0.2224079192646397, "step": 4536 }, { "epoch": 63.06, "learning_rate": 3.596e-05, "loss": 0.4325, "step": 4540 }, { "epoch": 63.19, "learning_rate": 3.594857142857143e-05, "loss": 0.4239, "step": 4550 }, { "epoch": 63.33, "learning_rate": 3.593714285714286e-05, "loss": 0.435, "step": 4560 }, { "epoch": 63.47, "learning_rate": 3.592571428571429e-05, "loss": 0.4249, "step": 4570 }, { "epoch": 63.61, "learning_rate": 3.591428571428572e-05, "loss": 0.4283, "step": 4580 }, { "epoch": 63.75, "learning_rate": 3.590285714285715e-05, "loss": 0.4309, "step": 4590 }, { "epoch": 63.89, "learning_rate": 3.5891428571428575e-05, "loss": 0.4308, "step": 4600 }, { "epoch": 64.0, "eval_loss": 0.5324345827102661, "eval_runtime": 129.2354, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.2287073343189561, "step": 4608 }, { "epoch": 64.03, "learning_rate": 3.588e-05, "loss": 0.4556, "step": 4610 }, { "epoch": 64.17, "learning_rate": 3.586857142857143e-05, "loss": 0.4315, "step": 4620 }, { "epoch": 64.3, "learning_rate": 3.585714285714286e-05, "loss": 0.4261, "step": 4630 }, { "epoch": 64.44, "learning_rate": 3.584571428571429e-05, "loss": 0.4098, "step": 4640 }, { "epoch": 64.58, "learning_rate": 3.583428571428572e-05, "loss": 0.4278, "step": 4650 }, { "epoch": 64.72, "learning_rate": 3.582285714285714e-05, "loss": 0.4258, "step": 4660 }, { "epoch": 64.86, "learning_rate": 3.581142857142857e-05, "loss": 0.4286, "step": 4670 }, { "epoch": 65.0, "learning_rate": 3.58e-05, "loss": 0.4247, "step": 4680 }, { "epoch": 65.0, "eval_loss": 0.5395667552947998, "eval_runtime": 128.8047, "eval_samples_per_second": 4.13, "eval_steps_per_second": 0.52, "eval_wer": 0.2224079192646397, "step": 4680 }, { "epoch": 65.14, "learning_rate": 3.578857142857143e-05, "loss": 0.4413, "step": 4690 }, { "epoch": 65.28, "learning_rate": 3.577714285714286e-05, "loss": 0.4307, "step": 4700 }, { "epoch": 65.42, "learning_rate": 3.576571428571429e-05, "loss": 0.4181, "step": 4710 }, { "epoch": 65.55, "learning_rate": 3.5754285714285717e-05, "loss": 0.4149, "step": 4720 }, { "epoch": 65.69, "learning_rate": 3.574285714285714e-05, "loss": 0.4298, "step": 4730 }, { "epoch": 65.83, "learning_rate": 3.573142857142857e-05, "loss": 0.4336, "step": 4740 }, { "epoch": 65.97, "learning_rate": 3.5720000000000004e-05, "loss": 0.4076, "step": 4750 }, { "epoch": 66.0, "eval_loss": 0.5354385375976562, "eval_runtime": 130.1622, "eval_samples_per_second": 4.087, "eval_steps_per_second": 0.515, "eval_wer": 0.22742173940991195, "step": 4752 }, { "epoch": 66.11, "learning_rate": 3.570857142857143e-05, "loss": 0.4297, "step": 4760 }, { "epoch": 66.25, "learning_rate": 3.5697142857142864e-05, "loss": 0.4294, "step": 4770 }, { "epoch": 66.39, "learning_rate": 3.568571428571429e-05, "loss": 0.4164, "step": 4780 }, { "epoch": 66.53, "learning_rate": 3.567428571428572e-05, "loss": 0.436, "step": 4790 }, { "epoch": 66.66, "learning_rate": 3.5662857142857144e-05, "loss": 0.4204, "step": 4800 }, { "epoch": 66.8, "learning_rate": 3.565142857142857e-05, "loss": 0.4166, "step": 4810 }, { "epoch": 66.94, "learning_rate": 3.5640000000000004e-05, "loss": 0.4196, "step": 4820 }, { "epoch": 67.0, "eval_loss": 0.552278995513916, "eval_runtime": 130.0889, "eval_samples_per_second": 4.09, "eval_steps_per_second": 0.515, "eval_wer": 0.2224721990100919, "step": 4824 }, { "epoch": 67.08, "learning_rate": 3.562857142857143e-05, "loss": 0.425, "step": 4830 }, { "epoch": 67.22, "learning_rate": 3.5617142857142865e-05, "loss": 0.4403, "step": 4840 }, { "epoch": 67.36, "learning_rate": 3.5605714285714285e-05, "loss": 0.4079, "step": 4850 }, { "epoch": 67.5, "learning_rate": 3.559428571428572e-05, "loss": 0.4238, "step": 4860 }, { "epoch": 67.64, "learning_rate": 3.5582857142857145e-05, "loss": 0.4209, "step": 4870 }, { "epoch": 67.78, "learning_rate": 3.557142857142857e-05, "loss": 0.4251, "step": 4880 }, { "epoch": 67.91, "learning_rate": 3.5560000000000005e-05, "loss": 0.4216, "step": 4890 }, { "epoch": 68.0, "eval_loss": 0.5180095434188843, "eval_runtime": 129.8127, "eval_samples_per_second": 4.098, "eval_steps_per_second": 0.516, "eval_wer": 0.21662274217394098, "step": 4896 }, { "epoch": 68.06, "learning_rate": 3.554857142857143e-05, "loss": 0.4201, "step": 4900 }, { "epoch": 68.19, "learning_rate": 3.553714285714286e-05, "loss": 0.4189, "step": 4910 }, { "epoch": 68.33, "learning_rate": 3.5525714285714285e-05, "loss": 0.4298, "step": 4920 }, { "epoch": 68.47, "learning_rate": 3.551428571428572e-05, "loss": 0.4341, "step": 4930 }, { "epoch": 68.61, "learning_rate": 3.5502857142857146e-05, "loss": 0.4162, "step": 4940 }, { "epoch": 68.75, "learning_rate": 3.549142857142857e-05, "loss": 0.4127, "step": 4950 }, { "epoch": 68.89, "learning_rate": 3.5480000000000006e-05, "loss": 0.4132, "step": 4960 }, { "epoch": 69.0, "eval_loss": 0.5110918879508972, "eval_runtime": 129.3603, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.22118660410104776, "step": 4968 }, { "epoch": 69.03, "learning_rate": 3.546857142857143e-05, "loss": 0.4305, "step": 4970 }, { "epoch": 69.17, "learning_rate": 3.545714285714286e-05, "loss": 0.4217, "step": 4980 }, { "epoch": 69.3, "learning_rate": 3.5445714285714286e-05, "loss": 0.4265, "step": 4990 }, { "epoch": 69.44, "learning_rate": 3.543428571428572e-05, "loss": 0.4336, "step": 5000 }, { "epoch": 69.58, "learning_rate": 3.5422857142857146e-05, "loss": 0.4294, "step": 5010 }, { "epoch": 69.72, "learning_rate": 3.541142857142857e-05, "loss": 0.4261, "step": 5020 }, { "epoch": 69.86, "learning_rate": 3.54e-05, "loss": 0.424, "step": 5030 }, { "epoch": 70.0, "learning_rate": 3.538857142857143e-05, "loss": 0.4306, "step": 5040 }, { "epoch": 70.0, "eval_loss": 0.5534010529518127, "eval_runtime": 130.0447, "eval_samples_per_second": 4.091, "eval_steps_per_second": 0.515, "eval_wer": 0.2416275631548499, "step": 5040 }, { "epoch": 70.14, "learning_rate": 3.537714285714286e-05, "loss": 0.441, "step": 5050 }, { "epoch": 70.28, "learning_rate": 3.536571428571429e-05, "loss": 0.4356, "step": 5060 }, { "epoch": 70.42, "learning_rate": 3.535428571428572e-05, "loss": 0.4331, "step": 5070 }, { "epoch": 70.55, "learning_rate": 3.534285714285715e-05, "loss": 0.426, "step": 5080 }, { "epoch": 70.69, "learning_rate": 3.5331428571428574e-05, "loss": 0.4281, "step": 5090 }, { "epoch": 70.83, "learning_rate": 3.532e-05, "loss": 0.4428, "step": 5100 }, { "epoch": 70.97, "learning_rate": 3.530857142857143e-05, "loss": 0.4327, "step": 5110 }, { "epoch": 71.0, "eval_loss": 0.5627850890159607, "eval_runtime": 129.2167, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.519, "eval_wer": 0.24734846050009643, "step": 5112 }, { "epoch": 71.11, "learning_rate": 3.529714285714286e-05, "loss": 0.4483, "step": 5120 }, { "epoch": 71.25, "learning_rate": 3.528571428571429e-05, "loss": 0.4275, "step": 5130 }, { "epoch": 71.39, "learning_rate": 3.527428571428572e-05, "loss": 0.432, "step": 5140 }, { "epoch": 71.53, "learning_rate": 3.526285714285715e-05, "loss": 0.4401, "step": 5150 }, { "epoch": 71.66, "learning_rate": 3.5251428571428575e-05, "loss": 0.4334, "step": 5160 }, { "epoch": 71.8, "learning_rate": 3.524e-05, "loss": 0.4263, "step": 5170 }, { "epoch": 71.94, "learning_rate": 3.522857142857143e-05, "loss": 0.4301, "step": 5180 }, { "epoch": 72.0, "eval_loss": 0.5216126441955566, "eval_runtime": 128.993, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.22523622806453686, "step": 5184 }, { "epoch": 72.08, "learning_rate": 3.521714285714286e-05, "loss": 0.4466, "step": 5190 }, { "epoch": 72.22, "learning_rate": 3.520571428571429e-05, "loss": 0.4311, "step": 5200 }, { "epoch": 72.36, "learning_rate": 3.519428571428572e-05, "loss": 0.4179, "step": 5210 }, { "epoch": 72.5, "learning_rate": 3.518285714285714e-05, "loss": 0.4202, "step": 5220 }, { "epoch": 72.64, "learning_rate": 3.5171428571428575e-05, "loss": 0.4282, "step": 5230 }, { "epoch": 72.78, "learning_rate": 3.516e-05, "loss": 0.4333, "step": 5240 }, { "epoch": 72.91, "learning_rate": 3.514857142857143e-05, "loss": 0.4328, "step": 5250 }, { "epoch": 73.0, "eval_loss": 0.5153868198394775, "eval_runtime": 129.2686, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22497910908272803, "step": 5256 }, { "epoch": 73.06, "learning_rate": 3.513714285714286e-05, "loss": 0.441, "step": 5260 }, { "epoch": 73.19, "learning_rate": 3.512571428571429e-05, "loss": 0.4177, "step": 5270 }, { "epoch": 73.33, "learning_rate": 3.5114285714285716e-05, "loss": 0.4256, "step": 5280 }, { "epoch": 73.47, "learning_rate": 3.510285714285714e-05, "loss": 0.423, "step": 5290 }, { "epoch": 73.61, "learning_rate": 3.5091428571428576e-05, "loss": 0.4238, "step": 5300 }, { "epoch": 73.75, "learning_rate": 3.508e-05, "loss": 0.4179, "step": 5310 }, { "epoch": 73.89, "learning_rate": 3.506857142857143e-05, "loss": 0.4021, "step": 5320 }, { "epoch": 74.0, "eval_loss": 0.5685908794403076, "eval_runtime": 128.8483, "eval_samples_per_second": 4.129, "eval_steps_per_second": 0.52, "eval_wer": 0.22446487111911037, "step": 5328 }, { "epoch": 74.03, "learning_rate": 3.505714285714286e-05, "loss": 0.4398, "step": 5330 }, { "epoch": 74.17, "learning_rate": 3.504571428571429e-05, "loss": 0.4041, "step": 5340 }, { "epoch": 74.3, "learning_rate": 3.503428571428572e-05, "loss": 0.418, "step": 5350 }, { "epoch": 74.44, "learning_rate": 3.5022857142857143e-05, "loss": 0.42, "step": 5360 }, { "epoch": 74.58, "learning_rate": 3.501142857142858e-05, "loss": 0.4232, "step": 5370 }, { "epoch": 74.72, "learning_rate": 3.5000000000000004e-05, "loss": 0.4252, "step": 5380 }, { "epoch": 74.86, "learning_rate": 3.498857142857143e-05, "loss": 0.4368, "step": 5390 }, { "epoch": 75.0, "learning_rate": 3.4977142857142864e-05, "loss": 0.465, "step": 5400 }, { "epoch": 75.0, "eval_loss": 0.523622989654541, "eval_runtime": 128.9304, "eval_samples_per_second": 4.126, "eval_steps_per_second": 0.52, "eval_wer": 0.24194896188211096, "step": 5400 }, { "epoch": 75.14, "learning_rate": 3.4965714285714284e-05, "loss": 0.4407, "step": 5410 }, { "epoch": 75.28, "learning_rate": 3.495428571428572e-05, "loss": 0.4207, "step": 5420 }, { "epoch": 75.42, "learning_rate": 3.4942857142857144e-05, "loss": 0.4204, "step": 5430 }, { "epoch": 75.55, "learning_rate": 3.493142857142858e-05, "loss": 0.4232, "step": 5440 }, { "epoch": 75.69, "learning_rate": 3.4920000000000004e-05, "loss": 0.4079, "step": 5450 }, { "epoch": 75.83, "learning_rate": 3.490857142857143e-05, "loss": 0.4168, "step": 5460 }, { "epoch": 75.97, "learning_rate": 3.489714285714286e-05, "loss": 0.416, "step": 5470 }, { "epoch": 76.0, "eval_loss": 0.5613663792610168, "eval_runtime": 130.3109, "eval_samples_per_second": 4.083, "eval_steps_per_second": 0.514, "eval_wer": 0.2365494632641255, "step": 5472 }, { "epoch": 76.11, "learning_rate": 3.4885714285714285e-05, "loss": 0.4242, "step": 5480 }, { "epoch": 76.25, "learning_rate": 3.487428571428572e-05, "loss": 0.4348, "step": 5490 }, { "epoch": 76.39, "learning_rate": 3.4862857142857145e-05, "loss": 0.4256, "step": 5500 }, { "epoch": 76.53, "learning_rate": 3.485142857142858e-05, "loss": 0.4155, "step": 5510 }, { "epoch": 76.66, "learning_rate": 3.4840000000000005e-05, "loss": 0.4253, "step": 5520 }, { "epoch": 76.8, "learning_rate": 3.482857142857143e-05, "loss": 0.4223, "step": 5530 }, { "epoch": 76.94, "learning_rate": 3.481714285714286e-05, "loss": 0.4337, "step": 5540 }, { "epoch": 77.0, "eval_loss": 0.527491569519043, "eval_runtime": 128.9936, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.23018576846435687, "step": 5544 }, { "epoch": 77.08, "learning_rate": 3.4805714285714285e-05, "loss": 0.4171, "step": 5550 }, { "epoch": 77.22, "learning_rate": 3.479428571428572e-05, "loss": 0.4206, "step": 5560 }, { "epoch": 77.36, "learning_rate": 3.4782857142857146e-05, "loss": 0.4246, "step": 5570 }, { "epoch": 77.5, "learning_rate": 3.477142857142858e-05, "loss": 0.4233, "step": 5580 }, { "epoch": 77.64, "learning_rate": 3.4760000000000006e-05, "loss": 0.4037, "step": 5590 }, { "epoch": 77.78, "learning_rate": 3.4748571428571426e-05, "loss": 0.4333, "step": 5600 }, { "epoch": 77.91, "learning_rate": 3.473714285714286e-05, "loss": 0.4157, "step": 5610 }, { "epoch": 78.0, "eval_loss": 0.5125765800476074, "eval_runtime": 129.1956, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22928585202802598, "step": 5616 }, { "epoch": 78.06, "learning_rate": 3.4725714285714286e-05, "loss": 0.4169, "step": 5620 }, { "epoch": 78.19, "learning_rate": 3.471428571428572e-05, "loss": 0.4084, "step": 5630 }, { "epoch": 78.33, "learning_rate": 3.4702857142857147e-05, "loss": 0.4253, "step": 5640 }, { "epoch": 78.47, "learning_rate": 3.469142857142857e-05, "loss": 0.4247, "step": 5650 }, { "epoch": 78.61, "learning_rate": 3.468e-05, "loss": 0.4217, "step": 5660 }, { "epoch": 78.75, "learning_rate": 3.466857142857143e-05, "loss": 0.4279, "step": 5670 }, { "epoch": 78.89, "learning_rate": 3.465714285714286e-05, "loss": 0.4143, "step": 5680 }, { "epoch": 79.0, "eval_loss": 0.5260418057441711, "eval_runtime": 128.6638, "eval_samples_per_second": 4.135, "eval_steps_per_second": 0.521, "eval_wer": 0.2375779391913608, "step": 5688 }, { "epoch": 79.03, "learning_rate": 3.464571428571429e-05, "loss": 0.426, "step": 5690 }, { "epoch": 79.17, "learning_rate": 3.463428571428572e-05, "loss": 0.4127, "step": 5700 }, { "epoch": 79.3, "learning_rate": 3.462285714285715e-05, "loss": 0.4187, "step": 5710 }, { "epoch": 79.44, "learning_rate": 3.4611428571428574e-05, "loss": 0.4032, "step": 5720 }, { "epoch": 79.58, "learning_rate": 3.46e-05, "loss": 0.4137, "step": 5730 }, { "epoch": 79.72, "learning_rate": 3.4588571428571434e-05, "loss": 0.4189, "step": 5740 }, { "epoch": 79.86, "learning_rate": 3.457714285714286e-05, "loss": 0.4079, "step": 5750 }, { "epoch": 80.0, "learning_rate": 3.456571428571429e-05, "loss": 0.4174, "step": 5760 }, { "epoch": 80.0, "eval_loss": 0.5253907442092896, "eval_runtime": 129.8443, "eval_samples_per_second": 4.097, "eval_steps_per_second": 0.516, "eval_wer": 0.23172848235520987, "step": 5760 }, { "epoch": 80.14, "learning_rate": 3.455428571428572e-05, "loss": 0.4043, "step": 5770 }, { "epoch": 80.28, "learning_rate": 3.454285714285714e-05, "loss": 0.3992, "step": 5780 }, { "epoch": 80.42, "learning_rate": 3.4531428571428575e-05, "loss": 0.4024, "step": 5790 }, { "epoch": 80.55, "learning_rate": 3.452e-05, "loss": 0.3964, "step": 5800 }, { "epoch": 80.69, "learning_rate": 3.4508571428571435e-05, "loss": 0.4055, "step": 5810 }, { "epoch": 80.83, "learning_rate": 3.449714285714286e-05, "loss": 0.4157, "step": 5820 }, { "epoch": 80.97, "learning_rate": 3.448571428571429e-05, "loss": 0.4174, "step": 5830 }, { "epoch": 81.0, "eval_loss": 0.49711883068084717, "eval_runtime": 129.8273, "eval_samples_per_second": 4.098, "eval_steps_per_second": 0.516, "eval_wer": 0.2190653725011249, "step": 5832 }, { "epoch": 81.11, "learning_rate": 3.4474285714285715e-05, "loss": 0.4146, "step": 5840 }, { "epoch": 81.25, "learning_rate": 3.446285714285714e-05, "loss": 0.4202, "step": 5850 }, { "epoch": 81.39, "learning_rate": 3.4451428571428576e-05, "loss": 0.4029, "step": 5860 }, { "epoch": 81.53, "learning_rate": 3.444e-05, "loss": 0.4081, "step": 5870 }, { "epoch": 81.66, "learning_rate": 3.4428571428571436e-05, "loss": 0.4085, "step": 5880 }, { "epoch": 81.8, "learning_rate": 3.441714285714286e-05, "loss": 0.408, "step": 5890 }, { "epoch": 81.94, "learning_rate": 3.440571428571429e-05, "loss": 0.4082, "step": 5900 }, { "epoch": 82.0, "eval_loss": 0.5245266556739807, "eval_runtime": 129.1918, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.2320498810824709, "step": 5904 }, { "epoch": 82.08, "learning_rate": 3.4394285714285716e-05, "loss": 0.4171, "step": 5910 }, { "epoch": 82.22, "learning_rate": 3.438285714285714e-05, "loss": 0.4054, "step": 5920 }, { "epoch": 82.36, "learning_rate": 3.4371428571428576e-05, "loss": 0.3891, "step": 5930 }, { "epoch": 82.5, "learning_rate": 3.436e-05, "loss": 0.419, "step": 5940 }, { "epoch": 82.64, "learning_rate": 3.4348571428571437e-05, "loss": 0.4102, "step": 5950 }, { "epoch": 82.78, "learning_rate": 3.433714285714286e-05, "loss": 0.4139, "step": 5960 }, { "epoch": 82.91, "learning_rate": 3.432571428571428e-05, "loss": 0.4263, "step": 5970 }, { "epoch": 83.0, "eval_loss": 0.5691802501678467, "eval_runtime": 128.5529, "eval_samples_per_second": 4.138, "eval_steps_per_second": 0.521, "eval_wer": 0.24014912900944912, "step": 5976 }, { "epoch": 83.06, "learning_rate": 3.431428571428572e-05, "loss": 0.4385, "step": 5980 }, { "epoch": 83.19, "learning_rate": 3.4302857142857144e-05, "loss": 0.4229, "step": 5990 }, { "epoch": 83.33, "learning_rate": 3.429142857142858e-05, "loss": 0.4051, "step": 6000 }, { "epoch": 83.47, "learning_rate": 3.4280000000000004e-05, "loss": 0.4113, "step": 6010 }, { "epoch": 83.61, "learning_rate": 3.426857142857143e-05, "loss": 0.3985, "step": 6020 }, { "epoch": 83.75, "learning_rate": 3.425714285714286e-05, "loss": 0.4071, "step": 6030 }, { "epoch": 83.89, "learning_rate": 3.4245714285714284e-05, "loss": 0.4164, "step": 6040 }, { "epoch": 84.0, "eval_loss": 0.520900547504425, "eval_runtime": 129.1106, "eval_samples_per_second": 4.12, "eval_steps_per_second": 0.519, "eval_wer": 0.23121424439159222, "step": 6048 }, { "epoch": 84.03, "learning_rate": 3.423428571428572e-05, "loss": 0.4248, "step": 6050 }, { "epoch": 84.17, "learning_rate": 3.4222857142857144e-05, "loss": 0.4034, "step": 6060 }, { "epoch": 84.3, "learning_rate": 3.421142857142858e-05, "loss": 0.4114, "step": 6070 }, { "epoch": 84.44, "learning_rate": 3.4200000000000005e-05, "loss": 0.4204, "step": 6080 }, { "epoch": 84.58, "learning_rate": 3.418857142857143e-05, "loss": 0.3974, "step": 6090 }, { "epoch": 84.72, "learning_rate": 3.417714285714286e-05, "loss": 0.3966, "step": 6100 }, { "epoch": 84.86, "learning_rate": 3.4165714285714285e-05, "loss": 0.4068, "step": 6110 }, { "epoch": 85.0, "learning_rate": 3.415428571428572e-05, "loss": 0.4144, "step": 6120 }, { "epoch": 85.0, "eval_loss": 0.5164024233818054, "eval_runtime": 128.5527, "eval_samples_per_second": 4.138, "eval_steps_per_second": 0.521, "eval_wer": 0.23404255319148937, "step": 6120 }, { "epoch": 85.14, "learning_rate": 3.4142857142857145e-05, "loss": 0.4168, "step": 6130 }, { "epoch": 85.28, "learning_rate": 3.413142857142858e-05, "loss": 0.4246, "step": 6140 }, { "epoch": 85.42, "learning_rate": 3.4120000000000005e-05, "loss": 0.4282, "step": 6150 }, { "epoch": 85.55, "learning_rate": 3.410857142857143e-05, "loss": 0.4204, "step": 6160 }, { "epoch": 85.69, "learning_rate": 3.409714285714286e-05, "loss": 0.429, "step": 6170 }, { "epoch": 85.83, "learning_rate": 3.4085714285714286e-05, "loss": 0.4405, "step": 6180 }, { "epoch": 85.97, "learning_rate": 3.407428571428572e-05, "loss": 0.4189, "step": 6190 }, { "epoch": 86.0, "eval_loss": 0.5544713735580444, "eval_runtime": 129.6903, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.24587002635469563, "step": 6192 }, { "epoch": 86.11, "learning_rate": 3.4062857142857146e-05, "loss": 0.42, "step": 6200 }, { "epoch": 86.25, "learning_rate": 3.405142857142857e-05, "loss": 0.4149, "step": 6210 }, { "epoch": 86.39, "learning_rate": 3.404e-05, "loss": 0.4116, "step": 6220 }, { "epoch": 86.53, "learning_rate": 3.402857142857143e-05, "loss": 0.4144, "step": 6230 }, { "epoch": 86.66, "learning_rate": 3.401714285714286e-05, "loss": 0.4187, "step": 6240 }, { "epoch": 86.8, "learning_rate": 3.4005714285714286e-05, "loss": 0.4211, "step": 6250 }, { "epoch": 86.94, "learning_rate": 3.399428571428572e-05, "loss": 0.4311, "step": 6260 }, { "epoch": 87.0, "eval_loss": 0.5349487662315369, "eval_runtime": 129.2049, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.519, "eval_wer": 0.24773413897280966, "step": 6264 }, { "epoch": 87.08, "learning_rate": 3.398285714285715e-05, "loss": 0.4423, "step": 6270 }, { "epoch": 87.22, "learning_rate": 3.397142857142857e-05, "loss": 0.427, "step": 6280 }, { "epoch": 87.36, "learning_rate": 3.396e-05, "loss": 0.4, "step": 6290 }, { "epoch": 87.5, "learning_rate": 3.3948571428571434e-05, "loss": 0.4067, "step": 6300 }, { "epoch": 87.64, "learning_rate": 3.393714285714286e-05, "loss": 0.3944, "step": 6310 }, { "epoch": 87.78, "learning_rate": 3.3925714285714294e-05, "loss": 0.4018, "step": 6320 }, { "epoch": 87.91, "learning_rate": 3.391542857142857e-05, "loss": 0.4224, "step": 6330 }, { "epoch": 88.0, "eval_loss": 0.5093081593513489, "eval_runtime": 129.1296, "eval_samples_per_second": 4.12, "eval_steps_per_second": 0.519, "eval_wer": 0.2375136594459086, "step": 6336 }, { "epoch": 88.06, "learning_rate": 3.3904000000000006e-05, "loss": 0.4295, "step": 6340 }, { "epoch": 88.19, "learning_rate": 3.389257142857143e-05, "loss": 0.407, "step": 6350 }, { "epoch": 88.33, "learning_rate": 3.388114285714286e-05, "loss": 0.4063, "step": 6360 }, { "epoch": 88.47, "learning_rate": 3.3869714285714286e-05, "loss": 0.4067, "step": 6370 }, { "epoch": 88.61, "learning_rate": 3.385828571428572e-05, "loss": 0.3984, "step": 6380 }, { "epoch": 88.75, "learning_rate": 3.3846857142857147e-05, "loss": 0.4132, "step": 6390 }, { "epoch": 88.89, "learning_rate": 3.383542857142857e-05, "loss": 0.4069, "step": 6400 }, { "epoch": 89.0, "eval_loss": 0.5663569569587708, "eval_runtime": 128.7222, "eval_samples_per_second": 4.133, "eval_steps_per_second": 0.521, "eval_wer": 0.24432731246384265, "step": 6408 }, { "epoch": 89.03, "learning_rate": 3.382400000000001e-05, "loss": 0.4234, "step": 6410 }, { "epoch": 89.17, "learning_rate": 3.381257142857143e-05, "loss": 0.408, "step": 6420 }, { "epoch": 89.3, "learning_rate": 3.380114285714286e-05, "loss": 0.4063, "step": 6430 }, { "epoch": 89.44, "learning_rate": 3.378971428571429e-05, "loss": 0.4123, "step": 6440 }, { "epoch": 89.58, "learning_rate": 3.377828571428572e-05, "loss": 0.4065, "step": 6450 }, { "epoch": 89.72, "learning_rate": 3.376685714285715e-05, "loss": 0.4128, "step": 6460 }, { "epoch": 89.86, "learning_rate": 3.3755428571428574e-05, "loss": 0.4086, "step": 6470 }, { "epoch": 90.0, "learning_rate": 3.3744e-05, "loss": 0.4082, "step": 6480 }, { "epoch": 90.0, "eval_loss": 0.542646050453186, "eval_runtime": 129.1178, "eval_samples_per_second": 4.12, "eval_steps_per_second": 0.519, "eval_wer": 0.23905637333676158, "step": 6480 }, { "epoch": 90.14, "learning_rate": 3.373257142857143e-05, "loss": 0.4021, "step": 6490 }, { "epoch": 90.28, "learning_rate": 3.372114285714286e-05, "loss": 0.4074, "step": 6500 }, { "epoch": 90.42, "learning_rate": 3.370971428571429e-05, "loss": 0.4023, "step": 6510 }, { "epoch": 90.55, "learning_rate": 3.369828571428572e-05, "loss": 0.3947, "step": 6520 }, { "epoch": 90.69, "learning_rate": 3.368685714285715e-05, "loss": 0.3965, "step": 6530 }, { "epoch": 90.83, "learning_rate": 3.3675428571428575e-05, "loss": 0.3934, "step": 6540 }, { "epoch": 90.97, "learning_rate": 3.3664e-05, "loss": 0.411, "step": 6550 }, { "epoch": 91.0, "eval_loss": 0.5218707919120789, "eval_runtime": 129.4648, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.518, "eval_wer": 0.23391399370058494, "step": 6552 }, { "epoch": 91.11, "learning_rate": 3.365257142857143e-05, "loss": 0.4143, "step": 6560 }, { "epoch": 91.25, "learning_rate": 3.364114285714286e-05, "loss": 0.409, "step": 6570 }, { "epoch": 91.39, "learning_rate": 3.362971428571429e-05, "loss": 0.3964, "step": 6580 }, { "epoch": 91.53, "learning_rate": 3.361828571428572e-05, "loss": 0.3931, "step": 6590 }, { "epoch": 91.66, "learning_rate": 3.360685714285715e-05, "loss": 0.4038, "step": 6600 }, { "epoch": 91.8, "learning_rate": 3.359542857142857e-05, "loss": 0.4009, "step": 6610 }, { "epoch": 91.94, "learning_rate": 3.3584e-05, "loss": 0.4085, "step": 6620 }, { "epoch": 92.0, "eval_loss": 0.5467609167098999, "eval_runtime": 128.9177, "eval_samples_per_second": 4.127, "eval_steps_per_second": 0.52, "eval_wer": 0.2360352253005078, "step": 6624 }, { "epoch": 92.08, "learning_rate": 3.357257142857143e-05, "loss": 0.4123, "step": 6630 }, { "epoch": 92.22, "learning_rate": 3.356114285714286e-05, "loss": 0.3962, "step": 6640 }, { "epoch": 92.36, "learning_rate": 3.354971428571429e-05, "loss": 0.3939, "step": 6650 }, { "epoch": 92.5, "learning_rate": 3.3538285714285716e-05, "loss": 0.3974, "step": 6660 }, { "epoch": 92.64, "learning_rate": 3.352685714285714e-05, "loss": 0.3939, "step": 6670 }, { "epoch": 92.78, "learning_rate": 3.351542857142857e-05, "loss": 0.4115, "step": 6680 }, { "epoch": 92.91, "learning_rate": 3.3504e-05, "loss": 0.4012, "step": 6690 }, { "epoch": 93.0, "eval_loss": 0.5513857007026672, "eval_runtime": 128.8224, "eval_samples_per_second": 4.13, "eval_steps_per_second": 0.52, "eval_wer": 0.25255511988172524, "step": 6696 }, { "epoch": 93.06, "learning_rate": 3.349257142857143e-05, "loss": 0.4341, "step": 6700 }, { "epoch": 93.19, "learning_rate": 3.3481142857142863e-05, "loss": 0.4127, "step": 6710 }, { "epoch": 93.33, "learning_rate": 3.346971428571429e-05, "loss": 0.4024, "step": 6720 }, { "epoch": 93.47, "learning_rate": 3.345828571428572e-05, "loss": 0.4158, "step": 6730 }, { "epoch": 93.61, "learning_rate": 3.3446857142857144e-05, "loss": 0.413, "step": 6740 }, { "epoch": 93.75, "learning_rate": 3.343542857142857e-05, "loss": 0.4095, "step": 6750 }, { "epoch": 93.89, "learning_rate": 3.3424000000000004e-05, "loss": 0.3863, "step": 6760 }, { "epoch": 94.0, "eval_loss": 0.5440473556518555, "eval_runtime": 128.4821, "eval_samples_per_second": 4.141, "eval_steps_per_second": 0.521, "eval_wer": 0.2343639519187504, "step": 6768 }, { "epoch": 94.03, "learning_rate": 3.341257142857143e-05, "loss": 0.4062, "step": 6770 }, { "epoch": 94.17, "learning_rate": 3.3401142857142864e-05, "loss": 0.3944, "step": 6780 }, { "epoch": 94.3, "learning_rate": 3.338971428571429e-05, "loss": 0.395, "step": 6790 }, { "epoch": 94.44, "learning_rate": 3.337828571428572e-05, "loss": 0.3926, "step": 6800 }, { "epoch": 94.58, "learning_rate": 3.3366857142857144e-05, "loss": 0.4028, "step": 6810 }, { "epoch": 94.72, "learning_rate": 3.335542857142858e-05, "loss": 0.4199, "step": 6820 }, { "epoch": 94.86, "learning_rate": 3.3344000000000005e-05, "loss": 0.4132, "step": 6830 }, { "epoch": 95.0, "learning_rate": 3.333257142857143e-05, "loss": 0.4098, "step": 6840 }, { "epoch": 95.0, "eval_loss": 0.5355387330055237, "eval_runtime": 128.6796, "eval_samples_per_second": 4.134, "eval_steps_per_second": 0.521, "eval_wer": 0.23616378479141223, "step": 6840 }, { "epoch": 95.14, "learning_rate": 3.332114285714286e-05, "loss": 0.3988, "step": 6850 }, { "epoch": 95.28, "learning_rate": 3.3309714285714285e-05, "loss": 0.4007, "step": 6860 }, { "epoch": 95.42, "learning_rate": 3.329828571428572e-05, "loss": 0.4063, "step": 6870 }, { "epoch": 95.55, "learning_rate": 3.3286857142857145e-05, "loss": 0.4053, "step": 6880 }, { "epoch": 95.69, "learning_rate": 3.327542857142858e-05, "loss": 0.3959, "step": 6890 }, { "epoch": 95.83, "learning_rate": 3.3264000000000005e-05, "loss": 0.4123, "step": 6900 }, { "epoch": 95.97, "learning_rate": 3.325257142857143e-05, "loss": 0.4136, "step": 6910 }, { "epoch": 96.0, "eval_loss": 0.5400183200836182, "eval_runtime": 128.9505, "eval_samples_per_second": 4.126, "eval_steps_per_second": 0.52, "eval_wer": 0.2409204859548756, "step": 6912 }, { "epoch": 96.11, "learning_rate": 3.324114285714286e-05, "loss": 0.4, "step": 6920 }, { "epoch": 96.25, "learning_rate": 3.3229714285714286e-05, "loss": 0.3989, "step": 6930 }, { "epoch": 96.39, "learning_rate": 3.321828571428572e-05, "loss": 0.3894, "step": 6940 }, { "epoch": 96.53, "learning_rate": 3.3206857142857146e-05, "loss": 0.4086, "step": 6950 }, { "epoch": 96.66, "learning_rate": 3.319542857142858e-05, "loss": 0.4, "step": 6960 }, { "epoch": 96.8, "learning_rate": 3.3184000000000006e-05, "loss": 0.4054, "step": 6970 }, { "epoch": 96.94, "learning_rate": 3.3172571428571426e-05, "loss": 0.4066, "step": 6980 }, { "epoch": 97.0, "eval_loss": 0.5116966366767883, "eval_runtime": 128.7107, "eval_samples_per_second": 4.133, "eval_steps_per_second": 0.521, "eval_wer": 0.23127852413704442, "step": 6984 }, { "epoch": 97.08, "learning_rate": 3.316114285714286e-05, "loss": 0.4034, "step": 6990 }, { "epoch": 97.22, "learning_rate": 3.3149714285714286e-05, "loss": 0.3973, "step": 7000 }, { "epoch": 97.36, "learning_rate": 3.313828571428572e-05, "loss": 0.3946, "step": 7010 }, { "epoch": 97.5, "learning_rate": 3.312685714285715e-05, "loss": 0.3935, "step": 7020 }, { "epoch": 97.64, "learning_rate": 3.3115428571428573e-05, "loss": 0.391, "step": 7030 }, { "epoch": 97.78, "learning_rate": 3.3104e-05, "loss": 0.4029, "step": 7040 }, { "epoch": 97.91, "learning_rate": 3.309257142857143e-05, "loss": 0.4131, "step": 7050 }, { "epoch": 98.0, "eval_loss": 0.536474347114563, "eval_runtime": 129.0734, "eval_samples_per_second": 4.122, "eval_steps_per_second": 0.519, "eval_wer": 0.2375136594459086, "step": 7056 }, { "epoch": 98.06, "learning_rate": 3.308114285714286e-05, "loss": 0.3989, "step": 7060 }, { "epoch": 98.19, "learning_rate": 3.306971428571429e-05, "loss": 0.3894, "step": 7070 }, { "epoch": 98.33, "learning_rate": 3.305828571428572e-05, "loss": 0.389, "step": 7080 }, { "epoch": 98.47, "learning_rate": 3.304685714285715e-05, "loss": 0.4028, "step": 7090 }, { "epoch": 98.61, "learning_rate": 3.3035428571428574e-05, "loss": 0.386, "step": 7100 }, { "epoch": 98.75, "learning_rate": 3.3024e-05, "loss": 0.3871, "step": 7110 }, { "epoch": 98.89, "learning_rate": 3.301257142857143e-05, "loss": 0.3852, "step": 7120 }, { "epoch": 99.0, "eval_loss": 0.5171608328819275, "eval_runtime": 128.7263, "eval_samples_per_second": 4.133, "eval_steps_per_second": 0.52, "eval_wer": 0.2325641190460886, "step": 7128 }, { "epoch": 99.03, "learning_rate": 3.300114285714286e-05, "loss": 0.4162, "step": 7130 }, { "epoch": 99.17, "learning_rate": 3.298971428571429e-05, "loss": 0.3925, "step": 7140 }, { "epoch": 99.3, "learning_rate": 3.297828571428572e-05, "loss": 0.3867, "step": 7150 }, { "epoch": 99.44, "learning_rate": 3.296685714285715e-05, "loss": 0.3972, "step": 7160 }, { "epoch": 99.58, "learning_rate": 3.2955428571428575e-05, "loss": 0.4051, "step": 7170 }, { "epoch": 99.72, "learning_rate": 3.2944e-05, "loss": 0.3958, "step": 7180 }, { "epoch": 99.86, "learning_rate": 3.293257142857143e-05, "loss": 0.3885, "step": 7190 }, { "epoch": 100.0, "learning_rate": 3.292114285714286e-05, "loss": 0.3935, "step": 7200 }, { "epoch": 100.0, "eval_loss": 0.5084860920906067, "eval_runtime": 129.0291, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.229607250755287, "step": 7200 }, { "epoch": 100.14, "learning_rate": 3.290971428571429e-05, "loss": 0.4035, "step": 7210 }, { "epoch": 100.28, "learning_rate": 3.2898285714285715e-05, "loss": 0.4059, "step": 7220 }, { "epoch": 100.42, "learning_rate": 3.288685714285714e-05, "loss": 0.3902, "step": 7230 }, { "epoch": 100.55, "learning_rate": 3.2875428571428576e-05, "loss": 0.3958, "step": 7240 }, { "epoch": 100.69, "learning_rate": 3.2864e-05, "loss": 0.3959, "step": 7250 }, { "epoch": 100.83, "learning_rate": 3.285257142857143e-05, "loss": 0.3934, "step": 7260 }, { "epoch": 100.97, "learning_rate": 3.284114285714286e-05, "loss": 0.4093, "step": 7270 }, { "epoch": 101.0, "eval_loss": 0.5649605393409729, "eval_runtime": 129.4376, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.25249084013627304, "step": 7272 }, { "epoch": 101.11, "learning_rate": 3.282971428571429e-05, "loss": 0.4076, "step": 7280 }, { "epoch": 101.25, "learning_rate": 3.2818285714285716e-05, "loss": 0.4009, "step": 7290 }, { "epoch": 101.39, "learning_rate": 3.280685714285714e-05, "loss": 0.4057, "step": 7300 }, { "epoch": 101.53, "learning_rate": 3.2795428571428576e-05, "loss": 0.413, "step": 7310 }, { "epoch": 101.66, "learning_rate": 3.2784e-05, "loss": 0.4007, "step": 7320 }, { "epoch": 101.8, "learning_rate": 3.277257142857143e-05, "loss": 0.395, "step": 7330 }, { "epoch": 101.94, "learning_rate": 3.2761142857142864e-05, "loss": 0.3938, "step": 7340 }, { "epoch": 102.0, "eval_loss": 0.5246307253837585, "eval_runtime": 129.1776, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.23243555955518416, "step": 7344 }, { "epoch": 102.08, "learning_rate": 3.274971428571429e-05, "loss": 0.4032, "step": 7350 }, { "epoch": 102.22, "learning_rate": 3.273828571428572e-05, "loss": 0.3909, "step": 7360 }, { "epoch": 102.36, "learning_rate": 3.2726857142857144e-05, "loss": 0.3726, "step": 7370 }, { "epoch": 102.5, "learning_rate": 3.271542857142858e-05, "loss": 0.3954, "step": 7380 }, { "epoch": 102.64, "learning_rate": 3.2704000000000004e-05, "loss": 0.3899, "step": 7390 }, { "epoch": 102.78, "learning_rate": 3.269257142857143e-05, "loss": 0.386, "step": 7400 }, { "epoch": 102.91, "learning_rate": 3.268114285714286e-05, "loss": 0.4016, "step": 7410 }, { "epoch": 103.0, "eval_loss": 0.5083659291267395, "eval_runtime": 129.4605, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.518, "eval_wer": 0.22915729253712155, "step": 7416 }, { "epoch": 103.06, "learning_rate": 3.2669714285714284e-05, "loss": 0.4058, "step": 7420 }, { "epoch": 103.19, "learning_rate": 3.265828571428572e-05, "loss": 0.4006, "step": 7430 }, { "epoch": 103.33, "learning_rate": 3.2646857142857145e-05, "loss": 0.3985, "step": 7440 }, { "epoch": 103.47, "learning_rate": 3.263542857142858e-05, "loss": 0.4072, "step": 7450 }, { "epoch": 103.61, "learning_rate": 3.2624000000000005e-05, "loss": 0.4091, "step": 7460 }, { "epoch": 103.75, "learning_rate": 3.261257142857143e-05, "loss": 0.3986, "step": 7470 }, { "epoch": 103.89, "learning_rate": 3.260114285714286e-05, "loss": 0.412, "step": 7480 }, { "epoch": 104.0, "eval_loss": 0.530807614326477, "eval_runtime": 129.9649, "eval_samples_per_second": 4.093, "eval_steps_per_second": 0.516, "eval_wer": 0.22105804461014333, "step": 7488 }, { "epoch": 104.03, "learning_rate": 3.2589714285714285e-05, "loss": 0.4185, "step": 7490 }, { "epoch": 104.17, "learning_rate": 3.257828571428572e-05, "loss": 0.4076, "step": 7500 }, { "epoch": 104.3, "learning_rate": 3.2566857142857145e-05, "loss": 0.4012, "step": 7510 }, { "epoch": 104.44, "learning_rate": 3.255542857142858e-05, "loss": 0.4064, "step": 7520 }, { "epoch": 104.58, "learning_rate": 3.2544000000000006e-05, "loss": 0.3982, "step": 7530 }, { "epoch": 104.72, "learning_rate": 3.253257142857143e-05, "loss": 0.4042, "step": 7540 }, { "epoch": 104.86, "learning_rate": 3.252114285714286e-05, "loss": 0.3979, "step": 7550 }, { "epoch": 105.0, "learning_rate": 3.2509714285714286e-05, "loss": 0.3903, "step": 7560 }, { "epoch": 105.0, "eval_loss": 0.5046549439430237, "eval_runtime": 129.5771, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.22009384842836022, "step": 7560 }, { "epoch": 105.14, "learning_rate": 3.249828571428572e-05, "loss": 0.3977, "step": 7570 }, { "epoch": 105.28, "learning_rate": 3.2486857142857146e-05, "loss": 0.3876, "step": 7580 }, { "epoch": 105.42, "learning_rate": 3.247542857142857e-05, "loss": 0.3917, "step": 7590 }, { "epoch": 105.55, "learning_rate": 3.2464e-05, "loss": 0.3879, "step": 7600 }, { "epoch": 105.69, "learning_rate": 3.245257142857143e-05, "loss": 0.3889, "step": 7610 }, { "epoch": 105.83, "learning_rate": 3.244114285714286e-05, "loss": 0.3995, "step": 7620 }, { "epoch": 105.97, "learning_rate": 3.2429714285714287e-05, "loss": 0.396, "step": 7630 }, { "epoch": 106.0, "eval_loss": 0.5302377343177795, "eval_runtime": 129.5065, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.2222793597737353, "step": 7632 }, { "epoch": 106.11, "learning_rate": 3.241828571428572e-05, "loss": 0.3909, "step": 7640 }, { "epoch": 106.25, "learning_rate": 3.240685714285715e-05, "loss": 0.4007, "step": 7650 }, { "epoch": 106.39, "learning_rate": 3.2395428571428574e-05, "loss": 0.3823, "step": 7660 }, { "epoch": 106.53, "learning_rate": 3.2384e-05, "loss": 0.3998, "step": 7670 }, { "epoch": 106.66, "learning_rate": 3.2372571428571434e-05, "loss": 0.4064, "step": 7680 }, { "epoch": 106.8, "learning_rate": 3.236114285714286e-05, "loss": 0.4023, "step": 7690 }, { "epoch": 106.94, "learning_rate": 3.234971428571429e-05, "loss": 0.3891, "step": 7700 }, { "epoch": 107.0, "eval_loss": 0.5367183685302734, "eval_runtime": 129.6585, "eval_samples_per_second": 4.103, "eval_steps_per_second": 0.517, "eval_wer": 0.22215080028283088, "step": 7704 }, { "epoch": 107.08, "learning_rate": 3.233828571428572e-05, "loss": 0.405, "step": 7710 }, { "epoch": 107.22, "learning_rate": 3.232685714285715e-05, "loss": 0.3923, "step": 7720 }, { "epoch": 107.36, "learning_rate": 3.2315428571428574e-05, "loss": 0.3685, "step": 7730 }, { "epoch": 107.5, "learning_rate": 3.2304e-05, "loss": 0.3895, "step": 7740 }, { "epoch": 107.64, "learning_rate": 3.2292571428571435e-05, "loss": 0.391, "step": 7750 }, { "epoch": 107.78, "learning_rate": 3.228114285714286e-05, "loss": 0.3931, "step": 7760 }, { "epoch": 107.91, "learning_rate": 3.226971428571429e-05, "loss": 0.3886, "step": 7770 }, { "epoch": 108.0, "eval_loss": 0.5459126234054565, "eval_runtime": 130.5661, "eval_samples_per_second": 4.075, "eval_steps_per_second": 0.513, "eval_wer": 0.2327569582824452, "step": 7776 }, { "epoch": 108.06, "learning_rate": 3.2258285714285715e-05, "loss": 0.4131, "step": 7780 }, { "epoch": 108.19, "learning_rate": 3.224685714285714e-05, "loss": 0.3987, "step": 7790 }, { "epoch": 108.33, "learning_rate": 3.2235428571428575e-05, "loss": 0.3803, "step": 7800 }, { "epoch": 108.47, "learning_rate": 3.2224e-05, "loss": 0.3935, "step": 7810 }, { "epoch": 108.61, "learning_rate": 3.2212571428571435e-05, "loss": 0.3887, "step": 7820 }, { "epoch": 108.75, "learning_rate": 3.220114285714286e-05, "loss": 0.3947, "step": 7830 }, { "epoch": 108.89, "learning_rate": 3.218971428571429e-05, "loss": 0.379, "step": 7840 }, { "epoch": 109.0, "eval_loss": 0.5486302375793457, "eval_runtime": 129.0792, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.23404255319148937, "step": 7848 }, { "epoch": 109.03, "learning_rate": 3.2178285714285716e-05, "loss": 0.4064, "step": 7850 }, { "epoch": 109.17, "learning_rate": 3.216685714285714e-05, "loss": 0.3903, "step": 7860 }, { "epoch": 109.3, "learning_rate": 3.2155428571428576e-05, "loss": 0.3899, "step": 7870 }, { "epoch": 109.44, "learning_rate": 3.2144e-05, "loss": 0.388, "step": 7880 }, { "epoch": 109.58, "learning_rate": 3.2132571428571436e-05, "loss": 0.3874, "step": 7890 }, { "epoch": 109.72, "learning_rate": 3.212114285714286e-05, "loss": 0.3953, "step": 7900 }, { "epoch": 109.86, "learning_rate": 3.210971428571429e-05, "loss": 0.3784, "step": 7910 }, { "epoch": 110.0, "learning_rate": 3.2098285714285716e-05, "loss": 0.4009, "step": 7920 }, { "epoch": 110.0, "eval_loss": 0.5080066323280334, "eval_runtime": 131.7674, "eval_samples_per_second": 4.037, "eval_steps_per_second": 0.508, "eval_wer": 0.21861541428295944, "step": 7920 }, { "epoch": 110.14, "learning_rate": 3.208685714285714e-05, "loss": 0.3871, "step": 7930 }, { "epoch": 110.28, "learning_rate": 3.207542857142858e-05, "loss": 0.3918, "step": 7940 }, { "epoch": 110.42, "learning_rate": 3.2064e-05, "loss": 0.3971, "step": 7950 }, { "epoch": 110.55, "learning_rate": 3.205257142857143e-05, "loss": 0.3891, "step": 7960 }, { "epoch": 110.69, "learning_rate": 3.204114285714286e-05, "loss": 0.3892, "step": 7970 }, { "epoch": 110.83, "learning_rate": 3.2029714285714284e-05, "loss": 0.3923, "step": 7980 }, { "epoch": 110.97, "learning_rate": 3.201828571428572e-05, "loss": 0.3967, "step": 7990 }, { "epoch": 111.0, "eval_loss": 0.5389477014541626, "eval_runtime": 131.3376, "eval_samples_per_second": 4.051, "eval_steps_per_second": 0.51, "eval_wer": 0.21925821173748153, "step": 7992 }, { "epoch": 111.11, "learning_rate": 3.2006857142857144e-05, "loss": 0.4136, "step": 8000 }, { "epoch": 111.25, "learning_rate": 3.199542857142858e-05, "loss": 0.4034, "step": 8010 }, { "epoch": 111.39, "learning_rate": 3.1984000000000004e-05, "loss": 0.4028, "step": 8020 }, { "epoch": 111.53, "learning_rate": 3.197257142857143e-05, "loss": 0.3905, "step": 8030 }, { "epoch": 111.66, "learning_rate": 3.196114285714286e-05, "loss": 0.3941, "step": 8040 }, { "epoch": 111.8, "learning_rate": 3.1949714285714284e-05, "loss": 0.4047, "step": 8050 }, { "epoch": 111.94, "learning_rate": 3.193828571428572e-05, "loss": 0.3988, "step": 8060 }, { "epoch": 112.0, "eval_loss": 0.5487829446792603, "eval_runtime": 131.5089, "eval_samples_per_second": 4.045, "eval_steps_per_second": 0.509, "eval_wer": 0.228064536864434, "step": 8064 }, { "epoch": 112.08, "learning_rate": 3.1926857142857145e-05, "loss": 0.4008, "step": 8070 }, { "epoch": 112.22, "learning_rate": 3.191542857142858e-05, "loss": 0.3879, "step": 8080 }, { "epoch": 112.36, "learning_rate": 3.1904000000000005e-05, "loss": 0.3913, "step": 8090 }, { "epoch": 112.5, "learning_rate": 3.189257142857143e-05, "loss": 0.4024, "step": 8100 }, { "epoch": 112.64, "learning_rate": 3.188114285714286e-05, "loss": 0.3896, "step": 8110 }, { "epoch": 112.78, "learning_rate": 3.186971428571429e-05, "loss": 0.3867, "step": 8120 }, { "epoch": 112.91, "learning_rate": 3.185828571428572e-05, "loss": 0.3952, "step": 8130 }, { "epoch": 113.0, "eval_loss": 0.5409157872200012, "eval_runtime": 135.8896, "eval_samples_per_second": 3.915, "eval_steps_per_second": 0.493, "eval_wer": 0.22935013177347818, "step": 8136 }, { "epoch": 113.06, "learning_rate": 3.1846857142857145e-05, "loss": 0.393, "step": 8140 }, { "epoch": 113.19, "learning_rate": 3.183542857142857e-05, "loss": 0.3926, "step": 8150 }, { "epoch": 113.33, "learning_rate": 3.1824e-05, "loss": 0.3807, "step": 8160 }, { "epoch": 113.47, "learning_rate": 3.181257142857143e-05, "loss": 0.3871, "step": 8170 }, { "epoch": 113.61, "learning_rate": 3.180114285714286e-05, "loss": 0.3836, "step": 8180 }, { "epoch": 113.75, "learning_rate": 3.178971428571429e-05, "loss": 0.3941, "step": 8190 }, { "epoch": 113.89, "learning_rate": 3.177828571428572e-05, "loss": 0.3884, "step": 8200 }, { "epoch": 114.0, "eval_loss": 0.5304366946220398, "eval_runtime": 132.3053, "eval_samples_per_second": 4.021, "eval_steps_per_second": 0.506, "eval_wer": 0.2325641190460886, "step": 8208 }, { "epoch": 114.03, "learning_rate": 3.1766857142857146e-05, "loss": 0.4175, "step": 8210 }, { "epoch": 114.17, "learning_rate": 3.175542857142857e-05, "loss": 0.3866, "step": 8220 }, { "epoch": 114.3, "learning_rate": 3.1744e-05, "loss": 0.3798, "step": 8230 }, { "epoch": 114.44, "learning_rate": 3.173257142857143e-05, "loss": 0.3959, "step": 8240 }, { "epoch": 114.58, "learning_rate": 3.172114285714286e-05, "loss": 0.3764, "step": 8250 }, { "epoch": 114.72, "learning_rate": 3.1709714285714293e-05, "loss": 0.3828, "step": 8260 }, { "epoch": 114.86, "learning_rate": 3.169828571428572e-05, "loss": 0.3717, "step": 8270 }, { "epoch": 115.0, "learning_rate": 3.168685714285715e-05, "loss": 0.3939, "step": 8280 }, { "epoch": 115.0, "eval_loss": 0.5542382597923279, "eval_runtime": 131.7683, "eval_samples_per_second": 4.037, "eval_steps_per_second": 0.508, "eval_wer": 0.22105804461014333, "step": 8280 }, { "epoch": 115.14, "learning_rate": 3.1675428571428574e-05, "loss": 0.3944, "step": 8290 }, { "epoch": 115.28, "learning_rate": 3.1664e-05, "loss": 0.3853, "step": 8300 }, { "epoch": 115.42, "learning_rate": 3.1652571428571434e-05, "loss": 0.3912, "step": 8310 }, { "epoch": 115.55, "learning_rate": 3.164114285714286e-05, "loss": 0.3839, "step": 8320 }, { "epoch": 115.69, "learning_rate": 3.162971428571429e-05, "loss": 0.3925, "step": 8330 }, { "epoch": 115.83, "learning_rate": 3.1618285714285714e-05, "loss": 0.396, "step": 8340 }, { "epoch": 115.97, "learning_rate": 3.160685714285714e-05, "loss": 0.3927, "step": 8350 }, { "epoch": 116.0, "eval_loss": 0.567578911781311, "eval_runtime": 130.9693, "eval_samples_per_second": 4.062, "eval_steps_per_second": 0.512, "eval_wer": 0.22594330526451115, "step": 8352 }, { "epoch": 116.11, "learning_rate": 3.1595428571428574e-05, "loss": 0.3962, "step": 8360 }, { "epoch": 116.25, "learning_rate": 3.1584e-05, "loss": 0.3893, "step": 8370 }, { "epoch": 116.39, "learning_rate": 3.1572571428571435e-05, "loss": 0.4014, "step": 8380 }, { "epoch": 116.53, "learning_rate": 3.156114285714286e-05, "loss": 0.4025, "step": 8390 }, { "epoch": 116.66, "learning_rate": 3.154971428571429e-05, "loss": 0.3996, "step": 8400 }, { "epoch": 116.8, "learning_rate": 3.1538285714285715e-05, "loss": 0.3839, "step": 8410 }, { "epoch": 116.94, "learning_rate": 3.152685714285714e-05, "loss": 0.3944, "step": 8420 }, { "epoch": 117.0, "eval_loss": 0.522085428237915, "eval_runtime": 131.2599, "eval_samples_per_second": 4.053, "eval_steps_per_second": 0.51, "eval_wer": 0.22099376486469113, "step": 8424 }, { "epoch": 117.08, "learning_rate": 3.1515428571428575e-05, "loss": 0.3949, "step": 8430 }, { "epoch": 117.22, "learning_rate": 3.1504e-05, "loss": 0.4056, "step": 8440 }, { "epoch": 117.36, "learning_rate": 3.1492571428571435e-05, "loss": 0.3932, "step": 8450 }, { "epoch": 117.5, "learning_rate": 3.148114285714286e-05, "loss": 0.393, "step": 8460 }, { "epoch": 117.64, "learning_rate": 3.146971428571429e-05, "loss": 0.3877, "step": 8470 }, { "epoch": 117.78, "learning_rate": 3.1458285714285716e-05, "loss": 0.4022, "step": 8480 }, { "epoch": 117.91, "learning_rate": 3.144685714285714e-05, "loss": 0.3941, "step": 8490 }, { "epoch": 118.0, "eval_loss": 0.5473552942276001, "eval_runtime": 133.3099, "eval_samples_per_second": 3.991, "eval_steps_per_second": 0.503, "eval_wer": 0.224657710355467, "step": 8496 }, { "epoch": 118.06, "learning_rate": 3.1435428571428576e-05, "loss": 0.4207, "step": 8500 }, { "epoch": 118.19, "learning_rate": 3.142514285714286e-05, "loss": 0.4192, "step": 8510 }, { "epoch": 118.33, "learning_rate": 3.141371428571429e-05, "loss": 0.4183, "step": 8520 }, { "epoch": 118.47, "learning_rate": 3.140228571428572e-05, "loss": 0.4004, "step": 8530 }, { "epoch": 118.61, "learning_rate": 3.139085714285715e-05, "loss": 0.3917, "step": 8540 }, { "epoch": 118.75, "learning_rate": 3.1379428571428575e-05, "loss": 0.3946, "step": 8550 }, { "epoch": 118.89, "learning_rate": 3.1368e-05, "loss": 0.3912, "step": 8560 }, { "epoch": 119.0, "eval_loss": 0.5450686812400818, "eval_runtime": 129.2494, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.218486854792055, "step": 8568 }, { "epoch": 119.03, "learning_rate": 3.135657142857143e-05, "loss": 0.409, "step": 8570 }, { "epoch": 119.17, "learning_rate": 3.134514285714286e-05, "loss": 0.383, "step": 8580 }, { "epoch": 119.3, "learning_rate": 3.133371428571429e-05, "loss": 0.3876, "step": 8590 }, { "epoch": 119.44, "learning_rate": 3.1322285714285716e-05, "loss": 0.3918, "step": 8600 }, { "epoch": 119.58, "learning_rate": 3.131085714285714e-05, "loss": 0.3914, "step": 8610 }, { "epoch": 119.72, "learning_rate": 3.1299428571428576e-05, "loss": 0.4052, "step": 8620 }, { "epoch": 119.86, "learning_rate": 3.1288e-05, "loss": 0.4188, "step": 8630 }, { "epoch": 120.0, "learning_rate": 3.127657142857143e-05, "loss": 0.4209, "step": 8640 }, { "epoch": 120.0, "eval_loss": 0.5281777381896973, "eval_runtime": 130.7013, "eval_samples_per_second": 4.07, "eval_steps_per_second": 0.513, "eval_wer": 0.22819309635533844, "step": 8640 }, { "epoch": 120.14, "learning_rate": 3.126514285714286e-05, "loss": 0.4175, "step": 8650 }, { "epoch": 120.28, "learning_rate": 3.125371428571429e-05, "loss": 0.4096, "step": 8660 }, { "epoch": 120.42, "learning_rate": 3.1242285714285716e-05, "loss": 0.3867, "step": 8670 }, { "epoch": 120.55, "learning_rate": 3.123085714285714e-05, "loss": 0.3969, "step": 8680 }, { "epoch": 120.69, "learning_rate": 3.121942857142858e-05, "loss": 0.3923, "step": 8690 }, { "epoch": 120.83, "learning_rate": 3.1208000000000003e-05, "loss": 0.3861, "step": 8700 }, { "epoch": 120.97, "learning_rate": 3.119657142857143e-05, "loss": 0.3882, "step": 8710 }, { "epoch": 121.0, "eval_loss": 0.5262969136238098, "eval_runtime": 129.3775, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.2184225750466028, "step": 8712 }, { "epoch": 121.11, "learning_rate": 3.1185142857142864e-05, "loss": 0.3957, "step": 8720 }, { "epoch": 121.25, "learning_rate": 3.117371428571429e-05, "loss": 0.3844, "step": 8730 }, { "epoch": 121.39, "learning_rate": 3.116228571428572e-05, "loss": 0.3781, "step": 8740 }, { "epoch": 121.53, "learning_rate": 3.1150857142857144e-05, "loss": 0.3992, "step": 8750 }, { "epoch": 121.66, "learning_rate": 3.113942857142858e-05, "loss": 0.3919, "step": 8760 }, { "epoch": 121.8, "learning_rate": 3.1128000000000004e-05, "loss": 0.3821, "step": 8770 }, { "epoch": 121.94, "learning_rate": 3.111657142857143e-05, "loss": 0.3891, "step": 8780 }, { "epoch": 122.0, "eval_loss": 0.5301498174667358, "eval_runtime": 129.7211, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.21938677122838593, "step": 8784 }, { "epoch": 122.08, "learning_rate": 3.110514285714286e-05, "loss": 0.3915, "step": 8790 }, { "epoch": 122.22, "learning_rate": 3.1093714285714284e-05, "loss": 0.388, "step": 8800 }, { "epoch": 122.36, "learning_rate": 3.108228571428572e-05, "loss": 0.3731, "step": 8810 }, { "epoch": 122.5, "learning_rate": 3.1070857142857145e-05, "loss": 0.3819, "step": 8820 }, { "epoch": 122.64, "learning_rate": 3.105942857142858e-05, "loss": 0.4048, "step": 8830 }, { "epoch": 122.78, "learning_rate": 3.1048000000000005e-05, "loss": 0.4049, "step": 8840 }, { "epoch": 122.91, "learning_rate": 3.103657142857143e-05, "loss": 0.3964, "step": 8850 }, { "epoch": 123.0, "eval_loss": 0.5608429908752441, "eval_runtime": 132.6568, "eval_samples_per_second": 4.01, "eval_steps_per_second": 0.505, "eval_wer": 0.22202224079192645, "step": 8856 }, { "epoch": 123.06, "learning_rate": 3.102514285714286e-05, "loss": 0.4022, "step": 8860 }, { "epoch": 123.19, "learning_rate": 3.1013714285714285e-05, "loss": 0.3949, "step": 8870 }, { "epoch": 123.33, "learning_rate": 3.100228571428572e-05, "loss": 0.3946, "step": 8880 }, { "epoch": 123.47, "learning_rate": 3.0990857142857145e-05, "loss": 0.3976, "step": 8890 }, { "epoch": 123.61, "learning_rate": 3.097942857142858e-05, "loss": 0.3962, "step": 8900 }, { "epoch": 123.75, "learning_rate": 3.0968000000000006e-05, "loss": 0.4027, "step": 8910 }, { "epoch": 123.89, "learning_rate": 3.095657142857143e-05, "loss": 0.3918, "step": 8920 }, { "epoch": 124.0, "eval_loss": 0.5232579708099365, "eval_runtime": 129.2294, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.2229864369737096, "step": 8928 }, { "epoch": 124.03, "learning_rate": 3.094514285714286e-05, "loss": 0.4061, "step": 8930 }, { "epoch": 124.17, "learning_rate": 3.0933714285714286e-05, "loss": 0.3948, "step": 8940 }, { "epoch": 124.3, "learning_rate": 3.092228571428572e-05, "loss": 0.3905, "step": 8950 }, { "epoch": 124.44, "learning_rate": 3.0910857142857146e-05, "loss": 0.3864, "step": 8960 }, { "epoch": 124.58, "learning_rate": 3.089942857142857e-05, "loss": 0.3858, "step": 8970 }, { "epoch": 124.72, "learning_rate": 3.0888e-05, "loss": 0.3827, "step": 8980 }, { "epoch": 124.86, "learning_rate": 3.0876571428571426e-05, "loss": 0.385, "step": 8990 }, { "epoch": 125.0, "learning_rate": 3.086514285714286e-05, "loss": 0.3834, "step": 9000 }, { "epoch": 125.0, "eval_loss": 0.5285627245903015, "eval_runtime": 129.5061, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.21945105097383813, "step": 9000 }, { "epoch": 125.14, "learning_rate": 3.085371428571429e-05, "loss": 0.3898, "step": 9010 }, { "epoch": 125.28, "learning_rate": 3.084228571428572e-05, "loss": 0.3929, "step": 9020 }, { "epoch": 125.42, "learning_rate": 3.083085714285715e-05, "loss": 0.3976, "step": 9030 }, { "epoch": 125.55, "learning_rate": 3.0819428571428574e-05, "loss": 0.3856, "step": 9040 }, { "epoch": 125.69, "learning_rate": 3.0808e-05, "loss": 0.3962, "step": 9050 }, { "epoch": 125.83, "learning_rate": 3.079657142857143e-05, "loss": 0.3938, "step": 9060 }, { "epoch": 125.97, "learning_rate": 3.078514285714286e-05, "loss": 0.3952, "step": 9070 }, { "epoch": 126.0, "eval_loss": 0.5409618020057678, "eval_runtime": 131.9369, "eval_samples_per_second": 4.032, "eval_steps_per_second": 0.508, "eval_wer": 0.22575046602815452, "step": 9072 }, { "epoch": 126.11, "learning_rate": 3.077371428571429e-05, "loss": 0.3917, "step": 9080 }, { "epoch": 126.25, "learning_rate": 3.076228571428572e-05, "loss": 0.391, "step": 9090 }, { "epoch": 126.39, "learning_rate": 3.075085714285715e-05, "loss": 0.3744, "step": 9100 }, { "epoch": 126.53, "learning_rate": 3.0739428571428574e-05, "loss": 0.3877, "step": 9110 }, { "epoch": 126.66, "learning_rate": 3.0728e-05, "loss": 0.3894, "step": 9120 }, { "epoch": 126.8, "learning_rate": 3.071657142857143e-05, "loss": 0.3912, "step": 9130 }, { "epoch": 126.94, "learning_rate": 3.070514285714286e-05, "loss": 0.3812, "step": 9140 }, { "epoch": 127.0, "eval_loss": 0.5182816982269287, "eval_runtime": 128.9897, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.2206723661374301, "step": 9144 }, { "epoch": 127.08, "learning_rate": 3.069371428571429e-05, "loss": 0.382, "step": 9150 }, { "epoch": 127.22, "learning_rate": 3.0682285714285715e-05, "loss": 0.3834, "step": 9160 }, { "epoch": 127.36, "learning_rate": 3.067085714285714e-05, "loss": 0.3827, "step": 9170 }, { "epoch": 127.5, "learning_rate": 3.0659428571428575e-05, "loss": 0.3818, "step": 9180 }, { "epoch": 127.64, "learning_rate": 3.0648e-05, "loss": 0.3869, "step": 9190 }, { "epoch": 127.78, "learning_rate": 3.0636571428571436e-05, "loss": 0.3898, "step": 9200 }, { "epoch": 127.91, "learning_rate": 3.062514285714286e-05, "loss": 0.3904, "step": 9210 }, { "epoch": 128.0, "eval_loss": 0.539260983467102, "eval_runtime": 129.1065, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.22440059137365817, "step": 9216 }, { "epoch": 128.06, "learning_rate": 3.061371428571429e-05, "loss": 0.4071, "step": 9220 }, { "epoch": 128.19, "learning_rate": 3.0602285714285716e-05, "loss": 0.3889, "step": 9230 }, { "epoch": 128.33, "learning_rate": 3.059085714285714e-05, "loss": 0.3922, "step": 9240 }, { "epoch": 128.47, "learning_rate": 3.0579428571428576e-05, "loss": 0.3966, "step": 9250 }, { "epoch": 128.61, "learning_rate": 3.0568e-05, "loss": 0.3793, "step": 9260 }, { "epoch": 128.75, "learning_rate": 3.0556571428571436e-05, "loss": 0.3653, "step": 9270 }, { "epoch": 128.89, "learning_rate": 3.054514285714286e-05, "loss": 0.3797, "step": 9280 }, { "epoch": 129.0, "eval_loss": 0.5213383436203003, "eval_runtime": 129.0263, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.22260075850099634, "step": 9288 }, { "epoch": 129.03, "learning_rate": 3.053371428571429e-05, "loss": 0.3943, "step": 9290 }, { "epoch": 129.17, "learning_rate": 3.0522285714285717e-05, "loss": 0.3729, "step": 9300 }, { "epoch": 129.3, "learning_rate": 3.0510857142857143e-05, "loss": 0.3759, "step": 9310 }, { "epoch": 129.44, "learning_rate": 3.0499428571428577e-05, "loss": 0.3698, "step": 9320 }, { "epoch": 129.58, "learning_rate": 3.0488000000000004e-05, "loss": 0.3861, "step": 9330 }, { "epoch": 129.72, "learning_rate": 3.0476571428571434e-05, "loss": 0.3934, "step": 9340 }, { "epoch": 129.86, "learning_rate": 3.046514285714286e-05, "loss": 0.3854, "step": 9350 }, { "epoch": 130.0, "learning_rate": 3.0453714285714287e-05, "loss": 0.3802, "step": 9360 }, { "epoch": 130.0, "eval_loss": 0.5469784140586853, "eval_runtime": 129.2657, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.2207366458828823, "step": 9360 }, { "epoch": 130.14, "learning_rate": 3.0442285714285717e-05, "loss": 0.4048, "step": 9370 }, { "epoch": 130.28, "learning_rate": 3.0430857142857144e-05, "loss": 0.3854, "step": 9380 }, { "epoch": 130.42, "learning_rate": 3.0419428571428574e-05, "loss": 0.3817, "step": 9390 }, { "epoch": 130.55, "learning_rate": 3.0408e-05, "loss": 0.3783, "step": 9400 }, { "epoch": 130.69, "learning_rate": 3.0396571428571434e-05, "loss": 0.3822, "step": 9410 }, { "epoch": 130.83, "learning_rate": 3.038514285714286e-05, "loss": 0.3885, "step": 9420 }, { "epoch": 130.97, "learning_rate": 3.0373714285714288e-05, "loss": 0.4097, "step": 9430 }, { "epoch": 131.0, "eval_loss": 0.5205973982810974, "eval_runtime": 129.5339, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.2254290673008935, "step": 9432 }, { "epoch": 131.11, "learning_rate": 3.0362285714285718e-05, "loss": 0.3955, "step": 9440 }, { "epoch": 131.25, "learning_rate": 3.0350857142857145e-05, "loss": 0.3988, "step": 9450 }, { "epoch": 131.39, "learning_rate": 3.0339428571428575e-05, "loss": 0.3863, "step": 9460 }, { "epoch": 131.53, "learning_rate": 3.0328e-05, "loss": 0.3846, "step": 9470 }, { "epoch": 131.66, "learning_rate": 3.0316571428571432e-05, "loss": 0.3876, "step": 9480 }, { "epoch": 131.8, "learning_rate": 3.030514285714286e-05, "loss": 0.3821, "step": 9490 }, { "epoch": 131.94, "learning_rate": 3.0293714285714285e-05, "loss": 0.3771, "step": 9500 }, { "epoch": 132.0, "eval_loss": 0.5075005292892456, "eval_runtime": 129.3245, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.21822973581024618, "step": 9504 }, { "epoch": 132.08, "learning_rate": 3.028228571428572e-05, "loss": 0.3805, "step": 9510 }, { "epoch": 132.22, "learning_rate": 3.0270857142857146e-05, "loss": 0.3734, "step": 9520 }, { "epoch": 132.36, "learning_rate": 3.0259428571428576e-05, "loss": 0.3864, "step": 9530 }, { "epoch": 132.5, "learning_rate": 3.0248000000000002e-05, "loss": 0.3778, "step": 9540 }, { "epoch": 132.64, "learning_rate": 3.0236571428571433e-05, "loss": 0.3794, "step": 9550 }, { "epoch": 132.78, "learning_rate": 3.022514285714286e-05, "loss": 0.3733, "step": 9560 }, { "epoch": 132.91, "learning_rate": 3.0213714285714286e-05, "loss": 0.3732, "step": 9570 }, { "epoch": 133.0, "eval_loss": 0.5153090357780457, "eval_runtime": 129.0808, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.2254933470463457, "step": 9576 }, { "epoch": 133.06, "learning_rate": 3.0202285714285716e-05, "loss": 0.3936, "step": 9580 }, { "epoch": 133.19, "learning_rate": 3.0190857142857143e-05, "loss": 0.3767, "step": 9590 }, { "epoch": 133.33, "learning_rate": 3.0179428571428576e-05, "loss": 0.3924, "step": 9600 }, { "epoch": 133.47, "learning_rate": 3.0168000000000003e-05, "loss": 0.388, "step": 9610 }, { "epoch": 133.61, "learning_rate": 3.0156571428571433e-05, "loss": 0.3768, "step": 9620 }, { "epoch": 133.75, "learning_rate": 3.014514285714286e-05, "loss": 0.3864, "step": 9630 }, { "epoch": 133.89, "learning_rate": 3.0133714285714287e-05, "loss": 0.3727, "step": 9640 }, { "epoch": 134.0, "eval_loss": 0.5106567740440369, "eval_runtime": 129.2018, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22118660410104776, "step": 9648 }, { "epoch": 134.03, "learning_rate": 3.0122285714285717e-05, "loss": 0.3965, "step": 9650 }, { "epoch": 134.17, "learning_rate": 3.0110857142857144e-05, "loss": 0.3799, "step": 9660 }, { "epoch": 134.3, "learning_rate": 3.0099428571428574e-05, "loss": 0.38, "step": 9670 }, { "epoch": 134.44, "learning_rate": 3.0088e-05, "loss": 0.3974, "step": 9680 }, { "epoch": 134.58, "learning_rate": 3.0076571428571434e-05, "loss": 0.3797, "step": 9690 }, { "epoch": 134.72, "learning_rate": 3.006514285714286e-05, "loss": 0.3784, "step": 9700 }, { "epoch": 134.86, "learning_rate": 3.0053714285714288e-05, "loss": 0.3704, "step": 9710 }, { "epoch": 135.0, "learning_rate": 3.0042285714285718e-05, "loss": 0.3751, "step": 9720 }, { "epoch": 135.0, "eval_loss": 0.5147270560264587, "eval_runtime": 129.7251, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.22587902551905895, "step": 9720 }, { "epoch": 135.14, "learning_rate": 3.0030857142857144e-05, "loss": 0.3805, "step": 9730 }, { "epoch": 135.28, "learning_rate": 3.0019428571428575e-05, "loss": 0.3782, "step": 9740 }, { "epoch": 135.42, "learning_rate": 3.0008e-05, "loss": 0.3729, "step": 9750 }, { "epoch": 135.55, "learning_rate": 2.999657142857143e-05, "loss": 0.3759, "step": 9760 }, { "epoch": 135.69, "learning_rate": 2.9985142857142858e-05, "loss": 0.3962, "step": 9770 }, { "epoch": 135.83, "learning_rate": 2.9973714285714285e-05, "loss": 0.3817, "step": 9780 }, { "epoch": 135.97, "learning_rate": 2.996228571428572e-05, "loss": 0.3858, "step": 9790 }, { "epoch": 136.0, "eval_loss": 0.5519046783447266, "eval_runtime": 129.2221, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.22202224079192645, "step": 9792 }, { "epoch": 136.11, "learning_rate": 2.9950857142857145e-05, "loss": 0.3785, "step": 9800 }, { "epoch": 136.25, "learning_rate": 2.9939428571428575e-05, "loss": 0.3874, "step": 9810 }, { "epoch": 136.39, "learning_rate": 2.9928000000000002e-05, "loss": 0.3771, "step": 9820 }, { "epoch": 136.53, "learning_rate": 2.9916571428571432e-05, "loss": 0.3908, "step": 9830 }, { "epoch": 136.66, "learning_rate": 2.990514285714286e-05, "loss": 0.3795, "step": 9840 }, { "epoch": 136.8, "learning_rate": 2.989371428571429e-05, "loss": 0.3802, "step": 9850 }, { "epoch": 136.94, "learning_rate": 2.9882285714285716e-05, "loss": 0.3889, "step": 9860 }, { "epoch": 137.0, "eval_loss": 0.5606067180633545, "eval_runtime": 129.584, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.22215080028283088, "step": 9864 }, { "epoch": 137.08, "learning_rate": 2.9870857142857143e-05, "loss": 0.4026, "step": 9870 }, { "epoch": 137.22, "learning_rate": 2.9859428571428576e-05, "loss": 0.3835, "step": 9880 }, { "epoch": 137.36, "learning_rate": 2.9848000000000003e-05, "loss": 0.3987, "step": 9890 }, { "epoch": 137.5, "learning_rate": 2.9836571428571433e-05, "loss": 0.3911, "step": 9900 }, { "epoch": 137.64, "learning_rate": 2.982514285714286e-05, "loss": 0.3868, "step": 9910 }, { "epoch": 137.78, "learning_rate": 2.981371428571429e-05, "loss": 0.3858, "step": 9920 }, { "epoch": 137.91, "learning_rate": 2.9802285714285717e-05, "loss": 0.3916, "step": 9930 }, { "epoch": 138.0, "eval_loss": 0.5400940179824829, "eval_runtime": 129.1885, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22517194831908466, "step": 9936 }, { "epoch": 138.06, "learning_rate": 2.9790857142857143e-05, "loss": 0.3902, "step": 9940 }, { "epoch": 138.19, "learning_rate": 2.9779428571428574e-05, "loss": 0.3897, "step": 9950 }, { "epoch": 138.33, "learning_rate": 2.9768e-05, "loss": 0.3885, "step": 9960 }, { "epoch": 138.47, "learning_rate": 2.9756571428571434e-05, "loss": 0.3932, "step": 9970 }, { "epoch": 138.61, "learning_rate": 2.974514285714286e-05, "loss": 0.4025, "step": 9980 }, { "epoch": 138.75, "learning_rate": 2.973371428571429e-05, "loss": 0.3839, "step": 9990 }, { "epoch": 138.89, "learning_rate": 2.9722285714285717e-05, "loss": 0.3775, "step": 10000 }, { "epoch": 139.0, "eval_loss": 0.5393100380897522, "eval_runtime": 129.218, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.519, "eval_wer": 0.22690750144629426, "step": 10008 }, { "epoch": 139.03, "learning_rate": 2.9710857142857144e-05, "loss": 0.4053, "step": 10010 }, { "epoch": 139.17, "learning_rate": 2.9699428571428574e-05, "loss": 0.3904, "step": 10020 }, { "epoch": 139.3, "learning_rate": 2.9688e-05, "loss": 0.3871, "step": 10030 }, { "epoch": 139.44, "learning_rate": 2.967657142857143e-05, "loss": 0.3886, "step": 10040 }, { "epoch": 139.58, "learning_rate": 2.9665142857142858e-05, "loss": 0.3897, "step": 10050 }, { "epoch": 139.72, "learning_rate": 2.965371428571429e-05, "loss": 0.3848, "step": 10060 }, { "epoch": 139.86, "learning_rate": 2.9642285714285718e-05, "loss": 0.3811, "step": 10070 }, { "epoch": 140.0, "learning_rate": 2.9630857142857145e-05, "loss": 0.3963, "step": 10080 }, { "epoch": 140.0, "eval_loss": 0.5504253506660461, "eval_runtime": 129.6868, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.23217844057337533, "step": 10080 }, { "epoch": 140.14, "learning_rate": 2.9619428571428575e-05, "loss": 0.3903, "step": 10090 }, { "epoch": 140.28, "learning_rate": 2.9608000000000002e-05, "loss": 0.3828, "step": 10100 }, { "epoch": 140.42, "learning_rate": 2.9596571428571432e-05, "loss": 0.3839, "step": 10110 }, { "epoch": 140.55, "learning_rate": 2.958514285714286e-05, "loss": 0.3892, "step": 10120 }, { "epoch": 140.69, "learning_rate": 2.957371428571429e-05, "loss": 0.4029, "step": 10130 }, { "epoch": 140.83, "learning_rate": 2.9562285714285716e-05, "loss": 0.3959, "step": 10140 }, { "epoch": 140.97, "learning_rate": 2.9550857142857142e-05, "loss": 0.3941, "step": 10150 }, { "epoch": 141.0, "eval_loss": 0.533815860748291, "eval_runtime": 129.7113, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.517, "eval_wer": 0.23417111268239377, "step": 10152 }, { "epoch": 141.11, "learning_rate": 2.9539428571428576e-05, "loss": 0.3994, "step": 10160 }, { "epoch": 141.25, "learning_rate": 2.9528000000000003e-05, "loss": 0.4001, "step": 10170 }, { "epoch": 141.39, "learning_rate": 2.9516571428571433e-05, "loss": 0.3841, "step": 10180 }, { "epoch": 141.53, "learning_rate": 2.950514285714286e-05, "loss": 0.3971, "step": 10190 }, { "epoch": 141.66, "learning_rate": 2.949371428571429e-05, "loss": 0.3796, "step": 10200 }, { "epoch": 141.8, "learning_rate": 2.9482285714285716e-05, "loss": 0.3852, "step": 10210 }, { "epoch": 141.94, "learning_rate": 2.9470857142857143e-05, "loss": 0.3801, "step": 10220 }, { "epoch": 142.0, "eval_loss": 0.5115429162979126, "eval_runtime": 129.3352, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.22755029890081635, "step": 10224 }, { "epoch": 142.08, "learning_rate": 2.9459428571428573e-05, "loss": 0.3872, "step": 10230 }, { "epoch": 142.22, "learning_rate": 2.9448e-05, "loss": 0.3869, "step": 10240 }, { "epoch": 142.36, "learning_rate": 2.9436571428571433e-05, "loss": 0.3861, "step": 10250 }, { "epoch": 142.5, "learning_rate": 2.942514285714286e-05, "loss": 0.3779, "step": 10260 }, { "epoch": 142.64, "learning_rate": 2.941371428571429e-05, "loss": 0.3686, "step": 10270 }, { "epoch": 142.78, "learning_rate": 2.9402285714285717e-05, "loss": 0.4013, "step": 10280 }, { "epoch": 142.91, "learning_rate": 2.9390857142857144e-05, "loss": 0.3809, "step": 10290 }, { "epoch": 143.0, "eval_loss": 0.49661949276924133, "eval_runtime": 129.5047, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.22607186475541557, "step": 10296 }, { "epoch": 143.06, "learning_rate": 2.9379428571428574e-05, "loss": 0.3952, "step": 10300 }, { "epoch": 143.19, "learning_rate": 2.9368e-05, "loss": 0.3827, "step": 10310 }, { "epoch": 143.33, "learning_rate": 2.935657142857143e-05, "loss": 0.3986, "step": 10320 }, { "epoch": 143.47, "learning_rate": 2.9345142857142858e-05, "loss": 0.3853, "step": 10330 }, { "epoch": 143.61, "learning_rate": 2.933371428571429e-05, "loss": 0.3835, "step": 10340 }, { "epoch": 143.75, "learning_rate": 2.9322285714285718e-05, "loss": 0.3851, "step": 10350 }, { "epoch": 143.89, "learning_rate": 2.9310857142857145e-05, "loss": 0.3751, "step": 10360 }, { "epoch": 144.0, "eval_loss": 0.49101418256759644, "eval_runtime": 129.7315, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.2239506331554927, "step": 10368 }, { "epoch": 144.03, "learning_rate": 2.9299428571428575e-05, "loss": 0.3905, "step": 10370 }, { "epoch": 144.17, "learning_rate": 2.9288e-05, "loss": 0.3841, "step": 10380 }, { "epoch": 144.3, "learning_rate": 2.927657142857143e-05, "loss": 0.3794, "step": 10390 }, { "epoch": 144.44, "learning_rate": 2.926514285714286e-05, "loss": 0.3791, "step": 10400 }, { "epoch": 144.58, "learning_rate": 2.925371428571429e-05, "loss": 0.3921, "step": 10410 }, { "epoch": 144.72, "learning_rate": 2.9242285714285715e-05, "loss": 0.3666, "step": 10420 }, { "epoch": 144.86, "learning_rate": 2.9230857142857142e-05, "loss": 0.376, "step": 10430 }, { "epoch": 145.0, "learning_rate": 2.9219428571428575e-05, "loss": 0.3827, "step": 10440 }, { "epoch": 145.0, "eval_loss": 0.5291417837142944, "eval_runtime": 129.4487, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.22041524715562127, "step": 10440 }, { "epoch": 145.14, "learning_rate": 2.9208000000000002e-05, "loss": 0.3957, "step": 10450 }, { "epoch": 145.28, "learning_rate": 2.9196571428571432e-05, "loss": 0.379, "step": 10460 }, { "epoch": 145.42, "learning_rate": 2.918514285714286e-05, "loss": 0.3743, "step": 10470 }, { "epoch": 145.55, "learning_rate": 2.917371428571429e-05, "loss": 0.3836, "step": 10480 }, { "epoch": 145.69, "learning_rate": 2.9162285714285716e-05, "loss": 0.3727, "step": 10490 }, { "epoch": 145.83, "learning_rate": 2.9150857142857146e-05, "loss": 0.3762, "step": 10500 }, { "epoch": 145.97, "learning_rate": 2.9139428571428573e-05, "loss": 0.384, "step": 10510 }, { "epoch": 146.0, "eval_loss": 0.5701574087142944, "eval_runtime": 130.3352, "eval_samples_per_second": 4.082, "eval_steps_per_second": 0.514, "eval_wer": 0.22780741788262518, "step": 10512 }, { "epoch": 146.11, "learning_rate": 2.9128e-05, "loss": 0.4058, "step": 10520 }, { "epoch": 146.25, "learning_rate": 2.9116571428571433e-05, "loss": 0.3759, "step": 10530 }, { "epoch": 146.39, "learning_rate": 2.910514285714286e-05, "loss": 0.3913, "step": 10540 }, { "epoch": 146.53, "learning_rate": 2.909371428571429e-05, "loss": 0.3887, "step": 10550 }, { "epoch": 146.66, "learning_rate": 2.9082285714285717e-05, "loss": 0.3847, "step": 10560 }, { "epoch": 146.8, "learning_rate": 2.9070857142857147e-05, "loss": 0.3797, "step": 10570 }, { "epoch": 146.94, "learning_rate": 2.9059428571428574e-05, "loss": 0.3728, "step": 10580 }, { "epoch": 147.0, "eval_loss": 0.5339729189872742, "eval_runtime": 128.9709, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.519, "eval_wer": 0.22825737610079064, "step": 10584 }, { "epoch": 147.08, "learning_rate": 2.9048e-05, "loss": 0.4014, "step": 10590 }, { "epoch": 147.22, "learning_rate": 2.903657142857143e-05, "loss": 0.3913, "step": 10600 }, { "epoch": 147.36, "learning_rate": 2.9025142857142857e-05, "loss": 0.3703, "step": 10610 }, { "epoch": 147.5, "learning_rate": 2.901371428571429e-05, "loss": 0.3856, "step": 10620 }, { "epoch": 147.64, "learning_rate": 2.9002285714285718e-05, "loss": 0.3822, "step": 10630 }, { "epoch": 147.78, "learning_rate": 2.8990857142857148e-05, "loss": 0.391, "step": 10640 }, { "epoch": 147.91, "learning_rate": 2.8979428571428574e-05, "loss": 0.3963, "step": 10650 }, { "epoch": 148.0, "eval_loss": 0.5513004064559937, "eval_runtime": 129.078, "eval_samples_per_second": 4.122, "eval_steps_per_second": 0.519, "eval_wer": 0.2286430545735039, "step": 10656 }, { "epoch": 148.06, "learning_rate": 2.8968e-05, "loss": 0.3925, "step": 10660 }, { "epoch": 148.19, "learning_rate": 2.895657142857143e-05, "loss": 0.3751, "step": 10670 }, { "epoch": 148.33, "learning_rate": 2.8945142857142858e-05, "loss": 0.3881, "step": 10680 }, { "epoch": 148.47, "learning_rate": 2.8933714285714288e-05, "loss": 0.3957, "step": 10690 }, { "epoch": 148.61, "learning_rate": 2.8922285714285715e-05, "loss": 0.3788, "step": 10700 }, { "epoch": 148.75, "learning_rate": 2.891085714285715e-05, "loss": 0.3806, "step": 10710 }, { "epoch": 148.89, "learning_rate": 2.8899428571428575e-05, "loss": 0.3802, "step": 10720 }, { "epoch": 149.0, "eval_loss": 0.5423539876937866, "eval_runtime": 129.3032, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2263932634826766, "step": 10728 }, { "epoch": 149.03, "learning_rate": 2.8888000000000002e-05, "loss": 0.3847, "step": 10730 }, { "epoch": 149.17, "learning_rate": 2.8876571428571432e-05, "loss": 0.3733, "step": 10740 }, { "epoch": 149.3, "learning_rate": 2.886514285714286e-05, "loss": 0.3843, "step": 10750 }, { "epoch": 149.44, "learning_rate": 2.885371428571429e-05, "loss": 0.3822, "step": 10760 }, { "epoch": 149.58, "learning_rate": 2.8842285714285716e-05, "loss": 0.3807, "step": 10770 }, { "epoch": 149.72, "learning_rate": 2.8830857142857146e-05, "loss": 0.401, "step": 10780 }, { "epoch": 149.86, "learning_rate": 2.8819428571428573e-05, "loss": 0.3781, "step": 10790 }, { "epoch": 150.0, "learning_rate": 2.8808e-05, "loss": 0.3874, "step": 10800 }, { "epoch": 150.0, "eval_loss": 0.52194744348526, "eval_runtime": 129.4643, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.518, "eval_wer": 0.21996528893745582, "step": 10800 }, { "epoch": 150.14, "learning_rate": 2.8796571428571433e-05, "loss": 0.3824, "step": 10810 }, { "epoch": 150.28, "learning_rate": 2.878514285714286e-05, "loss": 0.3793, "step": 10820 }, { "epoch": 150.42, "learning_rate": 2.877371428571429e-05, "loss": 0.3734, "step": 10830 }, { "epoch": 150.55, "learning_rate": 2.8762285714285716e-05, "loss": 0.376, "step": 10840 }, { "epoch": 150.69, "learning_rate": 2.8750857142857147e-05, "loss": 0.3947, "step": 10850 }, { "epoch": 150.83, "learning_rate": 2.8739428571428573e-05, "loss": 0.3688, "step": 10860 }, { "epoch": 150.97, "learning_rate": 2.8728e-05, "loss": 0.3743, "step": 10870 }, { "epoch": 151.0, "eval_loss": 0.5147446393966675, "eval_runtime": 129.0385, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.21610850421032332, "step": 10872 }, { "epoch": 151.11, "learning_rate": 2.871657142857143e-05, "loss": 0.3869, "step": 10880 }, { "epoch": 151.25, "learning_rate": 2.8705142857142857e-05, "loss": 0.3787, "step": 10890 }, { "epoch": 151.39, "learning_rate": 2.869371428571429e-05, "loss": 0.3873, "step": 10900 }, { "epoch": 151.53, "learning_rate": 2.8682285714285717e-05, "loss": 0.3837, "step": 10910 }, { "epoch": 151.66, "learning_rate": 2.8670857142857147e-05, "loss": 0.381, "step": 10920 }, { "epoch": 151.8, "learning_rate": 2.8659428571428574e-05, "loss": 0.3827, "step": 10930 }, { "epoch": 151.94, "learning_rate": 2.8648e-05, "loss": 0.3931, "step": 10940 }, { "epoch": 152.0, "eval_loss": 0.5318461060523987, "eval_runtime": 128.8958, "eval_samples_per_second": 4.127, "eval_steps_per_second": 0.52, "eval_wer": 0.23243555955518416, "step": 10944 }, { "epoch": 152.08, "learning_rate": 2.863657142857143e-05, "loss": 0.4021, "step": 10950 }, { "epoch": 152.22, "learning_rate": 2.8625142857142858e-05, "loss": 0.3849, "step": 10960 }, { "epoch": 152.36, "learning_rate": 2.8613714285714288e-05, "loss": 0.3639, "step": 10970 }, { "epoch": 152.5, "learning_rate": 2.8602285714285715e-05, "loss": 0.3671, "step": 10980 }, { "epoch": 152.64, "learning_rate": 2.8590857142857148e-05, "loss": 0.362, "step": 10990 }, { "epoch": 152.78, "learning_rate": 2.8579428571428575e-05, "loss": 0.3716, "step": 11000 }, { "epoch": 152.91, "learning_rate": 2.8568e-05, "loss": 0.3755, "step": 11010 }, { "epoch": 153.0, "eval_loss": 0.5456690192222595, "eval_runtime": 129.0236, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.22517194831908466, "step": 11016 }, { "epoch": 153.06, "learning_rate": 2.8556571428571432e-05, "loss": 0.3802, "step": 11020 }, { "epoch": 153.19, "learning_rate": 2.854514285714286e-05, "loss": 0.378, "step": 11030 }, { "epoch": 153.33, "learning_rate": 2.853371428571429e-05, "loss": 0.3843, "step": 11040 }, { "epoch": 153.47, "learning_rate": 2.8522285714285715e-05, "loss": 0.3768, "step": 11050 }, { "epoch": 153.61, "learning_rate": 2.8510857142857145e-05, "loss": 0.3591, "step": 11060 }, { "epoch": 153.75, "learning_rate": 2.8499428571428572e-05, "loss": 0.3673, "step": 11070 }, { "epoch": 153.89, "learning_rate": 2.8488000000000006e-05, "loss": 0.3744, "step": 11080 }, { "epoch": 154.0, "eval_loss": 0.5447834730148315, "eval_runtime": 129.231, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.22600758500996337, "step": 11088 }, { "epoch": 154.03, "learning_rate": 2.8476571428571432e-05, "loss": 0.382, "step": 11090 }, { "epoch": 154.17, "learning_rate": 2.846514285714286e-05, "loss": 0.3706, "step": 11100 }, { "epoch": 154.3, "learning_rate": 2.845371428571429e-05, "loss": 0.3895, "step": 11110 }, { "epoch": 154.44, "learning_rate": 2.8442285714285716e-05, "loss": 0.3812, "step": 11120 }, { "epoch": 154.58, "learning_rate": 2.8430857142857146e-05, "loss": 0.3625, "step": 11130 }, { "epoch": 154.72, "learning_rate": 2.8419428571428573e-05, "loss": 0.3637, "step": 11140 }, { "epoch": 154.86, "learning_rate": 2.8408000000000003e-05, "loss": 0.3674, "step": 11150 }, { "epoch": 155.0, "learning_rate": 2.839657142857143e-05, "loss": 0.3799, "step": 11160 }, { "epoch": 155.0, "eval_loss": 0.5276015400886536, "eval_runtime": 128.8037, "eval_samples_per_second": 4.13, "eval_steps_per_second": 0.52, "eval_wer": 0.21713698013755867, "step": 11160 }, { "epoch": 155.14, "learning_rate": 2.8385142857142857e-05, "loss": 0.3844, "step": 11170 }, { "epoch": 155.28, "learning_rate": 2.837371428571429e-05, "loss": 0.3738, "step": 11180 }, { "epoch": 155.42, "learning_rate": 2.8362285714285717e-05, "loss": 0.3769, "step": 11190 }, { "epoch": 155.55, "learning_rate": 2.8350857142857147e-05, "loss": 0.3652, "step": 11200 }, { "epoch": 155.69, "learning_rate": 2.8339428571428574e-05, "loss": 0.3758, "step": 11210 }, { "epoch": 155.83, "learning_rate": 2.8328000000000004e-05, "loss": 0.3627, "step": 11220 }, { "epoch": 155.97, "learning_rate": 2.831657142857143e-05, "loss": 0.3953, "step": 11230 }, { "epoch": 156.0, "eval_loss": 0.5545970797538757, "eval_runtime": 129.0649, "eval_samples_per_second": 4.122, "eval_steps_per_second": 0.519, "eval_wer": 0.2262647039917722, "step": 11232 }, { "epoch": 156.11, "learning_rate": 2.8305142857142857e-05, "loss": 0.3852, "step": 11240 }, { "epoch": 156.25, "learning_rate": 2.8293714285714288e-05, "loss": 0.3719, "step": 11250 }, { "epoch": 156.39, "learning_rate": 2.8282285714285714e-05, "loss": 0.3759, "step": 11260 }, { "epoch": 156.53, "learning_rate": 2.8270857142857148e-05, "loss": 0.3838, "step": 11270 }, { "epoch": 156.66, "learning_rate": 2.8259428571428575e-05, "loss": 0.3785, "step": 11280 }, { "epoch": 156.8, "learning_rate": 2.8248000000000005e-05, "loss": 0.3672, "step": 11290 }, { "epoch": 156.94, "learning_rate": 2.823657142857143e-05, "loss": 0.3716, "step": 11300 }, { "epoch": 157.0, "eval_loss": 0.5110045671463013, "eval_runtime": 128.9931, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.22459343061001477, "step": 11304 }, { "epoch": 157.08, "learning_rate": 2.8225142857142858e-05, "loss": 0.3941, "step": 11310 }, { "epoch": 157.22, "learning_rate": 2.8213714285714288e-05, "loss": 0.3931, "step": 11320 }, { "epoch": 157.36, "learning_rate": 2.8202285714285715e-05, "loss": 0.376, "step": 11330 }, { "epoch": 157.5, "learning_rate": 2.8190857142857145e-05, "loss": 0.3692, "step": 11340 }, { "epoch": 157.64, "learning_rate": 2.8179428571428572e-05, "loss": 0.3746, "step": 11350 }, { "epoch": 157.78, "learning_rate": 2.8168000000000005e-05, "loss": 0.382, "step": 11360 }, { "epoch": 157.91, "learning_rate": 2.8156571428571432e-05, "loss": 0.3725, "step": 11370 }, { "epoch": 158.0, "eval_loss": 0.5385293364524841, "eval_runtime": 129.2791, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.21932249148293373, "step": 11376 }, { "epoch": 158.06, "learning_rate": 2.814514285714286e-05, "loss": 0.3693, "step": 11380 }, { "epoch": 158.19, "learning_rate": 2.813371428571429e-05, "loss": 0.3577, "step": 11390 }, { "epoch": 158.33, "learning_rate": 2.8122285714285716e-05, "loss": 0.3541, "step": 11400 }, { "epoch": 158.47, "learning_rate": 2.8110857142857146e-05, "loss": 0.3761, "step": 11410 }, { "epoch": 158.61, "learning_rate": 2.8099428571428573e-05, "loss": 0.3812, "step": 11420 }, { "epoch": 158.75, "learning_rate": 2.8088000000000003e-05, "loss": 0.3889, "step": 11430 }, { "epoch": 158.89, "learning_rate": 2.807657142857143e-05, "loss": 0.364, "step": 11440 }, { "epoch": 159.0, "eval_loss": 0.5113765001296997, "eval_runtime": 129.1877, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22157228257376102, "step": 11448 }, { "epoch": 159.03, "learning_rate": 2.8065142857142856e-05, "loss": 0.3812, "step": 11450 }, { "epoch": 159.17, "learning_rate": 2.805371428571429e-05, "loss": 0.3498, "step": 11460 }, { "epoch": 159.3, "learning_rate": 2.8042285714285717e-05, "loss": 0.3551, "step": 11470 }, { "epoch": 159.44, "learning_rate": 2.8030857142857147e-05, "loss": 0.3758, "step": 11480 }, { "epoch": 159.58, "learning_rate": 2.8019428571428573e-05, "loss": 0.3788, "step": 11490 }, { "epoch": 159.72, "learning_rate": 2.8008000000000004e-05, "loss": 0.3738, "step": 11500 }, { "epoch": 159.86, "learning_rate": 2.799657142857143e-05, "loss": 0.3676, "step": 11510 }, { "epoch": 160.0, "learning_rate": 2.7985142857142857e-05, "loss": 0.3666, "step": 11520 }, { "epoch": 160.0, "eval_loss": 0.558375895023346, "eval_runtime": 129.3826, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.2247862698463714, "step": 11520 }, { "epoch": 160.14, "learning_rate": 2.7973714285714287e-05, "loss": 0.3783, "step": 11530 }, { "epoch": 160.28, "learning_rate": 2.7962285714285714e-05, "loss": 0.3676, "step": 11540 }, { "epoch": 160.42, "learning_rate": 2.7950857142857147e-05, "loss": 0.3637, "step": 11550 }, { "epoch": 160.55, "learning_rate": 2.7939428571428574e-05, "loss": 0.3747, "step": 11560 }, { "epoch": 160.69, "learning_rate": 2.7928000000000004e-05, "loss": 0.3698, "step": 11570 }, { "epoch": 160.83, "learning_rate": 2.791657142857143e-05, "loss": 0.3868, "step": 11580 }, { "epoch": 160.97, "learning_rate": 2.7905142857142858e-05, "loss": 0.3797, "step": 11590 }, { "epoch": 161.0, "eval_loss": 0.5313188433647156, "eval_runtime": 128.9946, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.22382207366458828, "step": 11592 }, { "epoch": 161.11, "learning_rate": 2.7893714285714288e-05, "loss": 0.3717, "step": 11600 }, { "epoch": 161.25, "learning_rate": 2.7882285714285715e-05, "loss": 0.3726, "step": 11610 }, { "epoch": 161.39, "learning_rate": 2.7870857142857145e-05, "loss": 0.3648, "step": 11620 }, { "epoch": 161.53, "learning_rate": 2.785942857142857e-05, "loss": 0.3493, "step": 11630 }, { "epoch": 161.66, "learning_rate": 2.7848000000000005e-05, "loss": 0.3511, "step": 11640 }, { "epoch": 161.8, "learning_rate": 2.7836571428571432e-05, "loss": 0.366, "step": 11650 }, { "epoch": 161.94, "learning_rate": 2.782514285714286e-05, "loss": 0.3704, "step": 11660 }, { "epoch": 162.0, "eval_loss": 0.5542490482330322, "eval_runtime": 129.2237, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.228064536864434, "step": 11664 }, { "epoch": 162.08, "learning_rate": 2.781371428571429e-05, "loss": 0.3579, "step": 11670 }, { "epoch": 162.22, "learning_rate": 2.7802285714285715e-05, "loss": 0.3634, "step": 11680 }, { "epoch": 162.36, "learning_rate": 2.7790857142857146e-05, "loss": 0.3674, "step": 11690 }, { "epoch": 162.5, "learning_rate": 2.7779428571428572e-05, "loss": 0.3741, "step": 11700 }, { "epoch": 162.64, "learning_rate": 2.7768000000000002e-05, "loss": 0.3575, "step": 11710 }, { "epoch": 162.78, "learning_rate": 2.775657142857143e-05, "loss": 0.3682, "step": 11720 }, { "epoch": 162.91, "learning_rate": 2.7745142857142863e-05, "loss": 0.362, "step": 11730 }, { "epoch": 163.0, "eval_loss": 0.5674021244049072, "eval_runtime": 133.9513, "eval_samples_per_second": 3.972, "eval_steps_per_second": 0.5, "eval_wer": 0.2240791926463971, "step": 11736 }, { "epoch": 163.06, "learning_rate": 2.773371428571429e-05, "loss": 0.369, "step": 11740 }, { "epoch": 163.19, "learning_rate": 2.7722285714285716e-05, "loss": 0.3634, "step": 11750 }, { "epoch": 163.33, "learning_rate": 2.7710857142857146e-05, "loss": 0.3724, "step": 11760 }, { "epoch": 163.47, "learning_rate": 2.7699428571428573e-05, "loss": 0.3531, "step": 11770 }, { "epoch": 163.61, "learning_rate": 2.7688000000000003e-05, "loss": 0.3537, "step": 11780 }, { "epoch": 163.75, "learning_rate": 2.767657142857143e-05, "loss": 0.3626, "step": 11790 }, { "epoch": 163.89, "learning_rate": 2.766514285714286e-05, "loss": 0.3551, "step": 11800 }, { "epoch": 164.0, "eval_loss": 0.5483812689781189, "eval_runtime": 129.7574, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.22099376486469113, "step": 11808 }, { "epoch": 164.03, "learning_rate": 2.7653714285714287e-05, "loss": 0.3843, "step": 11810 }, { "epoch": 164.17, "learning_rate": 2.7642285714285714e-05, "loss": 0.3549, "step": 11820 }, { "epoch": 164.3, "learning_rate": 2.7630857142857147e-05, "loss": 0.3703, "step": 11830 }, { "epoch": 164.44, "learning_rate": 2.7619428571428574e-05, "loss": 0.3633, "step": 11840 }, { "epoch": 164.58, "learning_rate": 2.7608000000000004e-05, "loss": 0.362, "step": 11850 }, { "epoch": 164.72, "learning_rate": 2.759657142857143e-05, "loss": 0.3638, "step": 11860 }, { "epoch": 164.86, "learning_rate": 2.758514285714286e-05, "loss": 0.3585, "step": 11870 }, { "epoch": 165.0, "learning_rate": 2.7573714285714288e-05, "loss": 0.3765, "step": 11880 }, { "epoch": 165.0, "eval_loss": 0.5380473732948303, "eval_runtime": 131.5659, "eval_samples_per_second": 4.044, "eval_steps_per_second": 0.509, "eval_wer": 0.22523622806453686, "step": 11880 }, { "epoch": 165.14, "learning_rate": 2.7562285714285714e-05, "loss": 0.3623, "step": 11890 }, { "epoch": 165.28, "learning_rate": 2.7550857142857145e-05, "loss": 0.3634, "step": 11900 }, { "epoch": 165.42, "learning_rate": 2.753942857142857e-05, "loss": 0.3657, "step": 11910 }, { "epoch": 165.55, "learning_rate": 2.7528000000000005e-05, "loss": 0.3713, "step": 11920 }, { "epoch": 165.69, "learning_rate": 2.751657142857143e-05, "loss": 0.3744, "step": 11930 }, { "epoch": 165.83, "learning_rate": 2.750514285714286e-05, "loss": 0.3731, "step": 11940 }, { "epoch": 165.97, "learning_rate": 2.749371428571429e-05, "loss": 0.3821, "step": 11950 }, { "epoch": 166.0, "eval_loss": 0.544071614742279, "eval_runtime": 130.2798, "eval_samples_per_second": 4.084, "eval_steps_per_second": 0.514, "eval_wer": 0.22665038246448543, "step": 11952 }, { "epoch": 166.11, "learning_rate": 2.7482285714285715e-05, "loss": 0.3933, "step": 11960 }, { "epoch": 166.25, "learning_rate": 2.7470857142857145e-05, "loss": 0.3795, "step": 11970 }, { "epoch": 166.39, "learning_rate": 2.7459428571428572e-05, "loss": 0.3674, "step": 11980 }, { "epoch": 166.53, "learning_rate": 2.7448000000000002e-05, "loss": 0.3594, "step": 11990 }, { "epoch": 166.66, "learning_rate": 2.743657142857143e-05, "loss": 0.3614, "step": 12000 }, { "epoch": 166.8, "learning_rate": 2.7425142857142862e-05, "loss": 0.3586, "step": 12010 }, { "epoch": 166.94, "learning_rate": 2.741371428571429e-05, "loss": 0.3608, "step": 12020 }, { "epoch": 167.0, "eval_loss": 0.4983361065387726, "eval_runtime": 129.3078, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.21861541428295944, "step": 12024 }, { "epoch": 167.08, "learning_rate": 2.7402285714285716e-05, "loss": 0.3888, "step": 12030 }, { "epoch": 167.22, "learning_rate": 2.7390857142857146e-05, "loss": 0.3657, "step": 12040 }, { "epoch": 167.36, "learning_rate": 2.7379428571428573e-05, "loss": 0.3571, "step": 12050 }, { "epoch": 167.5, "learning_rate": 2.7368000000000003e-05, "loss": 0.3677, "step": 12060 }, { "epoch": 167.64, "learning_rate": 2.735657142857143e-05, "loss": 0.3684, "step": 12070 }, { "epoch": 167.78, "learning_rate": 2.734514285714286e-05, "loss": 0.3683, "step": 12080 }, { "epoch": 167.91, "learning_rate": 2.7333714285714287e-05, "loss": 0.3595, "step": 12090 }, { "epoch": 168.0, "eval_loss": 0.5064969062805176, "eval_runtime": 129.6298, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.21655846242848878, "step": 12096 }, { "epoch": 168.06, "learning_rate": 2.7322285714285713e-05, "loss": 0.3663, "step": 12100 }, { "epoch": 168.19, "learning_rate": 2.7310857142857147e-05, "loss": 0.3642, "step": 12110 }, { "epoch": 168.33, "learning_rate": 2.7299428571428574e-05, "loss": 0.3578, "step": 12120 }, { "epoch": 168.47, "learning_rate": 2.7288000000000004e-05, "loss": 0.3557, "step": 12130 }, { "epoch": 168.61, "learning_rate": 2.727657142857143e-05, "loss": 0.3579, "step": 12140 }, { "epoch": 168.75, "learning_rate": 2.726514285714286e-05, "loss": 0.3556, "step": 12150 }, { "epoch": 168.89, "learning_rate": 2.7253714285714287e-05, "loss": 0.3652, "step": 12160 }, { "epoch": 169.0, "eval_loss": 0.5211083292961121, "eval_runtime": 129.0337, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.2150157485376358, "step": 12168 }, { "epoch": 169.03, "learning_rate": 2.7242285714285714e-05, "loss": 0.3798, "step": 12170 }, { "epoch": 169.17, "learning_rate": 2.7230857142857144e-05, "loss": 0.3585, "step": 12180 }, { "epoch": 169.3, "learning_rate": 2.721942857142857e-05, "loss": 0.3524, "step": 12190 }, { "epoch": 169.44, "learning_rate": 2.7208000000000004e-05, "loss": 0.3595, "step": 12200 }, { "epoch": 169.58, "learning_rate": 2.719657142857143e-05, "loss": 0.3597, "step": 12210 }, { "epoch": 169.72, "learning_rate": 2.718514285714286e-05, "loss": 0.3584, "step": 12220 }, { "epoch": 169.86, "learning_rate": 2.7173714285714288e-05, "loss": 0.3498, "step": 12230 }, { "epoch": 170.0, "learning_rate": 2.7162285714285715e-05, "loss": 0.3635, "step": 12240 }, { "epoch": 170.0, "eval_loss": 0.5341081619262695, "eval_runtime": 129.488, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.21642990293758438, "step": 12240 }, { "epoch": 170.14, "learning_rate": 2.7150857142857145e-05, "loss": 0.3549, "step": 12250 }, { "epoch": 170.28, "learning_rate": 2.7139428571428572e-05, "loss": 0.3565, "step": 12260 }, { "epoch": 170.42, "learning_rate": 2.7128000000000002e-05, "loss": 0.365, "step": 12270 }, { "epoch": 170.55, "learning_rate": 2.711657142857143e-05, "loss": 0.3586, "step": 12280 }, { "epoch": 170.69, "learning_rate": 2.7105142857142862e-05, "loss": 0.3667, "step": 12290 }, { "epoch": 170.83, "learning_rate": 2.709371428571429e-05, "loss": 0.3436, "step": 12300 }, { "epoch": 170.97, "learning_rate": 2.7082285714285716e-05, "loss": 0.3614, "step": 12310 }, { "epoch": 171.0, "eval_loss": 0.5059003233909607, "eval_runtime": 129.1596, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.2182940155556984, "step": 12312 }, { "epoch": 171.11, "learning_rate": 2.7070857142857146e-05, "loss": 0.3474, "step": 12320 }, { "epoch": 171.25, "learning_rate": 2.7059428571428572e-05, "loss": 0.3559, "step": 12330 }, { "epoch": 171.39, "learning_rate": 2.7048000000000003e-05, "loss": 0.3481, "step": 12340 }, { "epoch": 171.53, "learning_rate": 2.703657142857143e-05, "loss": 0.3577, "step": 12350 }, { "epoch": 171.66, "learning_rate": 2.702514285714286e-05, "loss": 0.3635, "step": 12360 }, { "epoch": 171.8, "learning_rate": 2.7013714285714286e-05, "loss": 0.3535, "step": 12370 }, { "epoch": 171.94, "learning_rate": 2.700228571428572e-05, "loss": 0.3522, "step": 12380 }, { "epoch": 172.0, "eval_loss": 0.5530246496200562, "eval_runtime": 129.5383, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.2199010091920036, "step": 12384 }, { "epoch": 172.08, "learning_rate": 2.6990857142857146e-05, "loss": 0.3698, "step": 12390 }, { "epoch": 172.22, "learning_rate": 2.6979428571428573e-05, "loss": 0.354, "step": 12400 }, { "epoch": 172.36, "learning_rate": 2.6968000000000003e-05, "loss": 0.3476, "step": 12410 }, { "epoch": 172.5, "learning_rate": 2.695657142857143e-05, "loss": 0.3474, "step": 12420 }, { "epoch": 172.64, "learning_rate": 2.694514285714286e-05, "loss": 0.351, "step": 12430 }, { "epoch": 172.78, "learning_rate": 2.6933714285714287e-05, "loss": 0.3547, "step": 12440 }, { "epoch": 172.91, "learning_rate": 2.6922285714285717e-05, "loss": 0.3522, "step": 12450 }, { "epoch": 173.0, "eval_loss": 0.5580894351005554, "eval_runtime": 129.6837, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2142443915922093, "step": 12456 }, { "epoch": 173.06, "learning_rate": 2.6910857142857144e-05, "loss": 0.3561, "step": 12460 }, { "epoch": 173.19, "learning_rate": 2.689942857142857e-05, "loss": 0.3555, "step": 12470 }, { "epoch": 173.33, "learning_rate": 2.6888000000000004e-05, "loss": 0.3603, "step": 12480 }, { "epoch": 173.47, "learning_rate": 2.687657142857143e-05, "loss": 0.3617, "step": 12490 }, { "epoch": 173.61, "learning_rate": 2.686514285714286e-05, "loss": 0.355, "step": 12500 }, { "epoch": 173.75, "learning_rate": 2.6853714285714288e-05, "loss": 0.3486, "step": 12510 }, { "epoch": 173.89, "learning_rate": 2.6842285714285718e-05, "loss": 0.3503, "step": 12520 }, { "epoch": 174.0, "eval_loss": 0.5394085049629211, "eval_runtime": 129.5462, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22112232435559556, "step": 12528 }, { "epoch": 174.03, "learning_rate": 2.6830857142857145e-05, "loss": 0.3762, "step": 12530 }, { "epoch": 174.17, "learning_rate": 2.681942857142857e-05, "loss": 0.3481, "step": 12540 }, { "epoch": 174.3, "learning_rate": 2.6808e-05, "loss": 0.3604, "step": 12550 }, { "epoch": 174.44, "learning_rate": 2.6796571428571428e-05, "loss": 0.3595, "step": 12560 }, { "epoch": 174.58, "learning_rate": 2.6785142857142862e-05, "loss": 0.3524, "step": 12570 }, { "epoch": 174.72, "learning_rate": 2.677371428571429e-05, "loss": 0.3609, "step": 12580 }, { "epoch": 174.86, "learning_rate": 2.676228571428572e-05, "loss": 0.3538, "step": 12590 }, { "epoch": 175.0, "learning_rate": 2.6750857142857145e-05, "loss": 0.3583, "step": 12600 }, { "epoch": 175.0, "eval_loss": 0.546040415763855, "eval_runtime": 129.0674, "eval_samples_per_second": 4.122, "eval_steps_per_second": 0.519, "eval_wer": 0.22523622806453686, "step": 12600 }, { "epoch": 175.14, "learning_rate": 2.6739428571428572e-05, "loss": 0.353, "step": 12610 }, { "epoch": 175.28, "learning_rate": 2.6728000000000002e-05, "loss": 0.3613, "step": 12620 }, { "epoch": 175.42, "learning_rate": 2.671657142857143e-05, "loss": 0.355, "step": 12630 }, { "epoch": 175.55, "learning_rate": 2.670514285714286e-05, "loss": 0.3616, "step": 12640 }, { "epoch": 175.69, "learning_rate": 2.6693714285714286e-05, "loss": 0.364, "step": 12650 }, { "epoch": 175.83, "learning_rate": 2.668228571428572e-05, "loss": 0.3559, "step": 12660 }, { "epoch": 175.97, "learning_rate": 2.6670857142857146e-05, "loss": 0.3562, "step": 12670 }, { "epoch": 176.0, "eval_loss": 0.5198766589164734, "eval_runtime": 129.5241, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.2223436395191875, "step": 12672 }, { "epoch": 176.11, "learning_rate": 2.6659428571428573e-05, "loss": 0.3742, "step": 12680 }, { "epoch": 176.25, "learning_rate": 2.6648000000000003e-05, "loss": 0.3538, "step": 12690 }, { "epoch": 176.39, "learning_rate": 2.663657142857143e-05, "loss": 0.3485, "step": 12700 }, { "epoch": 176.53, "learning_rate": 2.662514285714286e-05, "loss": 0.3607, "step": 12710 }, { "epoch": 176.66, "learning_rate": 2.6613714285714287e-05, "loss": 0.3571, "step": 12720 }, { "epoch": 176.8, "learning_rate": 2.6602285714285717e-05, "loss": 0.352, "step": 12730 }, { "epoch": 176.94, "learning_rate": 2.6590857142857144e-05, "loss": 0.351, "step": 12740 }, { "epoch": 177.0, "eval_loss": 0.5247741937637329, "eval_runtime": 129.2086, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.519, "eval_wer": 0.21463007006492255, "step": 12744 }, { "epoch": 177.08, "learning_rate": 2.657942857142857e-05, "loss": 0.3648, "step": 12750 }, { "epoch": 177.22, "learning_rate": 2.6568000000000004e-05, "loss": 0.3553, "step": 12760 }, { "epoch": 177.36, "learning_rate": 2.655657142857143e-05, "loss": 0.3482, "step": 12770 }, { "epoch": 177.5, "learning_rate": 2.654514285714286e-05, "loss": 0.3523, "step": 12780 }, { "epoch": 177.64, "learning_rate": 2.6533714285714287e-05, "loss": 0.3601, "step": 12790 }, { "epoch": 177.78, "learning_rate": 2.6522285714285718e-05, "loss": 0.3681, "step": 12800 }, { "epoch": 177.91, "learning_rate": 2.6510857142857144e-05, "loss": 0.3667, "step": 12810 }, { "epoch": 178.0, "eval_loss": 0.539965033531189, "eval_runtime": 129.5322, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.21687986115574984, "step": 12816 }, { "epoch": 178.06, "learning_rate": 2.649942857142857e-05, "loss": 0.3608, "step": 12820 }, { "epoch": 178.19, "learning_rate": 2.6489142857142856e-05, "loss": 0.3591, "step": 12830 }, { "epoch": 178.33, "learning_rate": 2.647771428571429e-05, "loss": 0.3543, "step": 12840 }, { "epoch": 178.47, "learning_rate": 2.6466285714285717e-05, "loss": 0.3481, "step": 12850 }, { "epoch": 178.61, "learning_rate": 2.6454857142857147e-05, "loss": 0.3388, "step": 12860 }, { "epoch": 178.75, "learning_rate": 2.6443428571428574e-05, "loss": 0.3556, "step": 12870 }, { "epoch": 178.89, "learning_rate": 2.6432000000000004e-05, "loss": 0.3407, "step": 12880 }, { "epoch": 179.0, "eval_loss": 0.5348556041717529, "eval_runtime": 129.5713, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.2094876904287459, "step": 12888 }, { "epoch": 179.03, "learning_rate": 2.642057142857143e-05, "loss": 0.3667, "step": 12890 }, { "epoch": 179.17, "learning_rate": 2.6409142857142857e-05, "loss": 0.3517, "step": 12900 }, { "epoch": 179.3, "learning_rate": 2.6397714285714287e-05, "loss": 0.3544, "step": 12910 }, { "epoch": 179.44, "learning_rate": 2.6386285714285714e-05, "loss": 0.3488, "step": 12920 }, { "epoch": 179.58, "learning_rate": 2.6374857142857148e-05, "loss": 0.3417, "step": 12930 }, { "epoch": 179.72, "learning_rate": 2.6363428571428574e-05, "loss": 0.3521, "step": 12940 }, { "epoch": 179.86, "learning_rate": 2.6352000000000005e-05, "loss": 0.3465, "step": 12950 }, { "epoch": 180.0, "learning_rate": 2.634057142857143e-05, "loss": 0.3563, "step": 12960 }, { "epoch": 180.0, "eval_loss": 0.5258911848068237, "eval_runtime": 129.3927, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.21160892202866877, "step": 12960 }, { "epoch": 180.14, "learning_rate": 2.6329142857142858e-05, "loss": 0.3555, "step": 12970 }, { "epoch": 180.28, "learning_rate": 2.6317714285714288e-05, "loss": 0.3387, "step": 12980 }, { "epoch": 180.42, "learning_rate": 2.6306285714285715e-05, "loss": 0.3509, "step": 12990 }, { "epoch": 180.55, "learning_rate": 2.6294857142857145e-05, "loss": 0.3515, "step": 13000 }, { "epoch": 180.69, "learning_rate": 2.6283428571428572e-05, "loss": 0.3406, "step": 13010 }, { "epoch": 180.83, "learning_rate": 2.6272000000000005e-05, "loss": 0.3488, "step": 13020 }, { "epoch": 180.97, "learning_rate": 2.6260571428571432e-05, "loss": 0.3656, "step": 13030 }, { "epoch": 181.0, "eval_loss": 0.5129957795143127, "eval_runtime": 129.2391, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.21148036253776434, "step": 13032 }, { "epoch": 181.11, "learning_rate": 2.624914285714286e-05, "loss": 0.3499, "step": 13040 }, { "epoch": 181.25, "learning_rate": 2.623771428571429e-05, "loss": 0.3461, "step": 13050 }, { "epoch": 181.39, "learning_rate": 2.6226285714285716e-05, "loss": 0.3454, "step": 13060 }, { "epoch": 181.53, "learning_rate": 2.6214857142857146e-05, "loss": 0.3444, "step": 13070 }, { "epoch": 181.66, "learning_rate": 2.6203428571428573e-05, "loss": 0.3574, "step": 13080 }, { "epoch": 181.8, "learning_rate": 2.6192000000000003e-05, "loss": 0.3494, "step": 13090 }, { "epoch": 181.94, "learning_rate": 2.618057142857143e-05, "loss": 0.3714, "step": 13100 }, { "epoch": 182.0, "eval_loss": 0.5071449279785156, "eval_runtime": 129.5836, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.2151443080285402, "step": 13104 }, { "epoch": 182.08, "learning_rate": 2.6169142857142856e-05, "loss": 0.3503, "step": 13110 }, { "epoch": 182.22, "learning_rate": 2.615771428571429e-05, "loss": 0.3471, "step": 13120 }, { "epoch": 182.36, "learning_rate": 2.6146285714285716e-05, "loss": 0.3385, "step": 13130 }, { "epoch": 182.5, "learning_rate": 2.6134857142857147e-05, "loss": 0.3537, "step": 13140 }, { "epoch": 182.64, "learning_rate": 2.6123428571428573e-05, "loss": 0.3466, "step": 13150 }, { "epoch": 182.78, "learning_rate": 2.6112000000000003e-05, "loss": 0.3536, "step": 13160 }, { "epoch": 182.91, "learning_rate": 2.610057142857143e-05, "loss": 0.3565, "step": 13170 }, { "epoch": 183.0, "eval_loss": 0.5418967604637146, "eval_runtime": 129.0574, "eval_samples_per_second": 4.122, "eval_steps_per_second": 0.519, "eval_wer": 0.22054380664652568, "step": 13176 }, { "epoch": 183.06, "learning_rate": 2.6089142857142857e-05, "loss": 0.3669, "step": 13180 }, { "epoch": 183.19, "learning_rate": 2.6077714285714287e-05, "loss": 0.3616, "step": 13190 }, { "epoch": 183.33, "learning_rate": 2.6066285714285714e-05, "loss": 0.3618, "step": 13200 }, { "epoch": 183.47, "learning_rate": 2.6054857142857147e-05, "loss": 0.35, "step": 13210 }, { "epoch": 183.61, "learning_rate": 2.6043428571428574e-05, "loss": 0.3519, "step": 13220 }, { "epoch": 183.75, "learning_rate": 2.6032000000000004e-05, "loss": 0.3514, "step": 13230 }, { "epoch": 183.89, "learning_rate": 2.602057142857143e-05, "loss": 0.3521, "step": 13240 }, { "epoch": 184.0, "eval_loss": 0.5379987955093384, "eval_runtime": 129.1812, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22504338882818023, "step": 13248 }, { "epoch": 184.03, "learning_rate": 2.6009142857142858e-05, "loss": 0.375, "step": 13250 }, { "epoch": 184.17, "learning_rate": 2.5997714285714288e-05, "loss": 0.3462, "step": 13260 }, { "epoch": 184.3, "learning_rate": 2.5986285714285715e-05, "loss": 0.3608, "step": 13270 }, { "epoch": 184.44, "learning_rate": 2.5974857142857145e-05, "loss": 0.3552, "step": 13280 }, { "epoch": 184.58, "learning_rate": 2.596342857142857e-05, "loss": 0.3642, "step": 13290 }, { "epoch": 184.72, "learning_rate": 2.5952000000000005e-05, "loss": 0.3516, "step": 13300 }, { "epoch": 184.86, "learning_rate": 2.5940571428571432e-05, "loss": 0.3548, "step": 13310 }, { "epoch": 185.0, "learning_rate": 2.592914285714286e-05, "loss": 0.3605, "step": 13320 }, { "epoch": 185.0, "eval_loss": 0.5436675548553467, "eval_runtime": 129.5724, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.2229864369737096, "step": 13320 }, { "epoch": 185.14, "learning_rate": 2.591771428571429e-05, "loss": 0.3611, "step": 13330 }, { "epoch": 185.28, "learning_rate": 2.5906285714285715e-05, "loss": 0.3622, "step": 13340 }, { "epoch": 185.42, "learning_rate": 2.5894857142857145e-05, "loss": 0.362, "step": 13350 }, { "epoch": 185.55, "learning_rate": 2.5883428571428572e-05, "loss": 0.3612, "step": 13360 }, { "epoch": 185.69, "learning_rate": 2.5872000000000002e-05, "loss": 0.365, "step": 13370 }, { "epoch": 185.83, "learning_rate": 2.586057142857143e-05, "loss": 0.3508, "step": 13380 }, { "epoch": 185.97, "learning_rate": 2.5849142857142856e-05, "loss": 0.3508, "step": 13390 }, { "epoch": 186.0, "eval_loss": 0.539088785648346, "eval_runtime": 129.6711, "eval_samples_per_second": 4.103, "eval_steps_per_second": 0.517, "eval_wer": 0.22253647875554414, "step": 13392 }, { "epoch": 186.11, "learning_rate": 2.583771428571429e-05, "loss": 0.3648, "step": 13400 }, { "epoch": 186.25, "learning_rate": 2.5826285714285716e-05, "loss": 0.3693, "step": 13410 }, { "epoch": 186.39, "learning_rate": 2.5814857142857146e-05, "loss": 0.3441, "step": 13420 }, { "epoch": 186.53, "learning_rate": 2.5803428571428573e-05, "loss": 0.3671, "step": 13430 }, { "epoch": 186.66, "learning_rate": 2.5792000000000003e-05, "loss": 0.3591, "step": 13440 }, { "epoch": 186.8, "learning_rate": 2.578057142857143e-05, "loss": 0.3622, "step": 13450 }, { "epoch": 186.94, "learning_rate": 2.576914285714286e-05, "loss": 0.3746, "step": 13460 }, { "epoch": 187.0, "eval_loss": 0.5425940155982971, "eval_runtime": 129.04, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.22735745966445972, "step": 13464 }, { "epoch": 187.08, "learning_rate": 2.5757714285714287e-05, "loss": 0.3672, "step": 13470 }, { "epoch": 187.22, "learning_rate": 2.5746285714285713e-05, "loss": 0.376, "step": 13480 }, { "epoch": 187.36, "learning_rate": 2.5734857142857147e-05, "loss": 0.3522, "step": 13490 }, { "epoch": 187.5, "learning_rate": 2.5723428571428574e-05, "loss": 0.3431, "step": 13500 }, { "epoch": 187.64, "learning_rate": 2.5712000000000004e-05, "loss": 0.3691, "step": 13510 }, { "epoch": 187.78, "learning_rate": 2.570057142857143e-05, "loss": 0.3626, "step": 13520 }, { "epoch": 187.91, "learning_rate": 2.568914285714286e-05, "loss": 0.3478, "step": 13530 }, { "epoch": 188.0, "eval_loss": 0.5824282169342041, "eval_runtime": 129.1908, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.2247219901009192, "step": 13536 }, { "epoch": 188.06, "learning_rate": 2.5677714285714287e-05, "loss": 0.3569, "step": 13540 }, { "epoch": 188.19, "learning_rate": 2.5666285714285714e-05, "loss": 0.3597, "step": 13550 }, { "epoch": 188.33, "learning_rate": 2.5654857142857144e-05, "loss": 0.3554, "step": 13560 }, { "epoch": 188.47, "learning_rate": 2.564342857142857e-05, "loss": 0.3496, "step": 13570 }, { "epoch": 188.61, "learning_rate": 2.5632000000000005e-05, "loss": 0.3382, "step": 13580 }, { "epoch": 188.75, "learning_rate": 2.562057142857143e-05, "loss": 0.3464, "step": 13590 }, { "epoch": 188.89, "learning_rate": 2.560914285714286e-05, "loss": 0.3475, "step": 13600 }, { "epoch": 189.0, "eval_loss": 0.5232582092285156, "eval_runtime": 128.7639, "eval_samples_per_second": 4.132, "eval_steps_per_second": 0.52, "eval_wer": 0.21032332711962462, "step": 13608 }, { "epoch": 189.03, "learning_rate": 2.5597714285714288e-05, "loss": 0.3427, "step": 13610 }, { "epoch": 189.17, "learning_rate": 2.5586285714285715e-05, "loss": 0.3416, "step": 13620 }, { "epoch": 189.3, "learning_rate": 2.5574857142857145e-05, "loss": 0.3515, "step": 13630 }, { "epoch": 189.44, "learning_rate": 2.5563428571428572e-05, "loss": 0.3451, "step": 13640 }, { "epoch": 189.58, "learning_rate": 2.5552000000000002e-05, "loss": 0.3393, "step": 13650 }, { "epoch": 189.72, "learning_rate": 2.554057142857143e-05, "loss": 0.35, "step": 13660 }, { "epoch": 189.86, "learning_rate": 2.5529142857142862e-05, "loss": 0.3397, "step": 13670 }, { "epoch": 190.0, "learning_rate": 2.551771428571429e-05, "loss": 0.3676, "step": 13680 }, { "epoch": 190.0, "eval_loss": 0.5214197635650635, "eval_runtime": 128.9585, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.52, "eval_wer": 0.21218743973773863, "step": 13680 }, { "epoch": 190.14, "learning_rate": 2.5506285714285716e-05, "loss": 0.354, "step": 13690 }, { "epoch": 190.28, "learning_rate": 2.5494857142857146e-05, "loss": 0.3603, "step": 13700 }, { "epoch": 190.42, "learning_rate": 2.5483428571428573e-05, "loss": 0.3488, "step": 13710 }, { "epoch": 190.55, "learning_rate": 2.5472000000000003e-05, "loss": 0.3504, "step": 13720 }, { "epoch": 190.69, "learning_rate": 2.546057142857143e-05, "loss": 0.3608, "step": 13730 }, { "epoch": 190.83, "learning_rate": 2.544914285714286e-05, "loss": 0.3463, "step": 13740 }, { "epoch": 190.97, "learning_rate": 2.5437714285714286e-05, "loss": 0.3579, "step": 13750 }, { "epoch": 191.0, "eval_loss": 0.5267397165298462, "eval_runtime": 130.1751, "eval_samples_per_second": 4.087, "eval_steps_per_second": 0.515, "eval_wer": 0.21238027897409525, "step": 13752 }, { "epoch": 191.11, "learning_rate": 2.5426285714285713e-05, "loss": 0.3558, "step": 13760 }, { "epoch": 191.25, "learning_rate": 2.5414857142857147e-05, "loss": 0.3347, "step": 13770 }, { "epoch": 191.39, "learning_rate": 2.5403428571428573e-05, "loss": 0.3483, "step": 13780 }, { "epoch": 191.53, "learning_rate": 2.5392000000000004e-05, "loss": 0.3568, "step": 13790 }, { "epoch": 191.66, "learning_rate": 2.538057142857143e-05, "loss": 0.3724, "step": 13800 }, { "epoch": 191.8, "learning_rate": 2.536914285714286e-05, "loss": 0.3612, "step": 13810 }, { "epoch": 191.94, "learning_rate": 2.5357714285714287e-05, "loss": 0.3563, "step": 13820 }, { "epoch": 192.0, "eval_loss": 0.5343008041381836, "eval_runtime": 129.5959, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.21321591566497397, "step": 13824 }, { "epoch": 192.08, "learning_rate": 2.5346285714285714e-05, "loss": 0.3582, "step": 13830 }, { "epoch": 192.22, "learning_rate": 2.5334857142857144e-05, "loss": 0.3491, "step": 13840 }, { "epoch": 192.36, "learning_rate": 2.532342857142857e-05, "loss": 0.3318, "step": 13850 }, { "epoch": 192.5, "learning_rate": 2.5312000000000004e-05, "loss": 0.3457, "step": 13860 }, { "epoch": 192.64, "learning_rate": 2.530057142857143e-05, "loss": 0.3481, "step": 13870 }, { "epoch": 192.78, "learning_rate": 2.528914285714286e-05, "loss": 0.3544, "step": 13880 }, { "epoch": 192.91, "learning_rate": 2.5277714285714288e-05, "loss": 0.3531, "step": 13890 }, { "epoch": 193.0, "eval_loss": 0.5204878449440002, "eval_runtime": 129.9473, "eval_samples_per_second": 4.094, "eval_steps_per_second": 0.516, "eval_wer": 0.22047952690107347, "step": 13896 }, { "epoch": 193.06, "learning_rate": 2.5266285714285715e-05, "loss": 0.3516, "step": 13900 }, { "epoch": 193.19, "learning_rate": 2.5254857142857145e-05, "loss": 0.3568, "step": 13910 }, { "epoch": 193.33, "learning_rate": 2.524342857142857e-05, "loss": 0.3629, "step": 13920 }, { "epoch": 193.47, "learning_rate": 2.5232e-05, "loss": 0.3491, "step": 13930 }, { "epoch": 193.61, "learning_rate": 2.522057142857143e-05, "loss": 0.3341, "step": 13940 }, { "epoch": 193.75, "learning_rate": 2.5209142857142862e-05, "loss": 0.3538, "step": 13950 }, { "epoch": 193.89, "learning_rate": 2.519771428571429e-05, "loss": 0.3424, "step": 13960 }, { "epoch": 194.0, "eval_loss": 0.5195679664611816, "eval_runtime": 129.1069, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.21964389021019476, "step": 13968 }, { "epoch": 194.03, "learning_rate": 2.5186285714285715e-05, "loss": 0.3573, "step": 13970 }, { "epoch": 194.17, "learning_rate": 2.5174857142857146e-05, "loss": 0.3536, "step": 13980 }, { "epoch": 194.3, "learning_rate": 2.5163428571428572e-05, "loss": 0.3462, "step": 13990 }, { "epoch": 194.44, "learning_rate": 2.5152000000000002e-05, "loss": 0.3543, "step": 14000 }, { "epoch": 194.58, "learning_rate": 2.514057142857143e-05, "loss": 0.3531, "step": 14010 }, { "epoch": 194.72, "learning_rate": 2.512914285714286e-05, "loss": 0.3487, "step": 14020 }, { "epoch": 194.86, "learning_rate": 2.5117714285714286e-05, "loss": 0.3299, "step": 14030 }, { "epoch": 195.0, "learning_rate": 2.5106285714285713e-05, "loss": 0.3617, "step": 14040 }, { "epoch": 195.0, "eval_loss": 0.5301965475082397, "eval_runtime": 129.3387, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.22221508002828308, "step": 14040 }, { "epoch": 195.14, "learning_rate": 2.5094857142857146e-05, "loss": 0.3513, "step": 14050 }, { "epoch": 195.28, "learning_rate": 2.5083428571428573e-05, "loss": 0.342, "step": 14060 }, { "epoch": 195.42, "learning_rate": 2.5072000000000003e-05, "loss": 0.3432, "step": 14070 }, { "epoch": 195.55, "learning_rate": 2.506057142857143e-05, "loss": 0.3424, "step": 14080 }, { "epoch": 195.69, "learning_rate": 2.504914285714286e-05, "loss": 0.3489, "step": 14090 }, { "epoch": 195.83, "learning_rate": 2.5037714285714287e-05, "loss": 0.3466, "step": 14100 }, { "epoch": 195.97, "learning_rate": 2.5026285714285717e-05, "loss": 0.3461, "step": 14110 }, { "epoch": 196.0, "eval_loss": 0.5365616679191589, "eval_runtime": 128.8739, "eval_samples_per_second": 4.128, "eval_steps_per_second": 0.52, "eval_wer": 0.22041524715562127, "step": 14112 }, { "epoch": 196.11, "learning_rate": 2.5014857142857144e-05, "loss": 0.3596, "step": 14120 }, { "epoch": 196.25, "learning_rate": 2.500342857142857e-05, "loss": 0.3457, "step": 14130 }, { "epoch": 196.39, "learning_rate": 2.4992000000000004e-05, "loss": 0.3452, "step": 14140 }, { "epoch": 196.53, "learning_rate": 2.498057142857143e-05, "loss": 0.344, "step": 14150 }, { "epoch": 196.66, "learning_rate": 2.496914285714286e-05, "loss": 0.3426, "step": 14160 }, { "epoch": 196.8, "learning_rate": 2.4957714285714288e-05, "loss": 0.336, "step": 14170 }, { "epoch": 196.94, "learning_rate": 2.4946285714285718e-05, "loss": 0.3524, "step": 14180 }, { "epoch": 197.0, "eval_loss": 0.5383471846580505, "eval_runtime": 129.0682, "eval_samples_per_second": 4.122, "eval_steps_per_second": 0.519, "eval_wer": 0.22118660410104776, "step": 14184 }, { "epoch": 197.08, "learning_rate": 2.4934857142857144e-05, "loss": 0.366, "step": 14190 }, { "epoch": 197.22, "learning_rate": 2.492342857142857e-05, "loss": 0.3418, "step": 14200 }, { "epoch": 197.36, "learning_rate": 2.4912e-05, "loss": 0.3468, "step": 14210 }, { "epoch": 197.5, "learning_rate": 2.4900571428571428e-05, "loss": 0.3493, "step": 14220 }, { "epoch": 197.64, "learning_rate": 2.488914285714286e-05, "loss": 0.3408, "step": 14230 }, { "epoch": 197.78, "learning_rate": 2.487771428571429e-05, "loss": 0.3471, "step": 14240 }, { "epoch": 197.91, "learning_rate": 2.486628571428572e-05, "loss": 0.3354, "step": 14250 }, { "epoch": 198.0, "eval_loss": 0.5279358625411987, "eval_runtime": 129.4694, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.21655846242848878, "step": 14256 }, { "epoch": 198.06, "learning_rate": 2.4854857142857145e-05, "loss": 0.3574, "step": 14260 }, { "epoch": 198.19, "learning_rate": 2.4843428571428572e-05, "loss": 0.3508, "step": 14270 }, { "epoch": 198.33, "learning_rate": 2.4832000000000002e-05, "loss": 0.3387, "step": 14280 }, { "epoch": 198.47, "learning_rate": 2.482057142857143e-05, "loss": 0.3402, "step": 14290 }, { "epoch": 198.61, "learning_rate": 2.480914285714286e-05, "loss": 0.3294, "step": 14300 }, { "epoch": 198.75, "learning_rate": 2.4797714285714286e-05, "loss": 0.3396, "step": 14310 }, { "epoch": 198.89, "learning_rate": 2.478628571428572e-05, "loss": 0.3501, "step": 14320 }, { "epoch": 199.0, "eval_loss": 0.5234560370445251, "eval_runtime": 129.3721, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.21649418268303658, "step": 14328 }, { "epoch": 199.03, "learning_rate": 2.4774857142857146e-05, "loss": 0.3607, "step": 14330 }, { "epoch": 199.17, "learning_rate": 2.4763428571428573e-05, "loss": 0.3333, "step": 14340 }, { "epoch": 199.3, "learning_rate": 2.4752000000000003e-05, "loss": 0.332, "step": 14350 }, { "epoch": 199.44, "learning_rate": 2.474057142857143e-05, "loss": 0.3408, "step": 14360 }, { "epoch": 199.58, "learning_rate": 2.472914285714286e-05, "loss": 0.3349, "step": 14370 }, { "epoch": 199.72, "learning_rate": 2.4717714285714287e-05, "loss": 0.345, "step": 14380 }, { "epoch": 199.86, "learning_rate": 2.4706285714285717e-05, "loss": 0.3448, "step": 14390 }, { "epoch": 200.0, "learning_rate": 2.4694857142857143e-05, "loss": 0.3384, "step": 14400 }, { "epoch": 200.0, "eval_loss": 0.533034086227417, "eval_runtime": 129.3055, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2152085877739924, "step": 14400 }, { "epoch": 200.14, "learning_rate": 2.468342857142857e-05, "loss": 0.3527, "step": 14410 }, { "epoch": 200.28, "learning_rate": 2.4672000000000004e-05, "loss": 0.3339, "step": 14420 }, { "epoch": 200.42, "learning_rate": 2.466057142857143e-05, "loss": 0.3473, "step": 14430 }, { "epoch": 200.55, "learning_rate": 2.464914285714286e-05, "loss": 0.3513, "step": 14440 }, { "epoch": 200.69, "learning_rate": 2.4637714285714287e-05, "loss": 0.3487, "step": 14450 }, { "epoch": 200.83, "learning_rate": 2.4626285714285717e-05, "loss": 0.3425, "step": 14460 }, { "epoch": 200.97, "learning_rate": 2.4614857142857144e-05, "loss": 0.3565, "step": 14470 }, { "epoch": 201.0, "eval_loss": 0.5262418389320374, "eval_runtime": 129.5672, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.22105804461014333, "step": 14472 }, { "epoch": 201.11, "learning_rate": 2.460342857142857e-05, "loss": 0.3563, "step": 14480 }, { "epoch": 201.25, "learning_rate": 2.4592e-05, "loss": 0.3533, "step": 14490 }, { "epoch": 201.39, "learning_rate": 2.4580571428571428e-05, "loss": 0.3398, "step": 14500 }, { "epoch": 201.53, "learning_rate": 2.456914285714286e-05, "loss": 0.3536, "step": 14510 }, { "epoch": 201.66, "learning_rate": 2.4557714285714288e-05, "loss": 0.3488, "step": 14520 }, { "epoch": 201.8, "learning_rate": 2.4546285714285718e-05, "loss": 0.3443, "step": 14530 }, { "epoch": 201.94, "learning_rate": 2.4534857142857145e-05, "loss": 0.3385, "step": 14540 }, { "epoch": 202.0, "eval_loss": 0.5403549671173096, "eval_runtime": 128.9055, "eval_samples_per_second": 4.127, "eval_steps_per_second": 0.52, "eval_wer": 0.21726553962846307, "step": 14544 }, { "epoch": 202.08, "learning_rate": 2.452342857142857e-05, "loss": 0.3586, "step": 14550 }, { "epoch": 202.22, "learning_rate": 2.4512000000000002e-05, "loss": 0.3641, "step": 14560 }, { "epoch": 202.36, "learning_rate": 2.450057142857143e-05, "loss": 0.3643, "step": 14570 }, { "epoch": 202.5, "learning_rate": 2.448914285714286e-05, "loss": 0.3664, "step": 14580 }, { "epoch": 202.64, "learning_rate": 2.4477714285714285e-05, "loss": 0.3567, "step": 14590 }, { "epoch": 202.78, "learning_rate": 2.446628571428572e-05, "loss": 0.35, "step": 14600 }, { "epoch": 202.91, "learning_rate": 2.4454857142857146e-05, "loss": 0.3533, "step": 14610 }, { "epoch": 203.0, "eval_loss": 0.5465120077133179, "eval_runtime": 129.2949, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22092948511923893, "step": 14616 }, { "epoch": 203.06, "learning_rate": 2.4443428571428572e-05, "loss": 0.3611, "step": 14620 }, { "epoch": 203.19, "learning_rate": 2.4432000000000003e-05, "loss": 0.3584, "step": 14630 }, { "epoch": 203.33, "learning_rate": 2.442057142857143e-05, "loss": 0.3612, "step": 14640 }, { "epoch": 203.47, "learning_rate": 2.440914285714286e-05, "loss": 0.3779, "step": 14650 }, { "epoch": 203.61, "learning_rate": 2.4397714285714286e-05, "loss": 0.3574, "step": 14660 }, { "epoch": 203.75, "learning_rate": 2.4386285714285716e-05, "loss": 0.346, "step": 14670 }, { "epoch": 203.89, "learning_rate": 2.4374857142857143e-05, "loss": 0.3503, "step": 14680 }, { "epoch": 204.0, "eval_loss": 0.524337887763977, "eval_runtime": 129.3279, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2222793597737353, "step": 14688 }, { "epoch": 204.03, "learning_rate": 2.436342857142857e-05, "loss": 0.3544, "step": 14690 }, { "epoch": 204.17, "learning_rate": 2.4352000000000003e-05, "loss": 0.3636, "step": 14700 }, { "epoch": 204.3, "learning_rate": 2.434057142857143e-05, "loss": 0.3526, "step": 14710 }, { "epoch": 204.44, "learning_rate": 2.432914285714286e-05, "loss": 0.3517, "step": 14720 }, { "epoch": 204.58, "learning_rate": 2.4317714285714287e-05, "loss": 0.368, "step": 14730 }, { "epoch": 204.72, "learning_rate": 2.4306285714285717e-05, "loss": 0.3606, "step": 14740 }, { "epoch": 204.86, "learning_rate": 2.4294857142857144e-05, "loss": 0.3362, "step": 14750 }, { "epoch": 205.0, "learning_rate": 2.4283428571428574e-05, "loss": 0.3529, "step": 14760 }, { "epoch": 205.0, "eval_loss": 0.5610824227333069, "eval_runtime": 130.2165, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.22761457864626855, "step": 14760 }, { "epoch": 205.14, "learning_rate": 2.4272e-05, "loss": 0.3503, "step": 14770 }, { "epoch": 205.28, "learning_rate": 2.4260571428571427e-05, "loss": 0.3632, "step": 14780 }, { "epoch": 205.42, "learning_rate": 2.424914285714286e-05, "loss": 0.3398, "step": 14790 }, { "epoch": 205.55, "learning_rate": 2.4237714285714288e-05, "loss": 0.3384, "step": 14800 }, { "epoch": 205.69, "learning_rate": 2.4226285714285718e-05, "loss": 0.3328, "step": 14810 }, { "epoch": 205.83, "learning_rate": 2.4214857142857145e-05, "loss": 0.3504, "step": 14820 }, { "epoch": 205.97, "learning_rate": 2.4203428571428575e-05, "loss": 0.3555, "step": 14830 }, { "epoch": 206.0, "eval_loss": 0.5436542630195618, "eval_runtime": 129.2193, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.22086520537378673, "step": 14832 }, { "epoch": 206.11, "learning_rate": 2.4192e-05, "loss": 0.3506, "step": 14840 }, { "epoch": 206.25, "learning_rate": 2.4180571428571428e-05, "loss": 0.3503, "step": 14850 }, { "epoch": 206.39, "learning_rate": 2.416914285714286e-05, "loss": 0.3541, "step": 14860 }, { "epoch": 206.53, "learning_rate": 2.4157714285714285e-05, "loss": 0.342, "step": 14870 }, { "epoch": 206.66, "learning_rate": 2.414628571428572e-05, "loss": 0.3463, "step": 14880 }, { "epoch": 206.8, "learning_rate": 2.4134857142857145e-05, "loss": 0.356, "step": 14890 }, { "epoch": 206.94, "learning_rate": 2.4123428571428576e-05, "loss": 0.3548, "step": 14900 }, { "epoch": 207.0, "eval_loss": 0.5401390194892883, "eval_runtime": 129.175, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22485054959182363, "step": 14904 }, { "epoch": 207.08, "learning_rate": 2.4112000000000002e-05, "loss": 0.3619, "step": 14910 }, { "epoch": 207.22, "learning_rate": 2.410057142857143e-05, "loss": 0.3402, "step": 14920 }, { "epoch": 207.36, "learning_rate": 2.408914285714286e-05, "loss": 0.3367, "step": 14930 }, { "epoch": 207.5, "learning_rate": 2.4077714285714286e-05, "loss": 0.3465, "step": 14940 }, { "epoch": 207.64, "learning_rate": 2.4066285714285716e-05, "loss": 0.3419, "step": 14950 }, { "epoch": 207.78, "learning_rate": 2.4054857142857143e-05, "loss": 0.3536, "step": 14960 }, { "epoch": 207.91, "learning_rate": 2.4043428571428576e-05, "loss": 0.3417, "step": 14970 }, { "epoch": 208.0, "eval_loss": 0.5643130540847778, "eval_runtime": 129.4829, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.2303786077007135, "step": 14976 }, { "epoch": 208.06, "learning_rate": 2.4032000000000003e-05, "loss": 0.3578, "step": 14980 }, { "epoch": 208.19, "learning_rate": 2.402171428571429e-05, "loss": 0.3498, "step": 14990 }, { "epoch": 208.33, "learning_rate": 2.4010285714285715e-05, "loss": 0.3416, "step": 15000 }, { "epoch": 208.47, "learning_rate": 2.3998857142857145e-05, "loss": 0.337, "step": 15010 }, { "epoch": 208.61, "learning_rate": 2.3987428571428572e-05, "loss": 0.3334, "step": 15020 }, { "epoch": 208.75, "learning_rate": 2.3976000000000002e-05, "loss": 0.3377, "step": 15030 }, { "epoch": 208.89, "learning_rate": 2.396457142857143e-05, "loss": 0.3271, "step": 15040 }, { "epoch": 209.0, "eval_loss": 0.535629153251648, "eval_runtime": 130.0173, "eval_samples_per_second": 4.092, "eval_steps_per_second": 0.515, "eval_wer": 0.2182940155556984, "step": 15048 }, { "epoch": 209.03, "learning_rate": 2.3953142857142856e-05, "loss": 0.3497, "step": 15050 }, { "epoch": 209.17, "learning_rate": 2.394171428571429e-05, "loss": 0.3335, "step": 15060 }, { "epoch": 209.3, "learning_rate": 2.3930285714285716e-05, "loss": 0.3377, "step": 15070 }, { "epoch": 209.44, "learning_rate": 2.3918857142857146e-05, "loss": 0.3502, "step": 15080 }, { "epoch": 209.58, "learning_rate": 2.3907428571428573e-05, "loss": 0.3331, "step": 15090 }, { "epoch": 209.72, "learning_rate": 2.3896000000000003e-05, "loss": 0.3403, "step": 15100 }, { "epoch": 209.86, "learning_rate": 2.388457142857143e-05, "loss": 0.3422, "step": 15110 }, { "epoch": 210.0, "learning_rate": 2.3873142857142856e-05, "loss": 0.344, "step": 15120 }, { "epoch": 210.0, "eval_loss": 0.5299952030181885, "eval_runtime": 129.6097, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.21726553962846307, "step": 15120 }, { "epoch": 210.14, "learning_rate": 2.3861714285714287e-05, "loss": 0.3367, "step": 15130 }, { "epoch": 210.28, "learning_rate": 2.3850285714285713e-05, "loss": 0.3381, "step": 15140 }, { "epoch": 210.42, "learning_rate": 2.3838857142857147e-05, "loss": 0.3461, "step": 15150 }, { "epoch": 210.55, "learning_rate": 2.3827428571428574e-05, "loss": 0.3373, "step": 15160 }, { "epoch": 210.69, "learning_rate": 2.3816000000000004e-05, "loss": 0.333, "step": 15170 }, { "epoch": 210.83, "learning_rate": 2.380457142857143e-05, "loss": 0.3386, "step": 15180 }, { "epoch": 210.97, "learning_rate": 2.3793142857142857e-05, "loss": 0.3416, "step": 15190 }, { "epoch": 211.0, "eval_loss": 0.5343140363693237, "eval_runtime": 128.9741, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.519, "eval_wer": 0.21694414090120204, "step": 15192 }, { "epoch": 211.11, "learning_rate": 2.3781714285714287e-05, "loss": 0.3405, "step": 15200 }, { "epoch": 211.25, "learning_rate": 2.3770285714285714e-05, "loss": 0.3419, "step": 15210 }, { "epoch": 211.39, "learning_rate": 2.3758857142857144e-05, "loss": 0.3341, "step": 15220 }, { "epoch": 211.53, "learning_rate": 2.374742857142857e-05, "loss": 0.3349, "step": 15230 }, { "epoch": 211.66, "learning_rate": 2.3736000000000004e-05, "loss": 0.3392, "step": 15240 }, { "epoch": 211.8, "learning_rate": 2.372457142857143e-05, "loss": 0.3379, "step": 15250 }, { "epoch": 211.94, "learning_rate": 2.371314285714286e-05, "loss": 0.3393, "step": 15260 }, { "epoch": 212.0, "eval_loss": 0.5677480101585388, "eval_runtime": 129.1615, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.22060808639197788, "step": 15264 }, { "epoch": 212.08, "learning_rate": 2.3701714285714288e-05, "loss": 0.3505, "step": 15270 }, { "epoch": 212.22, "learning_rate": 2.3690285714285715e-05, "loss": 0.3373, "step": 15280 }, { "epoch": 212.36, "learning_rate": 2.3678857142857145e-05, "loss": 0.3341, "step": 15290 }, { "epoch": 212.5, "learning_rate": 2.3667428571428572e-05, "loss": 0.3326, "step": 15300 }, { "epoch": 212.64, "learning_rate": 2.3656000000000002e-05, "loss": 0.3328, "step": 15310 }, { "epoch": 212.78, "learning_rate": 2.364457142857143e-05, "loss": 0.3343, "step": 15320 }, { "epoch": 212.91, "learning_rate": 2.3633142857142862e-05, "loss": 0.3356, "step": 15330 }, { "epoch": 213.0, "eval_loss": 0.5514068603515625, "eval_runtime": 129.6214, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.21938677122838593, "step": 15336 }, { "epoch": 213.06, "learning_rate": 2.362171428571429e-05, "loss": 0.3392, "step": 15340 }, { "epoch": 213.19, "learning_rate": 2.3610285714285716e-05, "loss": 0.3413, "step": 15350 }, { "epoch": 213.33, "learning_rate": 2.3598857142857146e-05, "loss": 0.3192, "step": 15360 }, { "epoch": 213.47, "learning_rate": 2.3587428571428573e-05, "loss": 0.346, "step": 15370 }, { "epoch": 213.61, "learning_rate": 2.3576000000000003e-05, "loss": 0.3314, "step": 15380 }, { "epoch": 213.75, "learning_rate": 2.356457142857143e-05, "loss": 0.3331, "step": 15390 }, { "epoch": 213.89, "learning_rate": 2.355314285714286e-05, "loss": 0.3344, "step": 15400 }, { "epoch": 214.0, "eval_loss": 0.5526800751686096, "eval_runtime": 129.2555, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.2198367294465514, "step": 15408 }, { "epoch": 214.03, "learning_rate": 2.3541714285714286e-05, "loss": 0.3358, "step": 15410 }, { "epoch": 214.17, "learning_rate": 2.3530285714285713e-05, "loss": 0.3387, "step": 15420 }, { "epoch": 214.3, "learning_rate": 2.3518857142857147e-05, "loss": 0.3331, "step": 15430 }, { "epoch": 214.44, "learning_rate": 2.3507428571428573e-05, "loss": 0.3334, "step": 15440 }, { "epoch": 214.58, "learning_rate": 2.3496000000000003e-05, "loss": 0.3224, "step": 15450 }, { "epoch": 214.72, "learning_rate": 2.348457142857143e-05, "loss": 0.3383, "step": 15460 }, { "epoch": 214.86, "learning_rate": 2.347314285714286e-05, "loss": 0.3136, "step": 15470 }, { "epoch": 215.0, "learning_rate": 2.3461714285714287e-05, "loss": 0.3303, "step": 15480 }, { "epoch": 215.0, "eval_loss": 0.5589979290962219, "eval_runtime": 129.2737, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.21463007006492255, "step": 15480 }, { "epoch": 215.14, "learning_rate": 2.3450285714285714e-05, "loss": 0.344, "step": 15490 }, { "epoch": 215.28, "learning_rate": 2.3438857142857144e-05, "loss": 0.3363, "step": 15500 }, { "epoch": 215.42, "learning_rate": 2.342742857142857e-05, "loss": 0.3365, "step": 15510 }, { "epoch": 215.55, "learning_rate": 2.3416000000000004e-05, "loss": 0.3372, "step": 15520 }, { "epoch": 215.69, "learning_rate": 2.340457142857143e-05, "loss": 0.3479, "step": 15530 }, { "epoch": 215.83, "learning_rate": 2.339314285714286e-05, "loss": 0.3426, "step": 15540 }, { "epoch": 215.97, "learning_rate": 2.3381714285714288e-05, "loss": 0.3503, "step": 15550 }, { "epoch": 216.0, "eval_loss": 0.568139910697937, "eval_runtime": 129.5977, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.22420775213730154, "step": 15552 }, { "epoch": 216.11, "learning_rate": 2.3370285714285715e-05, "loss": 0.3339, "step": 15560 }, { "epoch": 216.25, "learning_rate": 2.3358857142857145e-05, "loss": 0.3325, "step": 15570 }, { "epoch": 216.39, "learning_rate": 2.334742857142857e-05, "loss": 0.3271, "step": 15580 }, { "epoch": 216.53, "learning_rate": 2.3336e-05, "loss": 0.3272, "step": 15590 }, { "epoch": 216.66, "learning_rate": 2.3324571428571428e-05, "loss": 0.3262, "step": 15600 }, { "epoch": 216.8, "learning_rate": 2.3313142857142862e-05, "loss": 0.3283, "step": 15610 }, { "epoch": 216.94, "learning_rate": 2.330171428571429e-05, "loss": 0.339, "step": 15620 }, { "epoch": 217.0, "eval_loss": 0.5318368077278137, "eval_runtime": 129.2557, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.21861541428295944, "step": 15624 }, { "epoch": 217.08, "learning_rate": 2.3290285714285715e-05, "loss": 0.3409, "step": 15630 }, { "epoch": 217.22, "learning_rate": 2.3278857142857145e-05, "loss": 0.3385, "step": 15640 }, { "epoch": 217.36, "learning_rate": 2.3267428571428572e-05, "loss": 0.318, "step": 15650 }, { "epoch": 217.5, "learning_rate": 2.3256000000000002e-05, "loss": 0.3158, "step": 15660 }, { "epoch": 217.64, "learning_rate": 2.324457142857143e-05, "loss": 0.3237, "step": 15670 }, { "epoch": 217.78, "learning_rate": 2.323314285714286e-05, "loss": 0.3356, "step": 15680 }, { "epoch": 217.91, "learning_rate": 2.3221714285714286e-05, "loss": 0.3361, "step": 15690 }, { "epoch": 218.0, "eval_loss": 0.5368818640708923, "eval_runtime": 129.5744, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.224657710355467, "step": 15696 }, { "epoch": 218.06, "learning_rate": 2.3210285714285713e-05, "loss": 0.3501, "step": 15700 }, { "epoch": 218.19, "learning_rate": 2.3198857142857146e-05, "loss": 0.3353, "step": 15710 }, { "epoch": 218.33, "learning_rate": 2.3187428571428573e-05, "loss": 0.3206, "step": 15720 }, { "epoch": 218.47, "learning_rate": 2.3176000000000003e-05, "loss": 0.3416, "step": 15730 }, { "epoch": 218.61, "learning_rate": 2.316457142857143e-05, "loss": 0.3282, "step": 15740 }, { "epoch": 218.75, "learning_rate": 2.315314285714286e-05, "loss": 0.3429, "step": 15750 }, { "epoch": 218.89, "learning_rate": 2.3141714285714287e-05, "loss": 0.334, "step": 15760 }, { "epoch": 219.0, "eval_loss": 0.5172927975654602, "eval_runtime": 129.7687, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.2152085877739924, "step": 15768 }, { "epoch": 219.03, "learning_rate": 2.3130285714285713e-05, "loss": 0.3343, "step": 15770 }, { "epoch": 219.17, "learning_rate": 2.3118857142857144e-05, "loss": 0.3326, "step": 15780 }, { "epoch": 219.3, "learning_rate": 2.310742857142857e-05, "loss": 0.3321, "step": 15790 }, { "epoch": 219.44, "learning_rate": 2.3096000000000004e-05, "loss": 0.3318, "step": 15800 }, { "epoch": 219.58, "learning_rate": 2.308457142857143e-05, "loss": 0.3129, "step": 15810 }, { "epoch": 219.72, "learning_rate": 2.307314285714286e-05, "loss": 0.3343, "step": 15820 }, { "epoch": 219.86, "learning_rate": 2.3061714285714287e-05, "loss": 0.3214, "step": 15830 }, { "epoch": 220.0, "learning_rate": 2.3050285714285718e-05, "loss": 0.3222, "step": 15840 }, { "epoch": 220.0, "eval_loss": 0.5965456962585449, "eval_runtime": 130.7121, "eval_samples_per_second": 4.07, "eval_steps_per_second": 0.513, "eval_wer": 0.22356495468277945, "step": 15840 }, { "epoch": 220.14, "learning_rate": 2.3038857142857144e-05, "loss": 0.3383, "step": 15850 }, { "epoch": 220.28, "learning_rate": 2.302742857142857e-05, "loss": 0.346, "step": 15860 }, { "epoch": 220.42, "learning_rate": 2.3016e-05, "loss": 0.3248, "step": 15870 }, { "epoch": 220.55, "learning_rate": 2.3004571428571428e-05, "loss": 0.3175, "step": 15880 }, { "epoch": 220.69, "learning_rate": 2.299314285714286e-05, "loss": 0.3256, "step": 15890 }, { "epoch": 220.83, "learning_rate": 2.2981714285714288e-05, "loss": 0.3393, "step": 15900 }, { "epoch": 220.97, "learning_rate": 2.297028571428572e-05, "loss": 0.3247, "step": 15910 }, { "epoch": 221.0, "eval_loss": 0.5543392300605774, "eval_runtime": 129.5382, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.21649418268303658, "step": 15912 }, { "epoch": 221.11, "learning_rate": 2.2958857142857145e-05, "loss": 0.3287, "step": 15920 }, { "epoch": 221.25, "learning_rate": 2.2947428571428572e-05, "loss": 0.3202, "step": 15930 }, { "epoch": 221.39, "learning_rate": 2.2936000000000002e-05, "loss": 0.3172, "step": 15940 }, { "epoch": 221.53, "learning_rate": 2.292457142857143e-05, "loss": 0.327, "step": 15950 }, { "epoch": 221.66, "learning_rate": 2.291314285714286e-05, "loss": 0.3281, "step": 15960 }, { "epoch": 221.8, "learning_rate": 2.2901714285714286e-05, "loss": 0.3207, "step": 15970 }, { "epoch": 221.94, "learning_rate": 2.289028571428572e-05, "loss": 0.338, "step": 15980 }, { "epoch": 222.0, "eval_loss": 0.5835712552070618, "eval_runtime": 129.2189, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.21777977759208073, "step": 15984 }, { "epoch": 222.08, "learning_rate": 2.2878857142857146e-05, "loss": 0.3344, "step": 15990 }, { "epoch": 222.22, "learning_rate": 2.2867428571428573e-05, "loss": 0.3294, "step": 16000 }, { "epoch": 222.36, "learning_rate": 2.2856000000000003e-05, "loss": 0.3198, "step": 16010 }, { "epoch": 222.5, "learning_rate": 2.284457142857143e-05, "loss": 0.3121, "step": 16020 }, { "epoch": 222.64, "learning_rate": 2.283314285714286e-05, "loss": 0.3248, "step": 16030 }, { "epoch": 222.78, "learning_rate": 2.2821714285714286e-05, "loss": 0.3261, "step": 16040 }, { "epoch": 222.91, "learning_rate": 2.2810285714285717e-05, "loss": 0.3112, "step": 16050 }, { "epoch": 223.0, "eval_loss": 0.5572813153266907, "eval_runtime": 128.9396, "eval_samples_per_second": 4.126, "eval_steps_per_second": 0.52, "eval_wer": 0.21707270039210644, "step": 16056 }, { "epoch": 223.06, "learning_rate": 2.2798857142857143e-05, "loss": 0.3344, "step": 16060 }, { "epoch": 223.19, "learning_rate": 2.278742857142857e-05, "loss": 0.3201, "step": 16070 }, { "epoch": 223.33, "learning_rate": 2.2776000000000004e-05, "loss": 0.3147, "step": 16080 }, { "epoch": 223.47, "learning_rate": 2.276457142857143e-05, "loss": 0.3309, "step": 16090 }, { "epoch": 223.61, "learning_rate": 2.275314285714286e-05, "loss": 0.3119, "step": 16100 }, { "epoch": 223.75, "learning_rate": 2.2741714285714287e-05, "loss": 0.314, "step": 16110 }, { "epoch": 223.89, "learning_rate": 2.2730285714285717e-05, "loss": 0.3203, "step": 16120 }, { "epoch": 224.0, "eval_loss": 0.5829967260360718, "eval_runtime": 129.121, "eval_samples_per_second": 4.12, "eval_steps_per_second": 0.519, "eval_wer": 0.21964389021019476, "step": 16128 }, { "epoch": 224.03, "learning_rate": 2.2718857142857144e-05, "loss": 0.3438, "step": 16130 }, { "epoch": 224.17, "learning_rate": 2.270742857142857e-05, "loss": 0.3377, "step": 16140 }, { "epoch": 224.3, "learning_rate": 2.2696e-05, "loss": 0.3212, "step": 16150 }, { "epoch": 224.44, "learning_rate": 2.2684571428571428e-05, "loss": 0.3266, "step": 16160 }, { "epoch": 224.58, "learning_rate": 2.267314285714286e-05, "loss": 0.3383, "step": 16170 }, { "epoch": 224.72, "learning_rate": 2.2662857142857147e-05, "loss": 0.3373, "step": 16180 }, { "epoch": 224.86, "learning_rate": 2.2651428571428573e-05, "loss": 0.3257, "step": 16190 }, { "epoch": 225.0, "learning_rate": 2.264e-05, "loss": 0.3294, "step": 16200 }, { "epoch": 225.0, "eval_loss": 0.5814815759658813, "eval_runtime": 129.3549, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.2197724497010992, "step": 16200 }, { "epoch": 225.14, "learning_rate": 2.262857142857143e-05, "loss": 0.336, "step": 16210 }, { "epoch": 225.28, "learning_rate": 2.2617142857142857e-05, "loss": 0.3256, "step": 16220 }, { "epoch": 225.42, "learning_rate": 2.2605714285714287e-05, "loss": 0.3208, "step": 16230 }, { "epoch": 225.55, "learning_rate": 2.2594285714285714e-05, "loss": 0.3336, "step": 16240 }, { "epoch": 225.69, "learning_rate": 2.2582857142857147e-05, "loss": 0.3394, "step": 16250 }, { "epoch": 225.83, "learning_rate": 2.2571428571428574e-05, "loss": 0.3205, "step": 16260 }, { "epoch": 225.97, "learning_rate": 2.256e-05, "loss": 0.3392, "step": 16270 }, { "epoch": 226.0, "eval_loss": 0.5641466379165649, "eval_runtime": 128.7079, "eval_samples_per_second": 4.133, "eval_steps_per_second": 0.521, "eval_wer": 0.21630134344667995, "step": 16272 }, { "epoch": 226.11, "learning_rate": 2.254857142857143e-05, "loss": 0.3254, "step": 16280 }, { "epoch": 226.25, "learning_rate": 2.2537142857142858e-05, "loss": 0.3258, "step": 16290 }, { "epoch": 226.39, "learning_rate": 2.2525714285714288e-05, "loss": 0.3293, "step": 16300 }, { "epoch": 226.53, "learning_rate": 2.2514285714285715e-05, "loss": 0.3379, "step": 16310 }, { "epoch": 226.66, "learning_rate": 2.2502857142857145e-05, "loss": 0.3238, "step": 16320 }, { "epoch": 226.8, "learning_rate": 2.249142857142857e-05, "loss": 0.3184, "step": 16330 }, { "epoch": 226.94, "learning_rate": 2.2480000000000005e-05, "loss": 0.3332, "step": 16340 }, { "epoch": 227.0, "eval_loss": 0.5769838690757751, "eval_runtime": 129.3799, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.22035096741016905, "step": 16344 }, { "epoch": 227.08, "learning_rate": 2.2468571428571432e-05, "loss": 0.3314, "step": 16350 }, { "epoch": 227.22, "learning_rate": 2.245714285714286e-05, "loss": 0.3319, "step": 16360 }, { "epoch": 227.36, "learning_rate": 2.244571428571429e-05, "loss": 0.3368, "step": 16370 }, { "epoch": 227.5, "learning_rate": 2.2434285714285715e-05, "loss": 0.3307, "step": 16380 }, { "epoch": 227.64, "learning_rate": 2.2422857142857145e-05, "loss": 0.3364, "step": 16390 }, { "epoch": 227.78, "learning_rate": 2.2411428571428572e-05, "loss": 0.3237, "step": 16400 }, { "epoch": 227.91, "learning_rate": 2.2400000000000002e-05, "loss": 0.3365, "step": 16410 }, { "epoch": 228.0, "eval_loss": 0.5843015909194946, "eval_runtime": 129.6291, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.21810117631934178, "step": 16416 }, { "epoch": 228.06, "learning_rate": 2.238857142857143e-05, "loss": 0.3311, "step": 16420 }, { "epoch": 228.19, "learning_rate": 2.2377142857142856e-05, "loss": 0.3274, "step": 16430 }, { "epoch": 228.33, "learning_rate": 2.236571428571429e-05, "loss": 0.3255, "step": 16440 }, { "epoch": 228.47, "learning_rate": 2.2354285714285716e-05, "loss": 0.3316, "step": 16450 }, { "epoch": 228.61, "learning_rate": 2.2342857142857146e-05, "loss": 0.3227, "step": 16460 }, { "epoch": 228.75, "learning_rate": 2.2331428571428573e-05, "loss": 0.3321, "step": 16470 }, { "epoch": 228.89, "learning_rate": 2.2320000000000003e-05, "loss": 0.3186, "step": 16480 }, { "epoch": 229.0, "eval_loss": 0.5834778547286987, "eval_runtime": 128.9834, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.519, "eval_wer": 0.223114996464614, "step": 16488 }, { "epoch": 229.03, "learning_rate": 2.230857142857143e-05, "loss": 0.3454, "step": 16490 }, { "epoch": 229.17, "learning_rate": 2.2297142857142857e-05, "loss": 0.334, "step": 16500 }, { "epoch": 229.3, "learning_rate": 2.2285714285714287e-05, "loss": 0.3173, "step": 16510 }, { "epoch": 229.44, "learning_rate": 2.2274285714285714e-05, "loss": 0.3296, "step": 16520 }, { "epoch": 229.58, "learning_rate": 2.2262857142857147e-05, "loss": 0.3286, "step": 16530 }, { "epoch": 229.72, "learning_rate": 2.2251428571428574e-05, "loss": 0.3312, "step": 16540 }, { "epoch": 229.86, "learning_rate": 2.2240000000000004e-05, "loss": 0.3171, "step": 16550 }, { "epoch": 230.0, "learning_rate": 2.222857142857143e-05, "loss": 0.3329, "step": 16560 }, { "epoch": 230.0, "eval_loss": 0.5866855382919312, "eval_runtime": 129.7754, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.22195796104647425, "step": 16560 }, { "epoch": 230.14, "learning_rate": 2.2217142857142857e-05, "loss": 0.3359, "step": 16570 }, { "epoch": 230.28, "learning_rate": 2.2205714285714288e-05, "loss": 0.3343, "step": 16580 }, { "epoch": 230.42, "learning_rate": 2.2194285714285714e-05, "loss": 0.3325, "step": 16590 }, { "epoch": 230.55, "learning_rate": 2.2182857142857144e-05, "loss": 0.3149, "step": 16600 }, { "epoch": 230.69, "learning_rate": 2.217142857142857e-05, "loss": 0.3283, "step": 16610 }, { "epoch": 230.83, "learning_rate": 2.2160000000000005e-05, "loss": 0.3324, "step": 16620 }, { "epoch": 230.97, "learning_rate": 2.214857142857143e-05, "loss": 0.3257, "step": 16630 }, { "epoch": 231.0, "eval_loss": 0.6080511808395386, "eval_runtime": 129.1549, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.21964389021019476, "step": 16632 }, { "epoch": 231.11, "learning_rate": 2.2137142857142858e-05, "loss": 0.3295, "step": 16640 }, { "epoch": 231.25, "learning_rate": 2.2125714285714288e-05, "loss": 0.3187, "step": 16650 }, { "epoch": 231.39, "learning_rate": 2.2114285714285715e-05, "loss": 0.3288, "step": 16660 }, { "epoch": 231.53, "learning_rate": 2.2102857142857145e-05, "loss": 0.3208, "step": 16670 }, { "epoch": 231.66, "learning_rate": 2.2091428571428572e-05, "loss": 0.3238, "step": 16680 }, { "epoch": 231.8, "learning_rate": 2.2080000000000002e-05, "loss": 0.3262, "step": 16690 }, { "epoch": 231.94, "learning_rate": 2.206857142857143e-05, "loss": 0.3183, "step": 16700 }, { "epoch": 232.0, "eval_loss": 0.5943585634231567, "eval_runtime": 129.4071, "eval_samples_per_second": 4.111, "eval_steps_per_second": 0.518, "eval_wer": 0.22195796104647425, "step": 16704 }, { "epoch": 232.08, "learning_rate": 2.2057142857142856e-05, "loss": 0.3252, "step": 16710 }, { "epoch": 232.22, "learning_rate": 2.204571428571429e-05, "loss": 0.3304, "step": 16720 }, { "epoch": 232.36, "learning_rate": 2.2034285714285716e-05, "loss": 0.3201, "step": 16730 }, { "epoch": 232.5, "learning_rate": 2.2022857142857146e-05, "loss": 0.322, "step": 16740 }, { "epoch": 232.64, "learning_rate": 2.2011428571428573e-05, "loss": 0.3144, "step": 16750 }, { "epoch": 232.78, "learning_rate": 2.2000000000000003e-05, "loss": 0.3187, "step": 16760 }, { "epoch": 232.91, "learning_rate": 2.198857142857143e-05, "loss": 0.3315, "step": 16770 }, { "epoch": 233.0, "eval_loss": 0.606001079082489, "eval_runtime": 129.3157, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.22215080028283088, "step": 16776 }, { "epoch": 233.06, "learning_rate": 2.1977142857142856e-05, "loss": 0.3312, "step": 16780 }, { "epoch": 233.19, "learning_rate": 2.1965714285714286e-05, "loss": 0.329, "step": 16790 }, { "epoch": 233.33, "learning_rate": 2.1954285714285713e-05, "loss": 0.3268, "step": 16800 }, { "epoch": 233.47, "learning_rate": 2.1942857142857147e-05, "loss": 0.3224, "step": 16810 }, { "epoch": 233.61, "learning_rate": 2.1931428571428573e-05, "loss": 0.323, "step": 16820 }, { "epoch": 233.75, "learning_rate": 2.1920000000000004e-05, "loss": 0.3256, "step": 16830 }, { "epoch": 233.89, "learning_rate": 2.190857142857143e-05, "loss": 0.3269, "step": 16840 }, { "epoch": 234.0, "eval_loss": 0.6267737746238708, "eval_runtime": 129.7959, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.22600758500996337, "step": 16848 }, { "epoch": 234.03, "learning_rate": 2.1897142857142857e-05, "loss": 0.3314, "step": 16850 }, { "epoch": 234.17, "learning_rate": 2.1885714285714287e-05, "loss": 0.3395, "step": 16860 }, { "epoch": 234.3, "learning_rate": 2.1874285714285714e-05, "loss": 0.323, "step": 16870 }, { "epoch": 234.44, "learning_rate": 2.1862857142857144e-05, "loss": 0.3153, "step": 16880 }, { "epoch": 234.58, "learning_rate": 2.185142857142857e-05, "loss": 0.3213, "step": 16890 }, { "epoch": 234.72, "learning_rate": 2.1840000000000004e-05, "loss": 0.3188, "step": 16900 }, { "epoch": 234.86, "learning_rate": 2.182857142857143e-05, "loss": 0.3187, "step": 16910 }, { "epoch": 235.0, "learning_rate": 2.1817142857142858e-05, "loss": 0.3191, "step": 16920 }, { "epoch": 235.0, "eval_loss": 0.5795890688896179, "eval_runtime": 129.0797, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.2182940155556984, "step": 16920 }, { "epoch": 235.14, "learning_rate": 2.1805714285714288e-05, "loss": 0.3296, "step": 16930 }, { "epoch": 235.28, "learning_rate": 2.1794285714285715e-05, "loss": 0.3164, "step": 16940 }, { "epoch": 235.42, "learning_rate": 2.1782857142857145e-05, "loss": 0.3163, "step": 16950 }, { "epoch": 235.55, "learning_rate": 2.177142857142857e-05, "loss": 0.3181, "step": 16960 }, { "epoch": 235.69, "learning_rate": 2.1760000000000002e-05, "loss": 0.321, "step": 16970 }, { "epoch": 235.83, "learning_rate": 2.174857142857143e-05, "loss": 0.3231, "step": 16980 }, { "epoch": 235.97, "learning_rate": 2.1737142857142862e-05, "loss": 0.3395, "step": 16990 }, { "epoch": 236.0, "eval_loss": 0.6139715909957886, "eval_runtime": 129.4808, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.22568618628270232, "step": 16992 }, { "epoch": 236.11, "learning_rate": 2.172571428571429e-05, "loss": 0.3186, "step": 17000 }, { "epoch": 236.25, "learning_rate": 2.1714285714285715e-05, "loss": 0.3284, "step": 17010 }, { "epoch": 236.39, "learning_rate": 2.1702857142857146e-05, "loss": 0.3185, "step": 17020 }, { "epoch": 236.53, "learning_rate": 2.1691428571428572e-05, "loss": 0.3247, "step": 17030 }, { "epoch": 236.66, "learning_rate": 2.1680000000000002e-05, "loss": 0.3256, "step": 17040 }, { "epoch": 236.8, "learning_rate": 2.166857142857143e-05, "loss": 0.3175, "step": 17050 }, { "epoch": 236.94, "learning_rate": 2.165714285714286e-05, "loss": 0.3186, "step": 17060 }, { "epoch": 237.0, "eval_loss": 0.630214273929596, "eval_runtime": 129.6671, "eval_samples_per_second": 4.103, "eval_steps_per_second": 0.517, "eval_wer": 0.22774313813717298, "step": 17064 }, { "epoch": 237.08, "learning_rate": 2.1645714285714286e-05, "loss": 0.3204, "step": 17070 }, { "epoch": 237.22, "learning_rate": 2.1634285714285713e-05, "loss": 0.3224, "step": 17080 }, { "epoch": 237.36, "learning_rate": 2.1622857142857146e-05, "loss": 0.3254, "step": 17090 }, { "epoch": 237.5, "learning_rate": 2.1611428571428573e-05, "loss": 0.3158, "step": 17100 }, { "epoch": 237.64, "learning_rate": 2.1600000000000003e-05, "loss": 0.3211, "step": 17110 }, { "epoch": 237.78, "learning_rate": 2.158857142857143e-05, "loss": 0.3153, "step": 17120 }, { "epoch": 237.91, "learning_rate": 2.157714285714286e-05, "loss": 0.3264, "step": 17130 }, { "epoch": 238.0, "eval_loss": 0.575238049030304, "eval_runtime": 128.7771, "eval_samples_per_second": 4.131, "eval_steps_per_second": 0.52, "eval_wer": 0.21938677122838593, "step": 17136 }, { "epoch": 238.06, "learning_rate": 2.1565714285714287e-05, "loss": 0.3249, "step": 17140 }, { "epoch": 238.19, "learning_rate": 2.1554285714285714e-05, "loss": 0.3083, "step": 17150 }, { "epoch": 238.33, "learning_rate": 2.1542857142857144e-05, "loss": 0.303, "step": 17160 }, { "epoch": 238.47, "learning_rate": 2.153142857142857e-05, "loss": 0.3232, "step": 17170 }, { "epoch": 238.61, "learning_rate": 2.1520000000000004e-05, "loss": 0.3127, "step": 17180 }, { "epoch": 238.75, "learning_rate": 2.150857142857143e-05, "loss": 0.3219, "step": 17190 }, { "epoch": 238.89, "learning_rate": 2.149714285714286e-05, "loss": 0.3181, "step": 17200 }, { "epoch": 239.0, "eval_loss": 0.6066352128982544, "eval_runtime": 129.1933, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.21957961046474256, "step": 17208 }, { "epoch": 239.03, "learning_rate": 2.1485714285714288e-05, "loss": 0.3227, "step": 17210 }, { "epoch": 239.17, "learning_rate": 2.1474285714285714e-05, "loss": 0.3273, "step": 17220 }, { "epoch": 239.3, "learning_rate": 2.1462857142857145e-05, "loss": 0.3231, "step": 17230 }, { "epoch": 239.44, "learning_rate": 2.145142857142857e-05, "loss": 0.315, "step": 17240 }, { "epoch": 239.58, "learning_rate": 2.144e-05, "loss": 0.3191, "step": 17250 }, { "epoch": 239.72, "learning_rate": 2.1428571428571428e-05, "loss": 0.3355, "step": 17260 }, { "epoch": 239.86, "learning_rate": 2.141714285714286e-05, "loss": 0.3325, "step": 17270 }, { "epoch": 240.0, "learning_rate": 2.140571428571429e-05, "loss": 0.3201, "step": 17280 }, { "epoch": 240.0, "eval_loss": 0.6012704968452454, "eval_runtime": 129.0145, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.2223436395191875, "step": 17280 }, { "epoch": 240.14, "learning_rate": 2.1394285714285715e-05, "loss": 0.3273, "step": 17290 }, { "epoch": 240.28, "learning_rate": 2.1382857142857145e-05, "loss": 0.3184, "step": 17300 }, { "epoch": 240.42, "learning_rate": 2.1371428571428572e-05, "loss": 0.3227, "step": 17310 }, { "epoch": 240.55, "learning_rate": 2.1360000000000002e-05, "loss": 0.311, "step": 17320 }, { "epoch": 240.69, "learning_rate": 2.134857142857143e-05, "loss": 0.3247, "step": 17330 }, { "epoch": 240.83, "learning_rate": 2.133714285714286e-05, "loss": 0.317, "step": 17340 }, { "epoch": 240.97, "learning_rate": 2.1325714285714286e-05, "loss": 0.3242, "step": 17350 }, { "epoch": 241.0, "eval_loss": 0.5960102677345276, "eval_runtime": 129.4308, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.2207366458828823, "step": 17352 }, { "epoch": 241.11, "learning_rate": 2.1314285714285713e-05, "loss": 0.32, "step": 17360 }, { "epoch": 241.25, "learning_rate": 2.1302857142857146e-05, "loss": 0.311, "step": 17370 }, { "epoch": 241.39, "learning_rate": 2.1291428571428573e-05, "loss": 0.3091, "step": 17380 }, { "epoch": 241.53, "learning_rate": 2.1280000000000003e-05, "loss": 0.3154, "step": 17390 }, { "epoch": 241.66, "learning_rate": 2.126857142857143e-05, "loss": 0.3252, "step": 17400 }, { "epoch": 241.8, "learning_rate": 2.125714285714286e-05, "loss": 0.3213, "step": 17410 }, { "epoch": 241.94, "learning_rate": 2.1245714285714287e-05, "loss": 0.3194, "step": 17420 }, { "epoch": 242.0, "eval_loss": 0.609286904335022, "eval_runtime": 129.3361, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.23114996464614, "step": 17424 }, { "epoch": 242.08, "learning_rate": 2.1234285714285713e-05, "loss": 0.3141, "step": 17430 }, { "epoch": 242.22, "learning_rate": 2.1222857142857143e-05, "loss": 0.3217, "step": 17440 }, { "epoch": 242.36, "learning_rate": 2.121142857142857e-05, "loss": 0.3198, "step": 17450 }, { "epoch": 242.5, "learning_rate": 2.1200000000000004e-05, "loss": 0.3267, "step": 17460 }, { "epoch": 242.64, "learning_rate": 2.118857142857143e-05, "loss": 0.3211, "step": 17470 }, { "epoch": 242.78, "learning_rate": 2.117714285714286e-05, "loss": 0.316, "step": 17480 }, { "epoch": 242.91, "learning_rate": 2.1165714285714287e-05, "loss": 0.3203, "step": 17490 }, { "epoch": 243.0, "eval_loss": 0.6047176122665405, "eval_runtime": 129.1457, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.228064536864434, "step": 17496 }, { "epoch": 243.06, "learning_rate": 2.1154285714285714e-05, "loss": 0.33, "step": 17500 }, { "epoch": 243.19, "learning_rate": 2.1142857142857144e-05, "loss": 0.3193, "step": 17510 }, { "epoch": 243.33, "learning_rate": 2.113142857142857e-05, "loss": 0.3265, "step": 17520 }, { "epoch": 243.47, "learning_rate": 2.112e-05, "loss": 0.3237, "step": 17530 }, { "epoch": 243.61, "learning_rate": 2.1108571428571428e-05, "loss": 0.314, "step": 17540 }, { "epoch": 243.75, "learning_rate": 2.109714285714286e-05, "loss": 0.3088, "step": 17550 }, { "epoch": 243.89, "learning_rate": 2.1085714285714288e-05, "loss": 0.3173, "step": 17560 }, { "epoch": 244.0, "eval_loss": 0.6260218620300293, "eval_runtime": 129.3351, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.22845021533714727, "step": 17568 }, { "epoch": 244.03, "learning_rate": 2.1074285714285715e-05, "loss": 0.3345, "step": 17570 }, { "epoch": 244.17, "learning_rate": 2.1062857142857145e-05, "loss": 0.3177, "step": 17580 }, { "epoch": 244.3, "learning_rate": 2.1051428571428572e-05, "loss": 0.3152, "step": 17590 }, { "epoch": 244.44, "learning_rate": 2.1040000000000002e-05, "loss": 0.3202, "step": 17600 }, { "epoch": 244.58, "learning_rate": 2.102857142857143e-05, "loss": 0.3094, "step": 17610 }, { "epoch": 244.72, "learning_rate": 2.101714285714286e-05, "loss": 0.3241, "step": 17620 }, { "epoch": 244.86, "learning_rate": 2.1005714285714285e-05, "loss": 0.3114, "step": 17630 }, { "epoch": 245.0, "learning_rate": 2.099428571428572e-05, "loss": 0.3118, "step": 17640 }, { "epoch": 245.0, "eval_loss": 0.5961326360702515, "eval_runtime": 129.3255, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.22433631162820594, "step": 17640 }, { "epoch": 245.14, "learning_rate": 2.0982857142857146e-05, "loss": 0.3148, "step": 17650 }, { "epoch": 245.28, "learning_rate": 2.0971428571428572e-05, "loss": 0.3216, "step": 17660 }, { "epoch": 245.42, "learning_rate": 2.0960000000000003e-05, "loss": 0.3144, "step": 17670 }, { "epoch": 245.55, "learning_rate": 2.094857142857143e-05, "loss": 0.316, "step": 17680 }, { "epoch": 245.69, "learning_rate": 2.093714285714286e-05, "loss": 0.3131, "step": 17690 }, { "epoch": 245.83, "learning_rate": 2.0925714285714286e-05, "loss": 0.2971, "step": 17700 }, { "epoch": 245.97, "learning_rate": 2.091428571428572e-05, "loss": 0.3172, "step": 17710 }, { "epoch": 246.0, "eval_loss": 0.6314952373504639, "eval_runtime": 129.1896, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22420775213730154, "step": 17712 }, { "epoch": 246.11, "learning_rate": 2.0902857142857143e-05, "loss": 0.3137, "step": 17720 }, { "epoch": 246.25, "learning_rate": 2.089142857142857e-05, "loss": 0.3164, "step": 17730 }, { "epoch": 246.39, "learning_rate": 2.0880000000000003e-05, "loss": 0.31, "step": 17740 }, { "epoch": 246.53, "learning_rate": 2.086857142857143e-05, "loss": 0.3156, "step": 17750 }, { "epoch": 246.66, "learning_rate": 2.085714285714286e-05, "loss": 0.3194, "step": 17760 }, { "epoch": 246.8, "learning_rate": 2.0845714285714287e-05, "loss": 0.3181, "step": 17770 }, { "epoch": 246.94, "learning_rate": 2.0834285714285717e-05, "loss": 0.332, "step": 17780 }, { "epoch": 247.0, "eval_loss": 0.6412584185600281, "eval_runtime": 128.904, "eval_samples_per_second": 4.127, "eval_steps_per_second": 0.52, "eval_wer": 0.22504338882818023, "step": 17784 }, { "epoch": 247.08, "learning_rate": 2.0822857142857144e-05, "loss": 0.3254, "step": 17790 }, { "epoch": 247.22, "learning_rate": 2.081142857142857e-05, "loss": 0.3211, "step": 17800 }, { "epoch": 247.36, "learning_rate": 2.08e-05, "loss": 0.328, "step": 17810 }, { "epoch": 247.5, "learning_rate": 2.0788571428571427e-05, "loss": 0.3229, "step": 17820 }, { "epoch": 247.64, "learning_rate": 2.077714285714286e-05, "loss": 0.3227, "step": 17830 }, { "epoch": 247.78, "learning_rate": 2.0765714285714288e-05, "loss": 0.3134, "step": 17840 }, { "epoch": 247.91, "learning_rate": 2.0754285714285718e-05, "loss": 0.3315, "step": 17850 }, { "epoch": 248.0, "eval_loss": 0.6260495781898499, "eval_runtime": 129.1436, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.22902873304621713, "step": 17856 }, { "epoch": 248.06, "learning_rate": 2.0742857142857145e-05, "loss": 0.3209, "step": 17860 }, { "epoch": 248.19, "learning_rate": 2.073142857142857e-05, "loss": 0.327, "step": 17870 }, { "epoch": 248.33, "learning_rate": 2.072e-05, "loss": 0.3176, "step": 17880 }, { "epoch": 248.47, "learning_rate": 2.0708571428571428e-05, "loss": 0.3243, "step": 17890 }, { "epoch": 248.61, "learning_rate": 2.069714285714286e-05, "loss": 0.3223, "step": 17900 }, { "epoch": 248.75, "learning_rate": 2.0685714285714285e-05, "loss": 0.3236, "step": 17910 }, { "epoch": 248.89, "learning_rate": 2.067428571428572e-05, "loss": 0.3222, "step": 17920 }, { "epoch": 249.0, "eval_loss": 0.6174905896186829, "eval_runtime": 129.2962, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.23070000642797456, "step": 17928 }, { "epoch": 249.03, "learning_rate": 2.0662857142857145e-05, "loss": 0.3255, "step": 17930 }, { "epoch": 249.17, "learning_rate": 2.0651428571428572e-05, "loss": 0.3246, "step": 17940 }, { "epoch": 249.3, "learning_rate": 2.0640000000000002e-05, "loss": 0.3156, "step": 17950 }, { "epoch": 249.44, "learning_rate": 2.062857142857143e-05, "loss": 0.3278, "step": 17960 }, { "epoch": 249.58, "learning_rate": 2.061714285714286e-05, "loss": 0.3164, "step": 17970 }, { "epoch": 249.72, "learning_rate": 2.0605714285714286e-05, "loss": 0.3297, "step": 17980 }, { "epoch": 249.86, "learning_rate": 2.059428571428572e-05, "loss": 0.3132, "step": 17990 }, { "epoch": 250.0, "learning_rate": 2.0582857142857143e-05, "loss": 0.3291, "step": 18000 }, { "epoch": 250.0, "eval_loss": 0.6004659533500671, "eval_runtime": 129.0389, "eval_samples_per_second": 4.123, "eval_steps_per_second": 0.519, "eval_wer": 0.22825737610079064, "step": 18000 }, { "epoch": 250.14, "learning_rate": 2.057142857142857e-05, "loss": 0.3356, "step": 18010 }, { "epoch": 250.28, "learning_rate": 2.0560000000000003e-05, "loss": 0.326, "step": 18020 }, { "epoch": 250.42, "learning_rate": 2.054857142857143e-05, "loss": 0.3173, "step": 18030 }, { "epoch": 250.55, "learning_rate": 2.053714285714286e-05, "loss": 0.3185, "step": 18040 }, { "epoch": 250.69, "learning_rate": 2.0525714285714287e-05, "loss": 0.3373, "step": 18050 }, { "epoch": 250.83, "learning_rate": 2.0514285714285717e-05, "loss": 0.3318, "step": 18060 }, { "epoch": 250.97, "learning_rate": 2.0502857142857144e-05, "loss": 0.3321, "step": 18070 }, { "epoch": 251.0, "eval_loss": 0.6299486756324768, "eval_runtime": 129.1139, "eval_samples_per_second": 4.12, "eval_steps_per_second": 0.519, "eval_wer": 0.23114996464614, "step": 18072 }, { "epoch": 251.11, "learning_rate": 2.049142857142857e-05, "loss": 0.323, "step": 18080 }, { "epoch": 251.25, "learning_rate": 2.048e-05, "loss": 0.3378, "step": 18090 }, { "epoch": 251.39, "learning_rate": 2.0468571428571427e-05, "loss": 0.3254, "step": 18100 }, { "epoch": 251.53, "learning_rate": 2.045714285714286e-05, "loss": 0.3231, "step": 18110 }, { "epoch": 251.66, "learning_rate": 2.0445714285714287e-05, "loss": 0.3249, "step": 18120 }, { "epoch": 251.8, "learning_rate": 2.0434285714285718e-05, "loss": 0.3227, "step": 18130 }, { "epoch": 251.94, "learning_rate": 2.0422857142857144e-05, "loss": 0.3338, "step": 18140 }, { "epoch": 252.0, "eval_loss": 0.6010589003562927, "eval_runtime": 129.4425, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.2310214051552356, "step": 18144 }, { "epoch": 252.08, "learning_rate": 2.041142857142857e-05, "loss": 0.3157, "step": 18150 }, { "epoch": 252.22, "learning_rate": 2.04e-05, "loss": 0.3118, "step": 18160 }, { "epoch": 252.36, "learning_rate": 2.0388571428571428e-05, "loss": 0.3096, "step": 18170 }, { "epoch": 252.5, "learning_rate": 2.037714285714286e-05, "loss": 0.319, "step": 18180 }, { "epoch": 252.64, "learning_rate": 2.0365714285714285e-05, "loss": 0.3209, "step": 18190 }, { "epoch": 252.78, "learning_rate": 2.035428571428572e-05, "loss": 0.3285, "step": 18200 }, { "epoch": 252.91, "learning_rate": 2.0342857142857145e-05, "loss": 0.3274, "step": 18210 }, { "epoch": 253.0, "eval_loss": 0.5661605000495911, "eval_runtime": 130.6733, "eval_samples_per_second": 4.071, "eval_steps_per_second": 0.513, "eval_wer": 0.22028668766471685, "step": 18216 }, { "epoch": 253.06, "learning_rate": 2.0331428571428575e-05, "loss": 0.3128, "step": 18220 }, { "epoch": 253.19, "learning_rate": 2.0320000000000002e-05, "loss": 0.3211, "step": 18230 }, { "epoch": 253.33, "learning_rate": 2.030857142857143e-05, "loss": 0.3122, "step": 18240 }, { "epoch": 253.47, "learning_rate": 2.029714285714286e-05, "loss": 0.3213, "step": 18250 }, { "epoch": 253.61, "learning_rate": 2.0285714285714286e-05, "loss": 0.3163, "step": 18260 }, { "epoch": 253.75, "learning_rate": 2.027428571428572e-05, "loss": 0.3322, "step": 18270 }, { "epoch": 253.89, "learning_rate": 2.0262857142857142e-05, "loss": 0.3148, "step": 18280 }, { "epoch": 254.0, "eval_loss": 0.6139088869094849, "eval_runtime": 129.3719, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.2344282316642026, "step": 18288 }, { "epoch": 254.03, "learning_rate": 2.0251428571428576e-05, "loss": 0.3416, "step": 18290 }, { "epoch": 254.17, "learning_rate": 2.0240000000000003e-05, "loss": 0.3301, "step": 18300 }, { "epoch": 254.3, "learning_rate": 2.022857142857143e-05, "loss": 0.3311, "step": 18310 }, { "epoch": 254.44, "learning_rate": 2.021714285714286e-05, "loss": 0.3338, "step": 18320 }, { "epoch": 254.58, "learning_rate": 2.0205714285714286e-05, "loss": 0.3303, "step": 18330 }, { "epoch": 254.72, "learning_rate": 2.0194285714285716e-05, "loss": 0.3335, "step": 18340 }, { "epoch": 254.86, "learning_rate": 2.0182857142857143e-05, "loss": 0.3295, "step": 18350 }, { "epoch": 255.0, "learning_rate": 2.0171428571428577e-05, "loss": 0.3295, "step": 18360 }, { "epoch": 255.0, "eval_loss": 0.6183280944824219, "eval_runtime": 129.8414, "eval_samples_per_second": 4.097, "eval_steps_per_second": 0.516, "eval_wer": 0.24606286559105225, "step": 18360 }, { "epoch": 255.14, "learning_rate": 2.016e-05, "loss": 0.3335, "step": 18370 }, { "epoch": 255.28, "learning_rate": 2.0148571428571427e-05, "loss": 0.3275, "step": 18380 }, { "epoch": 255.42, "learning_rate": 2.013714285714286e-05, "loss": 0.3344, "step": 18390 }, { "epoch": 255.55, "learning_rate": 2.0125714285714287e-05, "loss": 0.3281, "step": 18400 }, { "epoch": 255.69, "learning_rate": 2.0114285714285717e-05, "loss": 0.3303, "step": 18410 }, { "epoch": 255.83, "learning_rate": 2.0102857142857144e-05, "loss": 0.3224, "step": 18420 }, { "epoch": 255.97, "learning_rate": 2.0091428571428574e-05, "loss": 0.3169, "step": 18430 }, { "epoch": 256.0, "eval_loss": 0.6135612726211548, "eval_runtime": 129.225, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.518, "eval_wer": 0.22832165584624284, "step": 18432 }, { "epoch": 256.11, "learning_rate": 2.008e-05, "loss": 0.3272, "step": 18440 }, { "epoch": 256.25, "learning_rate": 2.0068571428571428e-05, "loss": 0.3333, "step": 18450 }, { "epoch": 256.39, "learning_rate": 2.005714285714286e-05, "loss": 0.3197, "step": 18460 }, { "epoch": 256.53, "learning_rate": 2.0045714285714284e-05, "loss": 0.3352, "step": 18470 }, { "epoch": 256.66, "learning_rate": 2.0034285714285718e-05, "loss": 0.3371, "step": 18480 }, { "epoch": 256.8, "learning_rate": 2.0022857142857145e-05, "loss": 0.3341, "step": 18490 }, { "epoch": 256.94, "learning_rate": 2.0011428571428575e-05, "loss": 0.3431, "step": 18500 }, { "epoch": 257.0, "eval_loss": 0.6445194482803345, "eval_runtime": 129.3941, "eval_samples_per_second": 4.111, "eval_steps_per_second": 0.518, "eval_wer": 0.24458443144565148, "step": 18504 }, { "epoch": 257.08, "learning_rate": 2e-05, "loss": 0.3428, "step": 18510 }, { "epoch": 257.22, "learning_rate": 1.9988571428571432e-05, "loss": 0.3437, "step": 18520 }, { "epoch": 257.36, "learning_rate": 1.997714285714286e-05, "loss": 0.3318, "step": 18530 }, { "epoch": 257.5, "learning_rate": 1.996571428571429e-05, "loss": 0.34, "step": 18540 }, { "epoch": 257.64, "learning_rate": 1.9954285714285715e-05, "loss": 0.3337, "step": 18550 }, { "epoch": 257.78, "learning_rate": 1.9942857142857142e-05, "loss": 0.3303, "step": 18560 }, { "epoch": 257.91, "learning_rate": 1.9931428571428572e-05, "loss": 0.3209, "step": 18570 }, { "epoch": 258.0, "eval_loss": 0.612432599067688, "eval_runtime": 129.5906, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.24374879475477276, "step": 18576 }, { "epoch": 258.06, "learning_rate": 1.9920000000000002e-05, "loss": 0.3379, "step": 18580 }, { "epoch": 258.19, "learning_rate": 1.990857142857143e-05, "loss": 0.3428, "step": 18590 }, { "epoch": 258.33, "learning_rate": 1.989714285714286e-05, "loss": 0.3348, "step": 18600 }, { "epoch": 258.47, "learning_rate": 1.988571428571429e-05, "loss": 0.3306, "step": 18610 }, { "epoch": 258.61, "learning_rate": 1.9874285714285716e-05, "loss": 0.3312, "step": 18620 }, { "epoch": 258.75, "learning_rate": 1.9862857142857143e-05, "loss": 0.3323, "step": 18630 }, { "epoch": 258.89, "learning_rate": 1.9851428571428573e-05, "loss": 0.3405, "step": 18640 }, { "epoch": 259.0, "eval_loss": 0.6209958791732788, "eval_runtime": 129.1781, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.24464871119110368, "step": 18648 }, { "epoch": 259.03, "learning_rate": 1.9840000000000003e-05, "loss": 0.3451, "step": 18650 }, { "epoch": 259.17, "learning_rate": 1.982857142857143e-05, "loss": 0.3263, "step": 18660 }, { "epoch": 259.3, "learning_rate": 1.981714285714286e-05, "loss": 0.3422, "step": 18670 }, { "epoch": 259.44, "learning_rate": 1.9805714285714287e-05, "loss": 0.3271, "step": 18680 }, { "epoch": 259.58, "learning_rate": 1.9794285714285717e-05, "loss": 0.3328, "step": 18690 }, { "epoch": 259.72, "learning_rate": 1.9782857142857144e-05, "loss": 0.3363, "step": 18700 }, { "epoch": 259.86, "learning_rate": 1.9771428571428574e-05, "loss": 0.3217, "step": 18710 }, { "epoch": 260.0, "learning_rate": 1.976e-05, "loss": 0.3317, "step": 18720 }, { "epoch": 260.0, "eval_loss": 0.6088146567344666, "eval_runtime": 129.0971, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.23500674937327248, "step": 18720 }, { "epoch": 260.14, "learning_rate": 1.974857142857143e-05, "loss": 0.3304, "step": 18730 }, { "epoch": 260.28, "learning_rate": 1.973714285714286e-05, "loss": 0.3258, "step": 18740 }, { "epoch": 260.42, "learning_rate": 1.9725714285714288e-05, "loss": 0.3243, "step": 18750 }, { "epoch": 260.55, "learning_rate": 1.9714285714285718e-05, "loss": 0.3194, "step": 18760 }, { "epoch": 260.69, "learning_rate": 1.9702857142857144e-05, "loss": 0.3228, "step": 18770 }, { "epoch": 260.83, "learning_rate": 1.969142857142857e-05, "loss": 0.3223, "step": 18780 }, { "epoch": 260.97, "learning_rate": 1.968e-05, "loss": 0.3265, "step": 18790 }, { "epoch": 261.0, "eval_loss": 0.579181969165802, "eval_runtime": 132.5859, "eval_samples_per_second": 4.012, "eval_steps_per_second": 0.505, "eval_wer": 0.23237127980973196, "step": 18792 }, { "epoch": 261.11, "learning_rate": 1.966857142857143e-05, "loss": 0.3255, "step": 18800 }, { "epoch": 261.25, "learning_rate": 1.9657142857142858e-05, "loss": 0.3163, "step": 18810 }, { "epoch": 261.39, "learning_rate": 1.964571428571429e-05, "loss": 0.3142, "step": 18820 }, { "epoch": 261.53, "learning_rate": 1.963428571428572e-05, "loss": 0.3284, "step": 18830 }, { "epoch": 261.66, "learning_rate": 1.9622857142857142e-05, "loss": 0.3285, "step": 18840 }, { "epoch": 261.8, "learning_rate": 1.9611428571428572e-05, "loss": 0.3297, "step": 18850 }, { "epoch": 261.94, "learning_rate": 1.9600000000000002e-05, "loss": 0.332, "step": 18860 }, { "epoch": 262.0, "eval_loss": 0.632605254650116, "eval_runtime": 129.2806, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.24272031882753745, "step": 18864 }, { "epoch": 262.08, "learning_rate": 1.958857142857143e-05, "loss": 0.3458, "step": 18870 }, { "epoch": 262.22, "learning_rate": 1.957714285714286e-05, "loss": 0.3289, "step": 18880 }, { "epoch": 262.36, "learning_rate": 1.956571428571429e-05, "loss": 0.3139, "step": 18890 }, { "epoch": 262.5, "learning_rate": 1.9554285714285716e-05, "loss": 0.3211, "step": 18900 }, { "epoch": 262.64, "learning_rate": 1.9542857142857143e-05, "loss": 0.3196, "step": 18910 }, { "epoch": 262.78, "learning_rate": 1.9531428571428573e-05, "loss": 0.3162, "step": 18920 }, { "epoch": 262.91, "learning_rate": 1.9520000000000003e-05, "loss": 0.3179, "step": 18930 }, { "epoch": 263.0, "eval_loss": 0.617436408996582, "eval_runtime": 129.2601, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.22562190653725012, "step": 18936 }, { "epoch": 263.06, "learning_rate": 1.950857142857143e-05, "loss": 0.3198, "step": 18940 }, { "epoch": 263.19, "learning_rate": 1.949714285714286e-05, "loss": 0.3221, "step": 18950 }, { "epoch": 263.33, "learning_rate": 1.9485714285714286e-05, "loss": 0.3053, "step": 18960 }, { "epoch": 263.47, "learning_rate": 1.9474285714285717e-05, "loss": 0.3145, "step": 18970 }, { "epoch": 263.61, "learning_rate": 1.9462857142857147e-05, "loss": 0.309, "step": 18980 }, { "epoch": 263.75, "learning_rate": 1.9451428571428573e-05, "loss": 0.322, "step": 18990 }, { "epoch": 263.89, "learning_rate": 1.944e-05, "loss": 0.3119, "step": 19000 }, { "epoch": 264.0, "eval_loss": 0.6337862014770508, "eval_runtime": 129.5529, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.22774313813717298, "step": 19008 }, { "epoch": 264.03, "learning_rate": 1.942857142857143e-05, "loss": 0.3298, "step": 19010 }, { "epoch": 264.17, "learning_rate": 1.941714285714286e-05, "loss": 0.3136, "step": 19020 }, { "epoch": 264.3, "learning_rate": 1.9405714285714287e-05, "loss": 0.3137, "step": 19030 }, { "epoch": 264.44, "learning_rate": 1.9394285714285717e-05, "loss": 0.3247, "step": 19040 }, { "epoch": 264.58, "learning_rate": 1.9382857142857144e-05, "loss": 0.302, "step": 19050 }, { "epoch": 264.72, "learning_rate": 1.937142857142857e-05, "loss": 0.3158, "step": 19060 }, { "epoch": 264.86, "learning_rate": 1.936e-05, "loss": 0.3044, "step": 19070 }, { "epoch": 265.0, "learning_rate": 1.934857142857143e-05, "loss": 0.3223, "step": 19080 }, { "epoch": 265.0, "eval_loss": 0.6236149072647095, "eval_runtime": 129.0959, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.22131516359195216, "step": 19080 }, { "epoch": 265.14, "learning_rate": 1.9337142857142858e-05, "loss": 0.3156, "step": 19090 }, { "epoch": 265.28, "learning_rate": 1.9325714285714288e-05, "loss": 0.3173, "step": 19100 }, { "epoch": 265.42, "learning_rate": 1.9314285714285718e-05, "loss": 0.3034, "step": 19110 }, { "epoch": 265.55, "learning_rate": 1.9302857142857145e-05, "loss": 0.3045, "step": 19120 }, { "epoch": 265.69, "learning_rate": 1.929142857142857e-05, "loss": 0.3218, "step": 19130 }, { "epoch": 265.83, "learning_rate": 1.9280000000000002e-05, "loss": 0.3018, "step": 19140 }, { "epoch": 265.97, "learning_rate": 1.926857142857143e-05, "loss": 0.315, "step": 19150 }, { "epoch": 266.0, "eval_loss": 0.6025270223617554, "eval_runtime": 128.9816, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.519, "eval_wer": 0.2263289837372244, "step": 19152 }, { "epoch": 266.11, "learning_rate": 1.925714285714286e-05, "loss": 0.3082, "step": 19160 }, { "epoch": 266.25, "learning_rate": 1.924571428571429e-05, "loss": 0.3129, "step": 19170 }, { "epoch": 266.39, "learning_rate": 1.9234285714285716e-05, "loss": 0.3068, "step": 19180 }, { "epoch": 266.53, "learning_rate": 1.9222857142857146e-05, "loss": 0.3137, "step": 19190 }, { "epoch": 266.66, "learning_rate": 1.9211428571428572e-05, "loss": 0.3103, "step": 19200 }, { "epoch": 266.8, "learning_rate": 1.9200000000000003e-05, "loss": 0.3061, "step": 19210 }, { "epoch": 266.94, "learning_rate": 1.918857142857143e-05, "loss": 0.3214, "step": 19220 }, { "epoch": 267.0, "eval_loss": 0.5880905389785767, "eval_runtime": 129.5754, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.22433631162820594, "step": 19224 }, { "epoch": 267.08, "learning_rate": 1.917714285714286e-05, "loss": 0.3195, "step": 19230 }, { "epoch": 267.22, "learning_rate": 1.9165714285714286e-05, "loss": 0.3063, "step": 19240 }, { "epoch": 267.36, "learning_rate": 1.9154285714285716e-05, "loss": 0.2926, "step": 19250 }, { "epoch": 267.5, "learning_rate": 1.9142857142857146e-05, "loss": 0.3081, "step": 19260 }, { "epoch": 267.64, "learning_rate": 1.9131428571428573e-05, "loss": 0.3106, "step": 19270 }, { "epoch": 267.78, "learning_rate": 1.912e-05, "loss": 0.3022, "step": 19280 }, { "epoch": 267.91, "learning_rate": 1.910857142857143e-05, "loss": 0.3184, "step": 19290 }, { "epoch": 268.0, "eval_loss": 0.59419846534729, "eval_runtime": 129.5752, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.22253647875554414, "step": 19296 }, { "epoch": 268.06, "learning_rate": 1.909714285714286e-05, "loss": 0.3095, "step": 19300 }, { "epoch": 268.19, "learning_rate": 1.9085714285714287e-05, "loss": 0.3092, "step": 19310 }, { "epoch": 268.33, "learning_rate": 1.9074285714285717e-05, "loss": 0.3166, "step": 19320 }, { "epoch": 268.47, "learning_rate": 1.9062857142857144e-05, "loss": 0.3077, "step": 19330 }, { "epoch": 268.61, "learning_rate": 1.9051428571428574e-05, "loss": 0.2951, "step": 19340 }, { "epoch": 268.75, "learning_rate": 1.904e-05, "loss": 0.3049, "step": 19350 }, { "epoch": 268.89, "learning_rate": 1.902857142857143e-05, "loss": 0.3083, "step": 19360 }, { "epoch": 269.0, "eval_loss": 0.5835778117179871, "eval_runtime": 129.6825, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.22086520537378673, "step": 19368 }, { "epoch": 269.03, "learning_rate": 1.9017142857142858e-05, "loss": 0.3139, "step": 19370 }, { "epoch": 269.17, "learning_rate": 1.9005714285714288e-05, "loss": 0.312, "step": 19380 }, { "epoch": 269.3, "learning_rate": 1.8994285714285718e-05, "loss": 0.294, "step": 19390 }, { "epoch": 269.44, "learning_rate": 1.8982857142857145e-05, "loss": 0.302, "step": 19400 }, { "epoch": 269.58, "learning_rate": 1.8971428571428575e-05, "loss": 0.2941, "step": 19410 }, { "epoch": 269.72, "learning_rate": 1.896e-05, "loss": 0.3132, "step": 19420 }, { "epoch": 269.86, "learning_rate": 1.8948571428571428e-05, "loss": 0.3056, "step": 19430 }, { "epoch": 270.0, "learning_rate": 1.893714285714286e-05, "loss": 0.3098, "step": 19440 }, { "epoch": 270.0, "eval_loss": 0.5843570232391357, "eval_runtime": 129.4036, "eval_samples_per_second": 4.111, "eval_steps_per_second": 0.518, "eval_wer": 0.2191939319920293, "step": 19440 }, { "epoch": 270.14, "learning_rate": 1.892571428571429e-05, "loss": 0.3017, "step": 19450 }, { "epoch": 270.28, "learning_rate": 1.8914285714285715e-05, "loss": 0.3093, "step": 19460 }, { "epoch": 270.42, "learning_rate": 1.8902857142857145e-05, "loss": 0.3101, "step": 19470 }, { "epoch": 270.55, "learning_rate": 1.8891428571428575e-05, "loss": 0.2984, "step": 19480 }, { "epoch": 270.69, "learning_rate": 1.8880000000000002e-05, "loss": 0.3014, "step": 19490 }, { "epoch": 270.83, "learning_rate": 1.886857142857143e-05, "loss": 0.3051, "step": 19500 }, { "epoch": 270.97, "learning_rate": 1.885714285714286e-05, "loss": 0.2992, "step": 19510 }, { "epoch": 271.0, "eval_loss": 0.5972372889518738, "eval_runtime": 129.1594, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.22182940155556985, "step": 19512 }, { "epoch": 271.11, "learning_rate": 1.8845714285714286e-05, "loss": 0.2972, "step": 19520 }, { "epoch": 271.25, "learning_rate": 1.8834285714285716e-05, "loss": 0.2992, "step": 19530 }, { "epoch": 271.39, "learning_rate": 1.8822857142857146e-05, "loss": 0.2979, "step": 19540 }, { "epoch": 271.53, "learning_rate": 1.8811428571428573e-05, "loss": 0.2974, "step": 19550 }, { "epoch": 271.66, "learning_rate": 1.88e-05, "loss": 0.2993, "step": 19560 }, { "epoch": 271.8, "learning_rate": 1.878857142857143e-05, "loss": 0.3028, "step": 19570 }, { "epoch": 271.94, "learning_rate": 1.877714285714286e-05, "loss": 0.3118, "step": 19580 }, { "epoch": 272.0, "eval_loss": 0.5768290162086487, "eval_runtime": 129.2876, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22202224079192645, "step": 19584 }, { "epoch": 272.08, "learning_rate": 1.8765714285714287e-05, "loss": 0.3104, "step": 19590 }, { "epoch": 272.22, "learning_rate": 1.8754285714285717e-05, "loss": 0.3218, "step": 19600 }, { "epoch": 272.36, "learning_rate": 1.8742857142857143e-05, "loss": 0.3009, "step": 19610 }, { "epoch": 272.5, "learning_rate": 1.8731428571428574e-05, "loss": 0.3087, "step": 19620 }, { "epoch": 272.64, "learning_rate": 1.8720000000000004e-05, "loss": 0.299, "step": 19630 }, { "epoch": 272.78, "learning_rate": 1.870857142857143e-05, "loss": 0.3102, "step": 19640 }, { "epoch": 272.91, "learning_rate": 1.8697142857142857e-05, "loss": 0.3112, "step": 19650 }, { "epoch": 273.0, "eval_loss": 0.5926473736763, "eval_runtime": 129.3255, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2166870219193932, "step": 19656 }, { "epoch": 273.06, "learning_rate": 1.8685714285714287e-05, "loss": 0.3125, "step": 19660 }, { "epoch": 273.19, "learning_rate": 1.8674285714285717e-05, "loss": 0.3066, "step": 19670 }, { "epoch": 273.33, "learning_rate": 1.8662857142857144e-05, "loss": 0.3018, "step": 19680 }, { "epoch": 273.47, "learning_rate": 1.8651428571428574e-05, "loss": 0.3127, "step": 19690 }, { "epoch": 273.61, "learning_rate": 1.864e-05, "loss": 0.2984, "step": 19700 }, { "epoch": 273.75, "learning_rate": 1.8628571428571428e-05, "loss": 0.2975, "step": 19710 }, { "epoch": 273.89, "learning_rate": 1.8617142857142858e-05, "loss": 0.2994, "step": 19720 }, { "epoch": 274.0, "eval_loss": 0.6055723428726196, "eval_runtime": 129.8983, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.22266503824644854, "step": 19728 }, { "epoch": 274.03, "learning_rate": 1.8605714285714288e-05, "loss": 0.3229, "step": 19730 }, { "epoch": 274.17, "learning_rate": 1.8594285714285715e-05, "loss": 0.3056, "step": 19740 }, { "epoch": 274.3, "learning_rate": 1.8582857142857145e-05, "loss": 0.2943, "step": 19750 }, { "epoch": 274.44, "learning_rate": 1.8571428571428575e-05, "loss": 0.3085, "step": 19760 }, { "epoch": 274.58, "learning_rate": 1.8560000000000002e-05, "loss": 0.3124, "step": 19770 }, { "epoch": 274.72, "learning_rate": 1.854857142857143e-05, "loss": 0.3012, "step": 19780 }, { "epoch": 274.86, "learning_rate": 1.853714285714286e-05, "loss": 0.2977, "step": 19790 }, { "epoch": 275.0, "learning_rate": 1.8525714285714285e-05, "loss": 0.3041, "step": 19800 }, { "epoch": 275.0, "eval_loss": 0.5793389081954956, "eval_runtime": 129.2795, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22452915086456257, "step": 19800 }, { "epoch": 275.14, "learning_rate": 1.8514285714285716e-05, "loss": 0.3149, "step": 19810 }, { "epoch": 275.28, "learning_rate": 1.8502857142857146e-05, "loss": 0.3031, "step": 19820 }, { "epoch": 275.42, "learning_rate": 1.8491428571428573e-05, "loss": 0.2928, "step": 19830 }, { "epoch": 275.55, "learning_rate": 1.8480000000000003e-05, "loss": 0.2995, "step": 19840 }, { "epoch": 275.69, "learning_rate": 1.846857142857143e-05, "loss": 0.3137, "step": 19850 }, { "epoch": 275.83, "learning_rate": 1.845714285714286e-05, "loss": 0.2946, "step": 19860 }, { "epoch": 275.97, "learning_rate": 1.8445714285714286e-05, "loss": 0.3072, "step": 19870 }, { "epoch": 276.0, "eval_loss": 0.6187883615493774, "eval_runtime": 129.543, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22767885839172078, "step": 19872 }, { "epoch": 276.11, "learning_rate": 1.8434285714285716e-05, "loss": 0.3094, "step": 19880 }, { "epoch": 276.25, "learning_rate": 1.8422857142857143e-05, "loss": 0.3155, "step": 19890 }, { "epoch": 276.39, "learning_rate": 1.8411428571428573e-05, "loss": 0.3029, "step": 19900 }, { "epoch": 276.53, "learning_rate": 1.8400000000000003e-05, "loss": 0.3065, "step": 19910 }, { "epoch": 276.66, "learning_rate": 1.838857142857143e-05, "loss": 0.2989, "step": 19920 }, { "epoch": 276.8, "learning_rate": 1.8377142857142857e-05, "loss": 0.303, "step": 19930 }, { "epoch": 276.94, "learning_rate": 1.8365714285714287e-05, "loss": 0.3042, "step": 19940 }, { "epoch": 277.0, "eval_loss": 0.5931434631347656, "eval_runtime": 129.2928, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22510766857363246, "step": 19944 }, { "epoch": 277.08, "learning_rate": 1.8354285714285717e-05, "loss": 0.3014, "step": 19950 }, { "epoch": 277.22, "learning_rate": 1.8342857142857144e-05, "loss": 0.3191, "step": 19960 }, { "epoch": 277.36, "learning_rate": 1.8331428571428574e-05, "loss": 0.2934, "step": 19970 }, { "epoch": 277.5, "learning_rate": 1.832e-05, "loss": 0.3073, "step": 19980 }, { "epoch": 277.64, "learning_rate": 1.830857142857143e-05, "loss": 0.3115, "step": 19990 }, { "epoch": 277.78, "learning_rate": 1.8297142857142858e-05, "loss": 0.3026, "step": 20000 }, { "epoch": 277.91, "learning_rate": 1.8285714285714288e-05, "loss": 0.3107, "step": 20010 }, { "epoch": 278.0, "eval_loss": 0.6204590797424316, "eval_runtime": 129.1836, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22163656231921322, "step": 20016 }, { "epoch": 278.06, "learning_rate": 1.8274285714285715e-05, "loss": 0.3159, "step": 20020 }, { "epoch": 278.19, "learning_rate": 1.8262857142857145e-05, "loss": 0.3114, "step": 20030 }, { "epoch": 278.33, "learning_rate": 1.8251428571428575e-05, "loss": 0.2971, "step": 20040 }, { "epoch": 278.47, "learning_rate": 1.824e-05, "loss": 0.3141, "step": 20050 }, { "epoch": 278.61, "learning_rate": 1.822857142857143e-05, "loss": 0.2922, "step": 20060 }, { "epoch": 278.75, "learning_rate": 1.821714285714286e-05, "loss": 0.3135, "step": 20070 }, { "epoch": 278.89, "learning_rate": 1.8205714285714285e-05, "loss": 0.3077, "step": 20080 }, { "epoch": 279.0, "eval_loss": 0.6001317501068115, "eval_runtime": 129.5418, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22086520537378673, "step": 20088 }, { "epoch": 279.03, "learning_rate": 1.8194285714285715e-05, "loss": 0.3064, "step": 20090 }, { "epoch": 279.17, "learning_rate": 1.8182857142857145e-05, "loss": 0.3224, "step": 20100 }, { "epoch": 279.3, "learning_rate": 1.8171428571428572e-05, "loss": 0.3031, "step": 20110 }, { "epoch": 279.44, "learning_rate": 1.8160000000000002e-05, "loss": 0.2987, "step": 20120 }, { "epoch": 279.58, "learning_rate": 1.8148571428571432e-05, "loss": 0.309, "step": 20130 }, { "epoch": 279.72, "learning_rate": 1.813714285714286e-05, "loss": 0.302, "step": 20140 }, { "epoch": 279.86, "learning_rate": 1.8125714285714286e-05, "loss": 0.2896, "step": 20150 }, { "epoch": 280.0, "learning_rate": 1.8114285714285716e-05, "loss": 0.2903, "step": 20160 }, { "epoch": 280.0, "eval_loss": 0.6002232432365417, "eval_runtime": 129.8361, "eval_samples_per_second": 4.097, "eval_steps_per_second": 0.516, "eval_wer": 0.2141158321013049, "step": 20160 }, { "epoch": 280.14, "learning_rate": 1.8102857142857143e-05, "loss": 0.3073, "step": 20170 }, { "epoch": 280.28, "learning_rate": 1.8091428571428573e-05, "loss": 0.308, "step": 20180 }, { "epoch": 280.42, "learning_rate": 1.8080000000000003e-05, "loss": 0.2982, "step": 20190 }, { "epoch": 280.55, "learning_rate": 1.806857142857143e-05, "loss": 0.3018, "step": 20200 }, { "epoch": 280.69, "learning_rate": 1.8057142857142857e-05, "loss": 0.2995, "step": 20210 }, { "epoch": 280.83, "learning_rate": 1.8045714285714287e-05, "loss": 0.3018, "step": 20220 }, { "epoch": 280.97, "learning_rate": 1.8034285714285717e-05, "loss": 0.3124, "step": 20230 }, { "epoch": 281.0, "eval_loss": 0.5781813263893127, "eval_runtime": 129.754, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.2167513016648454, "step": 20232 }, { "epoch": 281.11, "learning_rate": 1.8022857142857144e-05, "loss": 0.2999, "step": 20240 }, { "epoch": 281.25, "learning_rate": 1.8011428571428574e-05, "loss": 0.3009, "step": 20250 }, { "epoch": 281.39, "learning_rate": 1.8e-05, "loss": 0.2961, "step": 20260 }, { "epoch": 281.53, "learning_rate": 1.798857142857143e-05, "loss": 0.2975, "step": 20270 }, { "epoch": 281.66, "learning_rate": 1.797714285714286e-05, "loss": 0.3028, "step": 20280 }, { "epoch": 281.8, "learning_rate": 1.7966857142857143e-05, "loss": 0.3017, "step": 20290 }, { "epoch": 281.94, "learning_rate": 1.7955428571428573e-05, "loss": 0.3043, "step": 20300 }, { "epoch": 282.0, "eval_loss": 0.6104644536972046, "eval_runtime": 129.3839, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.21874397377386384, "step": 20304 }, { "epoch": 282.08, "learning_rate": 1.7944000000000003e-05, "loss": 0.3069, "step": 20310 }, { "epoch": 282.22, "learning_rate": 1.793257142857143e-05, "loss": 0.3013, "step": 20320 }, { "epoch": 282.36, "learning_rate": 1.792114285714286e-05, "loss": 0.2964, "step": 20330 }, { "epoch": 282.5, "learning_rate": 1.7909714285714287e-05, "loss": 0.3043, "step": 20340 }, { "epoch": 282.64, "learning_rate": 1.7898285714285713e-05, "loss": 0.3069, "step": 20350 }, { "epoch": 282.78, "learning_rate": 1.7886857142857144e-05, "loss": 0.3086, "step": 20360 }, { "epoch": 282.91, "learning_rate": 1.7875428571428574e-05, "loss": 0.3007, "step": 20370 }, { "epoch": 283.0, "eval_loss": 0.610522449016571, "eval_runtime": 129.0879, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.22125088384649996, "step": 20376 }, { "epoch": 283.06, "learning_rate": 1.7864e-05, "loss": 0.3115, "step": 20380 }, { "epoch": 283.19, "learning_rate": 1.785257142857143e-05, "loss": 0.3151, "step": 20390 }, { "epoch": 283.33, "learning_rate": 1.784114285714286e-05, "loss": 0.2998, "step": 20400 }, { "epoch": 283.47, "learning_rate": 1.7829714285714287e-05, "loss": 0.3035, "step": 20410 }, { "epoch": 283.61, "learning_rate": 1.7818285714285718e-05, "loss": 0.2938, "step": 20420 }, { "epoch": 283.75, "learning_rate": 1.7806857142857144e-05, "loss": 0.3108, "step": 20430 }, { "epoch": 283.89, "learning_rate": 1.779542857142857e-05, "loss": 0.3023, "step": 20440 }, { "epoch": 284.0, "eval_loss": 0.6011126637458801, "eval_runtime": 129.5594, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.22324355595551842, "step": 20448 }, { "epoch": 284.03, "learning_rate": 1.7784e-05, "loss": 0.3029, "step": 20450 }, { "epoch": 284.17, "learning_rate": 1.777257142857143e-05, "loss": 0.3071, "step": 20460 }, { "epoch": 284.3, "learning_rate": 1.7761142857142858e-05, "loss": 0.297, "step": 20470 }, { "epoch": 284.44, "learning_rate": 1.7749714285714288e-05, "loss": 0.3101, "step": 20480 }, { "epoch": 284.58, "learning_rate": 1.773828571428572e-05, "loss": 0.308, "step": 20490 }, { "epoch": 284.72, "learning_rate": 1.7726857142857145e-05, "loss": 0.2999, "step": 20500 }, { "epoch": 284.86, "learning_rate": 1.7715428571428572e-05, "loss": 0.2931, "step": 20510 }, { "epoch": 285.0, "learning_rate": 1.7704000000000002e-05, "loss": 0.3062, "step": 20520 }, { "epoch": 285.0, "eval_loss": 0.5966695547103882, "eval_runtime": 129.3214, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.21951533071929036, "step": 20520 }, { "epoch": 285.14, "learning_rate": 1.769257142857143e-05, "loss": 0.3036, "step": 20530 }, { "epoch": 285.28, "learning_rate": 1.768114285714286e-05, "loss": 0.3011, "step": 20540 }, { "epoch": 285.42, "learning_rate": 1.766971428571429e-05, "loss": 0.3018, "step": 20550 }, { "epoch": 285.55, "learning_rate": 1.7658285714285716e-05, "loss": 0.2916, "step": 20560 }, { "epoch": 285.69, "learning_rate": 1.7646857142857142e-05, "loss": 0.3058, "step": 20570 }, { "epoch": 285.83, "learning_rate": 1.7635428571428573e-05, "loss": 0.2924, "step": 20580 }, { "epoch": 285.97, "learning_rate": 1.7624000000000003e-05, "loss": 0.3093, "step": 20590 }, { "epoch": 286.0, "eval_loss": 0.6570582985877991, "eval_runtime": 129.4623, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.518, "eval_wer": 0.22575046602815452, "step": 20592 }, { "epoch": 286.11, "learning_rate": 1.761257142857143e-05, "loss": 0.3047, "step": 20600 }, { "epoch": 286.25, "learning_rate": 1.760114285714286e-05, "loss": 0.3103, "step": 20610 }, { "epoch": 286.39, "learning_rate": 1.7589714285714286e-05, "loss": 0.3119, "step": 20620 }, { "epoch": 286.53, "learning_rate": 1.7578285714285716e-05, "loss": 0.3133, "step": 20630 }, { "epoch": 286.66, "learning_rate": 1.7566857142857143e-05, "loss": 0.2989, "step": 20640 }, { "epoch": 286.8, "learning_rate": 1.7555428571428573e-05, "loss": 0.3056, "step": 20650 }, { "epoch": 286.94, "learning_rate": 1.7544e-05, "loss": 0.3041, "step": 20660 }, { "epoch": 287.0, "eval_loss": 0.595576822757721, "eval_runtime": 128.9293, "eval_samples_per_second": 4.126, "eval_steps_per_second": 0.52, "eval_wer": 0.22131516359195216, "step": 20664 }, { "epoch": 287.08, "learning_rate": 1.753257142857143e-05, "loss": 0.3075, "step": 20670 }, { "epoch": 287.22, "learning_rate": 1.752114285714286e-05, "loss": 0.306, "step": 20680 }, { "epoch": 287.36, "learning_rate": 1.7509714285714287e-05, "loss": 0.303, "step": 20690 }, { "epoch": 287.5, "learning_rate": 1.7498285714285717e-05, "loss": 0.3041, "step": 20700 }, { "epoch": 287.64, "learning_rate": 1.7486857142857144e-05, "loss": 0.3023, "step": 20710 }, { "epoch": 287.78, "learning_rate": 1.747542857142857e-05, "loss": 0.3007, "step": 20720 }, { "epoch": 287.91, "learning_rate": 1.7464e-05, "loss": 0.3083, "step": 20730 }, { "epoch": 288.0, "eval_loss": 0.5903686881065369, "eval_runtime": 129.2949, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22530050780998906, "step": 20736 }, { "epoch": 288.06, "learning_rate": 1.745257142857143e-05, "loss": 0.3101, "step": 20740 }, { "epoch": 288.19, "learning_rate": 1.7441142857142858e-05, "loss": 0.3073, "step": 20750 }, { "epoch": 288.33, "learning_rate": 1.7429714285714288e-05, "loss": 0.3024, "step": 20760 }, { "epoch": 288.47, "learning_rate": 1.7418285714285718e-05, "loss": 0.3092, "step": 20770 }, { "epoch": 288.61, "learning_rate": 1.7406857142857145e-05, "loss": 0.3032, "step": 20780 }, { "epoch": 288.75, "learning_rate": 1.739542857142857e-05, "loss": 0.3204, "step": 20790 }, { "epoch": 288.89, "learning_rate": 1.7384e-05, "loss": 0.3037, "step": 20800 }, { "epoch": 289.0, "eval_loss": 0.6096267700195312, "eval_runtime": 128.9555, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.52, "eval_wer": 0.22947869126438258, "step": 20808 }, { "epoch": 289.03, "learning_rate": 1.737257142857143e-05, "loss": 0.3156, "step": 20810 }, { "epoch": 289.17, "learning_rate": 1.736114285714286e-05, "loss": 0.2958, "step": 20820 }, { "epoch": 289.3, "learning_rate": 1.734971428571429e-05, "loss": 0.2933, "step": 20830 }, { "epoch": 289.44, "learning_rate": 1.7338285714285715e-05, "loss": 0.3063, "step": 20840 }, { "epoch": 289.58, "learning_rate": 1.7326857142857145e-05, "loss": 0.2996, "step": 20850 }, { "epoch": 289.72, "learning_rate": 1.7315428571428572e-05, "loss": 0.3081, "step": 20860 }, { "epoch": 289.86, "learning_rate": 1.7304000000000002e-05, "loss": 0.3092, "step": 20870 }, { "epoch": 290.0, "learning_rate": 1.729257142857143e-05, "loss": 0.3064, "step": 20880 }, { "epoch": 290.0, "eval_loss": 0.5958283543586731, "eval_runtime": 129.2744, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22324355595551842, "step": 20880 }, { "epoch": 290.14, "learning_rate": 1.728114285714286e-05, "loss": 0.2969, "step": 20890 }, { "epoch": 290.28, "learning_rate": 1.7269714285714286e-05, "loss": 0.2998, "step": 20900 }, { "epoch": 290.42, "learning_rate": 1.7258285714285716e-05, "loss": 0.2991, "step": 20910 }, { "epoch": 290.55, "learning_rate": 1.7246857142857146e-05, "loss": 0.2952, "step": 20920 }, { "epoch": 290.69, "learning_rate": 1.7235428571428573e-05, "loss": 0.3029, "step": 20930 }, { "epoch": 290.83, "learning_rate": 1.7224e-05, "loss": 0.2941, "step": 20940 }, { "epoch": 290.97, "learning_rate": 1.721257142857143e-05, "loss": 0.3136, "step": 20950 }, { "epoch": 291.0, "eval_loss": 0.6134020090103149, "eval_runtime": 129.4557, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.22497910908272803, "step": 20952 }, { "epoch": 291.11, "learning_rate": 1.720114285714286e-05, "loss": 0.3056, "step": 20960 }, { "epoch": 291.25, "learning_rate": 1.7189714285714287e-05, "loss": 0.3085, "step": 20970 }, { "epoch": 291.39, "learning_rate": 1.7178285714285717e-05, "loss": 0.3002, "step": 20980 }, { "epoch": 291.53, "learning_rate": 1.7166857142857144e-05, "loss": 0.3021, "step": 20990 }, { "epoch": 291.66, "learning_rate": 1.715542857142857e-05, "loss": 0.306, "step": 21000 }, { "epoch": 291.8, "learning_rate": 1.7144e-05, "loss": 0.3049, "step": 21010 }, { "epoch": 291.94, "learning_rate": 1.713257142857143e-05, "loss": 0.3042, "step": 21020 }, { "epoch": 292.0, "eval_loss": 0.6144478917121887, "eval_runtime": 130.1858, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.21893681301022047, "step": 21024 }, { "epoch": 292.08, "learning_rate": 1.7121142857142857e-05, "loss": 0.3045, "step": 21030 }, { "epoch": 292.22, "learning_rate": 1.7109714285714288e-05, "loss": 0.3017, "step": 21040 }, { "epoch": 292.36, "learning_rate": 1.7098285714285718e-05, "loss": 0.2991, "step": 21050 }, { "epoch": 292.5, "learning_rate": 1.7086857142857144e-05, "loss": 0.3024, "step": 21060 }, { "epoch": 292.64, "learning_rate": 1.7075428571428575e-05, "loss": 0.3005, "step": 21070 }, { "epoch": 292.78, "learning_rate": 1.7064e-05, "loss": 0.3002, "step": 21080 }, { "epoch": 292.91, "learning_rate": 1.7052571428571428e-05, "loss": 0.2967, "step": 21090 }, { "epoch": 293.0, "eval_loss": 0.6086431741714478, "eval_runtime": 128.9622, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.52, "eval_wer": 0.22819309635533844, "step": 21096 }, { "epoch": 293.06, "learning_rate": 1.7041142857142858e-05, "loss": 0.3035, "step": 21100 }, { "epoch": 293.19, "learning_rate": 1.7029714285714288e-05, "loss": 0.3012, "step": 21110 }, { "epoch": 293.33, "learning_rate": 1.7018285714285715e-05, "loss": 0.2918, "step": 21120 }, { "epoch": 293.47, "learning_rate": 1.7006857142857145e-05, "loss": 0.3158, "step": 21130 }, { "epoch": 293.61, "learning_rate": 1.6995428571428575e-05, "loss": 0.2745, "step": 21140 }, { "epoch": 293.75, "learning_rate": 1.6984000000000002e-05, "loss": 0.2944, "step": 21150 }, { "epoch": 293.89, "learning_rate": 1.697257142857143e-05, "loss": 0.2952, "step": 21160 }, { "epoch": 294.0, "eval_loss": 0.6178327202796936, "eval_runtime": 129.5227, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22845021533714727, "step": 21168 }, { "epoch": 294.03, "learning_rate": 1.696114285714286e-05, "loss": 0.3098, "step": 21170 }, { "epoch": 294.17, "learning_rate": 1.6949714285714286e-05, "loss": 0.3097, "step": 21180 }, { "epoch": 294.3, "learning_rate": 1.6938285714285716e-05, "loss": 0.3034, "step": 21190 }, { "epoch": 294.44, "learning_rate": 1.6926857142857146e-05, "loss": 0.301, "step": 21200 }, { "epoch": 294.58, "learning_rate": 1.6915428571428573e-05, "loss": 0.2944, "step": 21210 }, { "epoch": 294.72, "learning_rate": 1.6904e-05, "loss": 0.3093, "step": 21220 }, { "epoch": 294.86, "learning_rate": 1.689257142857143e-05, "loss": 0.3082, "step": 21230 }, { "epoch": 295.0, "learning_rate": 1.688114285714286e-05, "loss": 0.301, "step": 21240 }, { "epoch": 295.0, "eval_loss": 0.5923818945884705, "eval_runtime": 130.2972, "eval_samples_per_second": 4.083, "eval_steps_per_second": 0.514, "eval_wer": 0.21893681301022047, "step": 21240 }, { "epoch": 295.14, "learning_rate": 1.6869714285714286e-05, "loss": 0.3083, "step": 21250 }, { "epoch": 295.28, "learning_rate": 1.6858285714285717e-05, "loss": 0.2986, "step": 21260 }, { "epoch": 295.42, "learning_rate": 1.6846857142857143e-05, "loss": 0.2978, "step": 21270 }, { "epoch": 295.55, "learning_rate": 1.6835428571428573e-05, "loss": 0.2985, "step": 21280 }, { "epoch": 295.69, "learning_rate": 1.6824e-05, "loss": 0.2963, "step": 21290 }, { "epoch": 295.83, "learning_rate": 1.681257142857143e-05, "loss": 0.2917, "step": 21300 }, { "epoch": 295.97, "learning_rate": 1.6801142857142857e-05, "loss": 0.3058, "step": 21310 }, { "epoch": 296.0, "eval_loss": 0.6031795144081116, "eval_runtime": 129.2463, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.21925821173748153, "step": 21312 }, { "epoch": 296.11, "learning_rate": 1.6789714285714287e-05, "loss": 0.2964, "step": 21320 }, { "epoch": 296.25, "learning_rate": 1.6778285714285717e-05, "loss": 0.294, "step": 21330 }, { "epoch": 296.39, "learning_rate": 1.6766857142857144e-05, "loss": 0.2981, "step": 21340 }, { "epoch": 296.53, "learning_rate": 1.6755428571428574e-05, "loss": 0.2955, "step": 21350 }, { "epoch": 296.66, "learning_rate": 1.6744e-05, "loss": 0.2938, "step": 21360 }, { "epoch": 296.8, "learning_rate": 1.6732571428571428e-05, "loss": 0.289, "step": 21370 }, { "epoch": 296.94, "learning_rate": 1.6721142857142858e-05, "loss": 0.2983, "step": 21380 }, { "epoch": 297.0, "eval_loss": 0.5822866559028625, "eval_runtime": 129.849, "eval_samples_per_second": 4.097, "eval_steps_per_second": 0.516, "eval_wer": 0.2182940155556984, "step": 21384 }, { "epoch": 297.08, "learning_rate": 1.6709714285714288e-05, "loss": 0.3014, "step": 21390 }, { "epoch": 297.22, "learning_rate": 1.6698285714285715e-05, "loss": 0.298, "step": 21400 }, { "epoch": 297.36, "learning_rate": 1.6686857142857145e-05, "loss": 0.2825, "step": 21410 }, { "epoch": 297.5, "learning_rate": 1.6675428571428575e-05, "loss": 0.2908, "step": 21420 }, { "epoch": 297.64, "learning_rate": 1.6664000000000002e-05, "loss": 0.2937, "step": 21430 }, { "epoch": 297.78, "learning_rate": 1.665257142857143e-05, "loss": 0.2961, "step": 21440 }, { "epoch": 297.91, "learning_rate": 1.664114285714286e-05, "loss": 0.2793, "step": 21450 }, { "epoch": 298.0, "eval_loss": 0.5929964780807495, "eval_runtime": 130.2429, "eval_samples_per_second": 4.085, "eval_steps_per_second": 0.514, "eval_wer": 0.21951533071929036, "step": 21456 }, { "epoch": 298.06, "learning_rate": 1.6629714285714285e-05, "loss": 0.3135, "step": 21460 }, { "epoch": 298.19, "learning_rate": 1.6618285714285715e-05, "loss": 0.3, "step": 21470 }, { "epoch": 298.33, "learning_rate": 1.6606857142857146e-05, "loss": 0.2834, "step": 21480 }, { "epoch": 298.47, "learning_rate": 1.6595428571428572e-05, "loss": 0.2932, "step": 21490 }, { "epoch": 298.61, "learning_rate": 1.6584000000000002e-05, "loss": 0.2971, "step": 21500 }, { "epoch": 298.75, "learning_rate": 1.657257142857143e-05, "loss": 0.2982, "step": 21510 }, { "epoch": 298.89, "learning_rate": 1.656114285714286e-05, "loss": 0.2936, "step": 21520 }, { "epoch": 299.0, "eval_loss": 0.6165506839752197, "eval_runtime": 130.1005, "eval_samples_per_second": 4.089, "eval_steps_per_second": 0.515, "eval_wer": 0.2215080028283088, "step": 21528 }, { "epoch": 299.03, "learning_rate": 1.6549714285714286e-05, "loss": 0.308, "step": 21530 }, { "epoch": 299.17, "learning_rate": 1.6538285714285716e-05, "loss": 0.2923, "step": 21540 }, { "epoch": 299.3, "learning_rate": 1.6526857142857143e-05, "loss": 0.2898, "step": 21550 }, { "epoch": 299.44, "learning_rate": 1.6515428571428573e-05, "loss": 0.3078, "step": 21560 }, { "epoch": 299.58, "learning_rate": 1.6504000000000003e-05, "loss": 0.2902, "step": 21570 }, { "epoch": 299.72, "learning_rate": 1.649257142857143e-05, "loss": 0.2953, "step": 21580 }, { "epoch": 299.86, "learning_rate": 1.6481142857142857e-05, "loss": 0.2923, "step": 21590 }, { "epoch": 300.0, "learning_rate": 1.6469714285714287e-05, "loss": 0.298, "step": 21600 }, { "epoch": 300.0, "eval_loss": 0.5864111185073853, "eval_runtime": 129.999, "eval_samples_per_second": 4.092, "eval_steps_per_second": 0.515, "eval_wer": 0.2159156649739667, "step": 21600 }, { "epoch": 300.14, "learning_rate": 1.6458285714285717e-05, "loss": 0.2839, "step": 21610 }, { "epoch": 300.28, "learning_rate": 1.6446857142857144e-05, "loss": 0.2902, "step": 21620 }, { "epoch": 300.42, "learning_rate": 1.6435428571428574e-05, "loss": 0.2991, "step": 21630 }, { "epoch": 300.55, "learning_rate": 1.6424e-05, "loss": 0.293, "step": 21640 }, { "epoch": 300.69, "learning_rate": 1.6412571428571427e-05, "loss": 0.2972, "step": 21650 }, { "epoch": 300.83, "learning_rate": 1.6401142857142858e-05, "loss": 0.2893, "step": 21660 }, { "epoch": 300.97, "learning_rate": 1.6389714285714288e-05, "loss": 0.2949, "step": 21670 }, { "epoch": 301.0, "eval_loss": 0.6049138307571411, "eval_runtime": 129.795, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.21597994471941892, "step": 21672 }, { "epoch": 301.11, "learning_rate": 1.6378285714285714e-05, "loss": 0.2858, "step": 21680 }, { "epoch": 301.25, "learning_rate": 1.6366857142857145e-05, "loss": 0.2955, "step": 21690 }, { "epoch": 301.39, "learning_rate": 1.6355428571428575e-05, "loss": 0.2849, "step": 21700 }, { "epoch": 301.53, "learning_rate": 1.6344e-05, "loss": 0.2876, "step": 21710 }, { "epoch": 301.66, "learning_rate": 1.633257142857143e-05, "loss": 0.2953, "step": 21720 }, { "epoch": 301.8, "learning_rate": 1.6321142857142858e-05, "loss": 0.2881, "step": 21730 }, { "epoch": 301.94, "learning_rate": 1.6309714285714285e-05, "loss": 0.2948, "step": 21740 }, { "epoch": 302.0, "eval_loss": 0.5745234489440918, "eval_runtime": 130.5994, "eval_samples_per_second": 4.074, "eval_steps_per_second": 0.513, "eval_wer": 0.21732981937391527, "step": 21744 }, { "epoch": 302.08, "learning_rate": 1.6298285714285715e-05, "loss": 0.2929, "step": 21750 }, { "epoch": 302.22, "learning_rate": 1.6286857142857145e-05, "loss": 0.3012, "step": 21760 }, { "epoch": 302.36, "learning_rate": 1.6275428571428572e-05, "loss": 0.2864, "step": 21770 }, { "epoch": 302.5, "learning_rate": 1.6264000000000002e-05, "loss": 0.2966, "step": 21780 }, { "epoch": 302.64, "learning_rate": 1.6252571428571432e-05, "loss": 0.292, "step": 21790 }, { "epoch": 302.78, "learning_rate": 1.624114285714286e-05, "loss": 0.282, "step": 21800 }, { "epoch": 302.91, "learning_rate": 1.6229714285714286e-05, "loss": 0.2809, "step": 21810 }, { "epoch": 303.0, "eval_loss": 0.5698898434638977, "eval_runtime": 129.7461, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.21732981937391527, "step": 21816 }, { "epoch": 303.06, "learning_rate": 1.6218285714285716e-05, "loss": 0.3008, "step": 21820 }, { "epoch": 303.19, "learning_rate": 1.6206857142857143e-05, "loss": 0.2856, "step": 21830 }, { "epoch": 303.33, "learning_rate": 1.6195428571428573e-05, "loss": 0.2935, "step": 21840 }, { "epoch": 303.47, "learning_rate": 1.6184000000000003e-05, "loss": 0.2954, "step": 21850 }, { "epoch": 303.61, "learning_rate": 1.617257142857143e-05, "loss": 0.2721, "step": 21860 }, { "epoch": 303.75, "learning_rate": 1.6161142857142856e-05, "loss": 0.2837, "step": 21870 }, { "epoch": 303.89, "learning_rate": 1.6149714285714287e-05, "loss": 0.2854, "step": 21880 }, { "epoch": 304.0, "eval_loss": 0.5894419550895691, "eval_runtime": 131.6383, "eval_samples_per_second": 4.041, "eval_steps_per_second": 0.509, "eval_wer": 0.22433631162820594, "step": 21888 }, { "epoch": 304.03, "learning_rate": 1.6138285714285717e-05, "loss": 0.2938, "step": 21890 }, { "epoch": 304.17, "learning_rate": 1.6126857142857143e-05, "loss": 0.2903, "step": 21900 }, { "epoch": 304.3, "learning_rate": 1.6115428571428574e-05, "loss": 0.2797, "step": 21910 }, { "epoch": 304.44, "learning_rate": 1.6104e-05, "loss": 0.2832, "step": 21920 }, { "epoch": 304.58, "learning_rate": 1.609257142857143e-05, "loss": 0.2913, "step": 21930 }, { "epoch": 304.72, "learning_rate": 1.6081142857142857e-05, "loss": 0.2961, "step": 21940 }, { "epoch": 304.86, "learning_rate": 1.6069714285714287e-05, "loss": 0.2738, "step": 21950 }, { "epoch": 305.0, "learning_rate": 1.6058285714285714e-05, "loss": 0.2908, "step": 21960 }, { "epoch": 305.0, "eval_loss": 0.6123014688491821, "eval_runtime": 129.3073, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.22285787748280517, "step": 21960 }, { "epoch": 305.14, "learning_rate": 1.6046857142857144e-05, "loss": 0.2849, "step": 21970 }, { "epoch": 305.28, "learning_rate": 1.6035428571428574e-05, "loss": 0.3271, "step": 21980 }, { "epoch": 305.42, "learning_rate": 1.6024e-05, "loss": 0.2845, "step": 21990 }, { "epoch": 305.55, "learning_rate": 1.601257142857143e-05, "loss": 0.2795, "step": 22000 }, { "epoch": 305.69, "learning_rate": 1.6001142857142858e-05, "loss": 0.2947, "step": 22010 }, { "epoch": 305.83, "learning_rate": 1.5989714285714285e-05, "loss": 0.2782, "step": 22020 }, { "epoch": 305.97, "learning_rate": 1.5978285714285715e-05, "loss": 0.2948, "step": 22030 }, { "epoch": 306.0, "eval_loss": 0.5965629816055298, "eval_runtime": 131.1634, "eval_samples_per_second": 4.056, "eval_steps_per_second": 0.511, "eval_wer": 0.21623706370122775, "step": 22032 }, { "epoch": 306.11, "learning_rate": 1.5966857142857145e-05, "loss": 0.2868, "step": 22040 }, { "epoch": 306.25, "learning_rate": 1.5955428571428572e-05, "loss": 0.2893, "step": 22050 }, { "epoch": 306.39, "learning_rate": 1.5944000000000002e-05, "loss": 0.2852, "step": 22060 }, { "epoch": 306.53, "learning_rate": 1.5932571428571432e-05, "loss": 0.2917, "step": 22070 }, { "epoch": 306.66, "learning_rate": 1.592114285714286e-05, "loss": 0.2786, "step": 22080 }, { "epoch": 306.8, "learning_rate": 1.5909714285714285e-05, "loss": 0.2797, "step": 22090 }, { "epoch": 306.94, "learning_rate": 1.5898285714285716e-05, "loss": 0.2997, "step": 22100 }, { "epoch": 307.0, "eval_loss": 0.6029682755470276, "eval_runtime": 129.353, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.21803689657388955, "step": 22104 }, { "epoch": 307.08, "learning_rate": 1.5886857142857142e-05, "loss": 0.2931, "step": 22110 }, { "epoch": 307.22, "learning_rate": 1.5875428571428572e-05, "loss": 0.2888, "step": 22120 }, { "epoch": 307.36, "learning_rate": 1.5864000000000003e-05, "loss": 0.2804, "step": 22130 }, { "epoch": 307.5, "learning_rate": 1.585257142857143e-05, "loss": 0.2763, "step": 22140 }, { "epoch": 307.64, "learning_rate": 1.584114285714286e-05, "loss": 0.2896, "step": 22150 }, { "epoch": 307.78, "learning_rate": 1.5829714285714286e-05, "loss": 0.2849, "step": 22160 }, { "epoch": 307.91, "learning_rate": 1.5818285714285716e-05, "loss": 0.2906, "step": 22170 }, { "epoch": 308.0, "eval_loss": 0.5919510722160339, "eval_runtime": 131.7655, "eval_samples_per_second": 4.037, "eval_steps_per_second": 0.508, "eval_wer": 0.218486854792055, "step": 22176 }, { "epoch": 308.06, "learning_rate": 1.5806857142857143e-05, "loss": 0.2882, "step": 22180 }, { "epoch": 308.19, "learning_rate": 1.5795428571428573e-05, "loss": 0.2911, "step": 22190 }, { "epoch": 308.33, "learning_rate": 1.5784e-05, "loss": 0.2791, "step": 22200 }, { "epoch": 308.47, "learning_rate": 1.577257142857143e-05, "loss": 0.2941, "step": 22210 }, { "epoch": 308.61, "learning_rate": 1.576114285714286e-05, "loss": 0.2811, "step": 22220 }, { "epoch": 308.75, "learning_rate": 1.5749714285714287e-05, "loss": 0.2787, "step": 22230 }, { "epoch": 308.89, "learning_rate": 1.5738285714285714e-05, "loss": 0.2778, "step": 22240 }, { "epoch": 309.0, "eval_loss": 0.5913086533546448, "eval_runtime": 129.5588, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.21205888024683422, "step": 22248 }, { "epoch": 309.03, "learning_rate": 1.5726857142857144e-05, "loss": 0.2808, "step": 22250 }, { "epoch": 309.17, "learning_rate": 1.5715428571428574e-05, "loss": 0.2789, "step": 22260 }, { "epoch": 309.3, "learning_rate": 1.5704e-05, "loss": 0.2894, "step": 22270 }, { "epoch": 309.44, "learning_rate": 1.569257142857143e-05, "loss": 0.2889, "step": 22280 }, { "epoch": 309.58, "learning_rate": 1.5681142857142858e-05, "loss": 0.2791, "step": 22290 }, { "epoch": 309.72, "learning_rate": 1.5669714285714288e-05, "loss": 0.2831, "step": 22300 }, { "epoch": 309.86, "learning_rate": 1.5658285714285715e-05, "loss": 0.2786, "step": 22310 }, { "epoch": 310.0, "learning_rate": 1.5646857142857145e-05, "loss": 0.281, "step": 22320 }, { "epoch": 310.0, "eval_loss": 0.6019668579101562, "eval_runtime": 129.7468, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.21205888024683422, "step": 22320 }, { "epoch": 310.14, "learning_rate": 1.563542857142857e-05, "loss": 0.2931, "step": 22330 }, { "epoch": 310.28, "learning_rate": 1.5624e-05, "loss": 0.2832, "step": 22340 }, { "epoch": 310.42, "learning_rate": 1.561257142857143e-05, "loss": 0.2854, "step": 22350 }, { "epoch": 310.55, "learning_rate": 1.560114285714286e-05, "loss": 0.2888, "step": 22360 }, { "epoch": 310.69, "learning_rate": 1.558971428571429e-05, "loss": 0.2949, "step": 22370 }, { "epoch": 310.83, "learning_rate": 1.5578285714285715e-05, "loss": 0.2913, "step": 22380 }, { "epoch": 310.97, "learning_rate": 1.5566857142857142e-05, "loss": 0.2852, "step": 22390 }, { "epoch": 311.0, "eval_loss": 0.5814172029495239, "eval_runtime": 129.0045, "eval_samples_per_second": 4.124, "eval_steps_per_second": 0.519, "eval_wer": 0.21700842064665424, "step": 22392 }, { "epoch": 311.11, "learning_rate": 1.5555428571428572e-05, "loss": 0.2857, "step": 22400 }, { "epoch": 311.25, "learning_rate": 1.5545142857142858e-05, "loss": 0.2817, "step": 22410 }, { "epoch": 311.39, "learning_rate": 1.5533714285714288e-05, "loss": 0.2844, "step": 22420 }, { "epoch": 311.53, "learning_rate": 1.5522285714285718e-05, "loss": 0.288, "step": 22430 }, { "epoch": 311.66, "learning_rate": 1.5510857142857145e-05, "loss": 0.2844, "step": 22440 }, { "epoch": 311.8, "learning_rate": 1.549942857142857e-05, "loss": 0.2798, "step": 22450 }, { "epoch": 311.94, "learning_rate": 1.5488e-05, "loss": 0.278, "step": 22460 }, { "epoch": 312.0, "eval_loss": 0.5930659770965576, "eval_runtime": 129.3086, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2151443080285402, "step": 22464 }, { "epoch": 312.08, "learning_rate": 1.5476571428571428e-05, "loss": 0.2765, "step": 22470 }, { "epoch": 312.22, "learning_rate": 1.546514285714286e-05, "loss": 0.2907, "step": 22480 }, { "epoch": 312.36, "learning_rate": 1.545371428571429e-05, "loss": 0.2736, "step": 22490 }, { "epoch": 312.5, "learning_rate": 1.5442285714285715e-05, "loss": 0.2791, "step": 22500 }, { "epoch": 312.64, "learning_rate": 1.5430857142857145e-05, "loss": 0.2822, "step": 22510 }, { "epoch": 312.78, "learning_rate": 1.5419428571428572e-05, "loss": 0.2711, "step": 22520 }, { "epoch": 312.91, "learning_rate": 1.5408000000000002e-05, "loss": 0.2743, "step": 22530 }, { "epoch": 313.0, "eval_loss": 0.6072708964347839, "eval_runtime": 129.5149, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.21790833708298515, "step": 22536 }, { "epoch": 313.06, "learning_rate": 1.539657142857143e-05, "loss": 0.282, "step": 22540 }, { "epoch": 313.19, "learning_rate": 1.538514285714286e-05, "loss": 0.2743, "step": 22550 }, { "epoch": 313.33, "learning_rate": 1.5373714285714286e-05, "loss": 0.2743, "step": 22560 }, { "epoch": 313.47, "learning_rate": 1.5362285714285716e-05, "loss": 0.2839, "step": 22570 }, { "epoch": 313.61, "learning_rate": 1.5350857142857146e-05, "loss": 0.2809, "step": 22580 }, { "epoch": 313.75, "learning_rate": 1.5339428571428573e-05, "loss": 0.2666, "step": 22590 }, { "epoch": 313.89, "learning_rate": 1.5328e-05, "loss": 0.2757, "step": 22600 }, { "epoch": 314.0, "eval_loss": 0.6173780560493469, "eval_runtime": 132.4093, "eval_samples_per_second": 4.018, "eval_steps_per_second": 0.506, "eval_wer": 0.21533714726489683, "step": 22608 }, { "epoch": 314.03, "learning_rate": 1.531657142857143e-05, "loss": 0.2951, "step": 22610 }, { "epoch": 314.17, "learning_rate": 1.530514285714286e-05, "loss": 0.2744, "step": 22620 }, { "epoch": 314.3, "learning_rate": 1.5293714285714287e-05, "loss": 0.2894, "step": 22630 }, { "epoch": 314.44, "learning_rate": 1.5282285714285717e-05, "loss": 0.2812, "step": 22640 }, { "epoch": 314.58, "learning_rate": 1.5270857142857143e-05, "loss": 0.2777, "step": 22650 }, { "epoch": 314.72, "learning_rate": 1.525942857142857e-05, "loss": 0.2815, "step": 22660 }, { "epoch": 314.86, "learning_rate": 1.5248e-05, "loss": 0.2782, "step": 22670 }, { "epoch": 315.0, "learning_rate": 1.5236571428571429e-05, "loss": 0.2907, "step": 22680 }, { "epoch": 315.0, "eval_loss": 0.5729448199272156, "eval_runtime": 132.1121, "eval_samples_per_second": 4.027, "eval_steps_per_second": 0.507, "eval_wer": 0.21707270039210644, "step": 22680 }, { "epoch": 315.14, "learning_rate": 1.5225142857142859e-05, "loss": 0.2819, "step": 22690 }, { "epoch": 315.28, "learning_rate": 1.5213714285714287e-05, "loss": 0.2797, "step": 22700 }, { "epoch": 315.42, "learning_rate": 1.5202285714285716e-05, "loss": 0.2779, "step": 22710 }, { "epoch": 315.55, "learning_rate": 1.5190857142857144e-05, "loss": 0.2733, "step": 22720 }, { "epoch": 315.69, "learning_rate": 1.5179428571428571e-05, "loss": 0.2799, "step": 22730 }, { "epoch": 315.83, "learning_rate": 1.5168000000000001e-05, "loss": 0.2812, "step": 22740 }, { "epoch": 315.97, "learning_rate": 1.515657142857143e-05, "loss": 0.2801, "step": 22750 }, { "epoch": 316.0, "eval_loss": 0.6014477610588074, "eval_runtime": 130.9356, "eval_samples_per_second": 4.063, "eval_steps_per_second": 0.512, "eval_wer": 0.2214437230828566, "step": 22752 }, { "epoch": 316.11, "learning_rate": 1.5145142857142858e-05, "loss": 0.2821, "step": 22760 }, { "epoch": 316.25, "learning_rate": 1.5133714285714286e-05, "loss": 0.2785, "step": 22770 }, { "epoch": 316.39, "learning_rate": 1.5122285714285717e-05, "loss": 0.2849, "step": 22780 }, { "epoch": 316.53, "learning_rate": 1.5110857142857145e-05, "loss": 0.2852, "step": 22790 }, { "epoch": 316.66, "learning_rate": 1.5099428571428573e-05, "loss": 0.2696, "step": 22800 }, { "epoch": 316.8, "learning_rate": 1.5088e-05, "loss": 0.2756, "step": 22810 }, { "epoch": 316.94, "learning_rate": 1.5076571428571429e-05, "loss": 0.2908, "step": 22820 }, { "epoch": 317.0, "eval_loss": 0.6097726821899414, "eval_runtime": 130.9595, "eval_samples_per_second": 4.062, "eval_steps_per_second": 0.512, "eval_wer": 0.21295879668316514, "step": 22824 }, { "epoch": 317.08, "learning_rate": 1.5065142857142859e-05, "loss": 0.2781, "step": 22830 }, { "epoch": 317.22, "learning_rate": 1.5053714285714287e-05, "loss": 0.2852, "step": 22840 }, { "epoch": 317.36, "learning_rate": 1.5042285714285716e-05, "loss": 0.2689, "step": 22850 }, { "epoch": 317.5, "learning_rate": 1.5030857142857144e-05, "loss": 0.2789, "step": 22860 }, { "epoch": 317.64, "learning_rate": 1.5019428571428574e-05, "loss": 0.2758, "step": 22870 }, { "epoch": 317.78, "learning_rate": 1.5008000000000001e-05, "loss": 0.2695, "step": 22880 }, { "epoch": 317.91, "learning_rate": 1.499657142857143e-05, "loss": 0.2824, "step": 22890 }, { "epoch": 318.0, "eval_loss": 0.5941612124443054, "eval_runtime": 130.3855, "eval_samples_per_second": 4.08, "eval_steps_per_second": 0.514, "eval_wer": 0.2191296522465771, "step": 22896 }, { "epoch": 318.06, "learning_rate": 1.4985142857142858e-05, "loss": 0.3016, "step": 22900 }, { "epoch": 318.19, "learning_rate": 1.4973714285714286e-05, "loss": 0.2708, "step": 22910 }, { "epoch": 318.33, "learning_rate": 1.4962285714285716e-05, "loss": 0.2703, "step": 22920 }, { "epoch": 318.47, "learning_rate": 1.4950857142857145e-05, "loss": 0.2833, "step": 22930 }, { "epoch": 318.61, "learning_rate": 1.4939428571428573e-05, "loss": 0.2808, "step": 22940 }, { "epoch": 318.75, "learning_rate": 1.4928e-05, "loss": 0.2796, "step": 22950 }, { "epoch": 318.89, "learning_rate": 1.4916571428571428e-05, "loss": 0.2799, "step": 22960 }, { "epoch": 319.0, "eval_loss": 0.6374025344848633, "eval_runtime": 130.485, "eval_samples_per_second": 4.077, "eval_steps_per_second": 0.513, "eval_wer": 0.2229864369737096, "step": 22968 }, { "epoch": 319.03, "learning_rate": 1.4905142857142859e-05, "loss": 0.2901, "step": 22970 }, { "epoch": 319.17, "learning_rate": 1.4893714285714287e-05, "loss": 0.287, "step": 22980 }, { "epoch": 319.3, "learning_rate": 1.4882285714285716e-05, "loss": 0.2774, "step": 22990 }, { "epoch": 319.44, "learning_rate": 1.4870857142857144e-05, "loss": 0.2753, "step": 23000 }, { "epoch": 319.58, "learning_rate": 1.4859428571428574e-05, "loss": 0.276, "step": 23010 }, { "epoch": 319.72, "learning_rate": 1.4848e-05, "loss": 0.2815, "step": 23020 }, { "epoch": 319.86, "learning_rate": 1.483657142857143e-05, "loss": 0.2768, "step": 23030 }, { "epoch": 320.0, "learning_rate": 1.4825142857142858e-05, "loss": 0.2725, "step": 23040 }, { "epoch": 320.0, "eval_loss": 0.6424130201339722, "eval_runtime": 130.37, "eval_samples_per_second": 4.081, "eval_steps_per_second": 0.514, "eval_wer": 0.22060808639197788, "step": 23040 }, { "epoch": 320.14, "learning_rate": 1.4813714285714286e-05, "loss": 0.2703, "step": 23050 }, { "epoch": 320.28, "learning_rate": 1.4802285714285716e-05, "loss": 0.264, "step": 23060 }, { "epoch": 320.42, "learning_rate": 1.4790857142857145e-05, "loss": 0.2782, "step": 23070 }, { "epoch": 320.55, "learning_rate": 1.4779428571428573e-05, "loss": 0.2845, "step": 23080 }, { "epoch": 320.69, "learning_rate": 1.4768e-05, "loss": 0.287, "step": 23090 }, { "epoch": 320.83, "learning_rate": 1.4756571428571428e-05, "loss": 0.2661, "step": 23100 }, { "epoch": 320.97, "learning_rate": 1.4745142857142858e-05, "loss": 0.2821, "step": 23110 }, { "epoch": 321.0, "eval_loss": 0.6464852094650269, "eval_runtime": 130.46, "eval_samples_per_second": 4.078, "eval_steps_per_second": 0.514, "eval_wer": 0.22028668766471685, "step": 23112 }, { "epoch": 321.11, "learning_rate": 1.4733714285714287e-05, "loss": 0.2744, "step": 23120 }, { "epoch": 321.25, "learning_rate": 1.4722285714285715e-05, "loss": 0.2901, "step": 23130 }, { "epoch": 321.39, "learning_rate": 1.4710857142857144e-05, "loss": 0.2659, "step": 23140 }, { "epoch": 321.53, "learning_rate": 1.4699428571428574e-05, "loss": 0.2843, "step": 23150 }, { "epoch": 321.66, "learning_rate": 1.4688000000000002e-05, "loss": 0.2845, "step": 23160 }, { "epoch": 321.8, "learning_rate": 1.4676571428571429e-05, "loss": 0.2721, "step": 23170 }, { "epoch": 321.94, "learning_rate": 1.4665142857142858e-05, "loss": 0.2795, "step": 23180 }, { "epoch": 322.0, "eval_loss": 0.616270124912262, "eval_runtime": 130.5648, "eval_samples_per_second": 4.075, "eval_steps_per_second": 0.513, "eval_wer": 0.21816545606479398, "step": 23184 }, { "epoch": 322.08, "learning_rate": 1.4653714285714286e-05, "loss": 0.275, "step": 23190 }, { "epoch": 322.22, "learning_rate": 1.4642285714285716e-05, "loss": 0.2877, "step": 23200 }, { "epoch": 322.36, "learning_rate": 1.4630857142857145e-05, "loss": 0.2788, "step": 23210 }, { "epoch": 322.5, "learning_rate": 1.4619428571428573e-05, "loss": 0.2778, "step": 23220 }, { "epoch": 322.64, "learning_rate": 1.4608000000000001e-05, "loss": 0.2653, "step": 23230 }, { "epoch": 322.78, "learning_rate": 1.4596571428571428e-05, "loss": 0.2789, "step": 23240 }, { "epoch": 322.91, "learning_rate": 1.4585142857142858e-05, "loss": 0.2764, "step": 23250 }, { "epoch": 323.0, "eval_loss": 0.6256516575813293, "eval_runtime": 130.37, "eval_samples_per_second": 4.081, "eval_steps_per_second": 0.514, "eval_wer": 0.22086520537378673, "step": 23256 }, { "epoch": 323.06, "learning_rate": 1.4573714285714287e-05, "loss": 0.2853, "step": 23260 }, { "epoch": 323.19, "learning_rate": 1.4562285714285715e-05, "loss": 0.2742, "step": 23270 }, { "epoch": 323.33, "learning_rate": 1.4550857142857144e-05, "loss": 0.2774, "step": 23280 }, { "epoch": 323.47, "learning_rate": 1.4539428571428574e-05, "loss": 0.2791, "step": 23290 }, { "epoch": 323.61, "learning_rate": 1.4528000000000002e-05, "loss": 0.2753, "step": 23300 }, { "epoch": 323.75, "learning_rate": 1.4516571428571429e-05, "loss": 0.2736, "step": 23310 }, { "epoch": 323.89, "learning_rate": 1.4505142857142857e-05, "loss": 0.2739, "step": 23320 }, { "epoch": 324.0, "eval_loss": 0.6373721361160278, "eval_runtime": 129.9479, "eval_samples_per_second": 4.094, "eval_steps_per_second": 0.516, "eval_wer": 0.21938677122838593, "step": 23328 }, { "epoch": 324.03, "learning_rate": 1.4493714285714286e-05, "loss": 0.284, "step": 23330 }, { "epoch": 324.17, "learning_rate": 1.4482285714285716e-05, "loss": 0.2843, "step": 23340 }, { "epoch": 324.3, "learning_rate": 1.4470857142857144e-05, "loss": 0.2701, "step": 23350 }, { "epoch": 324.44, "learning_rate": 1.4459428571428573e-05, "loss": 0.282, "step": 23360 }, { "epoch": 324.58, "learning_rate": 1.4448000000000001e-05, "loss": 0.2675, "step": 23370 }, { "epoch": 324.72, "learning_rate": 1.4436571428571428e-05, "loss": 0.2702, "step": 23380 }, { "epoch": 324.86, "learning_rate": 1.4425142857142858e-05, "loss": 0.2598, "step": 23390 }, { "epoch": 325.0, "learning_rate": 1.4413714285714287e-05, "loss": 0.2712, "step": 23400 }, { "epoch": 325.0, "eval_loss": 0.6227926015853882, "eval_runtime": 130.0901, "eval_samples_per_second": 4.089, "eval_steps_per_second": 0.515, "eval_wer": 0.21662274217394098, "step": 23400 }, { "epoch": 325.14, "learning_rate": 1.4402285714285715e-05, "loss": 0.2845, "step": 23410 }, { "epoch": 325.28, "learning_rate": 1.4390857142857143e-05, "loss": 0.2765, "step": 23420 }, { "epoch": 325.42, "learning_rate": 1.4379428571428574e-05, "loss": 0.2745, "step": 23430 }, { "epoch": 325.55, "learning_rate": 1.4368000000000002e-05, "loss": 0.27, "step": 23440 }, { "epoch": 325.69, "learning_rate": 1.435657142857143e-05, "loss": 0.2772, "step": 23450 }, { "epoch": 325.83, "learning_rate": 1.4345142857142857e-05, "loss": 0.2679, "step": 23460 }, { "epoch": 325.97, "learning_rate": 1.4333714285714286e-05, "loss": 0.275, "step": 23470 }, { "epoch": 326.0, "eval_loss": 0.6394278407096863, "eval_runtime": 131.0626, "eval_samples_per_second": 4.059, "eval_steps_per_second": 0.511, "eval_wer": 0.2214437230828566, "step": 23472 }, { "epoch": 326.11, "learning_rate": 1.4322285714285716e-05, "loss": 0.274, "step": 23480 }, { "epoch": 326.25, "learning_rate": 1.4310857142857144e-05, "loss": 0.2779, "step": 23490 }, { "epoch": 326.39, "learning_rate": 1.4299428571428573e-05, "loss": 0.2748, "step": 23500 }, { "epoch": 326.53, "learning_rate": 1.4288000000000001e-05, "loss": 0.269, "step": 23510 }, { "epoch": 326.66, "learning_rate": 1.4276571428571431e-05, "loss": 0.2715, "step": 23520 }, { "epoch": 326.8, "learning_rate": 1.4265142857142858e-05, "loss": 0.2685, "step": 23530 }, { "epoch": 326.94, "learning_rate": 1.4253714285714286e-05, "loss": 0.275, "step": 23540 }, { "epoch": 327.0, "eval_loss": 0.6359437108039856, "eval_runtime": 130.0575, "eval_samples_per_second": 4.09, "eval_steps_per_second": 0.515, "eval_wer": 0.22125088384649996, "step": 23544 }, { "epoch": 327.08, "learning_rate": 1.4242285714285715e-05, "loss": 0.2751, "step": 23550 }, { "epoch": 327.22, "learning_rate": 1.4230857142857143e-05, "loss": 0.2752, "step": 23560 }, { "epoch": 327.36, "learning_rate": 1.4219428571428573e-05, "loss": 0.26, "step": 23570 }, { "epoch": 327.5, "learning_rate": 1.4208000000000002e-05, "loss": 0.2732, "step": 23580 }, { "epoch": 327.64, "learning_rate": 1.419657142857143e-05, "loss": 0.2704, "step": 23590 }, { "epoch": 327.78, "learning_rate": 1.4185142857142857e-05, "loss": 0.271, "step": 23600 }, { "epoch": 327.91, "learning_rate": 1.4173714285714285e-05, "loss": 0.2702, "step": 23610 }, { "epoch": 328.0, "eval_loss": 0.6430283188819885, "eval_runtime": 130.0723, "eval_samples_per_second": 4.09, "eval_steps_per_second": 0.515, "eval_wer": 0.2207366458828823, "step": 23616 }, { "epoch": 328.06, "learning_rate": 1.4162285714285716e-05, "loss": 0.279, "step": 23620 }, { "epoch": 328.19, "learning_rate": 1.4150857142857144e-05, "loss": 0.2703, "step": 23630 }, { "epoch": 328.33, "learning_rate": 1.4139428571428572e-05, "loss": 0.2636, "step": 23640 }, { "epoch": 328.47, "learning_rate": 1.4128000000000001e-05, "loss": 0.277, "step": 23650 }, { "epoch": 328.61, "learning_rate": 1.4116571428571431e-05, "loss": 0.276, "step": 23660 }, { "epoch": 328.75, "learning_rate": 1.4105142857142858e-05, "loss": 0.2783, "step": 23670 }, { "epoch": 328.89, "learning_rate": 1.4093714285714286e-05, "loss": 0.2676, "step": 23680 }, { "epoch": 329.0, "eval_loss": 0.6320851445198059, "eval_runtime": 130.1867, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.21450151057401812, "step": 23688 }, { "epoch": 329.03, "learning_rate": 1.4082285714285715e-05, "loss": 0.2866, "step": 23690 }, { "epoch": 329.17, "learning_rate": 1.4070857142857143e-05, "loss": 0.2822, "step": 23700 }, { "epoch": 329.3, "learning_rate": 1.4059428571428573e-05, "loss": 0.2675, "step": 23710 }, { "epoch": 329.44, "learning_rate": 1.4048000000000002e-05, "loss": 0.2701, "step": 23720 }, { "epoch": 329.58, "learning_rate": 1.403657142857143e-05, "loss": 0.2727, "step": 23730 }, { "epoch": 329.72, "learning_rate": 1.4025142857142859e-05, "loss": 0.2834, "step": 23740 }, { "epoch": 329.86, "learning_rate": 1.4013714285714285e-05, "loss": 0.2735, "step": 23750 }, { "epoch": 330.0, "learning_rate": 1.4002285714285715e-05, "loss": 0.2735, "step": 23760 }, { "epoch": 330.0, "eval_loss": 0.6582525968551636, "eval_runtime": 130.2239, "eval_samples_per_second": 4.085, "eval_steps_per_second": 0.514, "eval_wer": 0.2167513016648454, "step": 23760 }, { "epoch": 330.14, "learning_rate": 1.3990857142857144e-05, "loss": 0.2831, "step": 23770 }, { "epoch": 330.28, "learning_rate": 1.3979428571428572e-05, "loss": 0.2681, "step": 23780 }, { "epoch": 330.42, "learning_rate": 1.3968e-05, "loss": 0.2866, "step": 23790 }, { "epoch": 330.55, "learning_rate": 1.3956571428571431e-05, "loss": 0.269, "step": 23800 }, { "epoch": 330.69, "learning_rate": 1.394514285714286e-05, "loss": 0.2777, "step": 23810 }, { "epoch": 330.83, "learning_rate": 1.3933714285714286e-05, "loss": 0.2766, "step": 23820 }, { "epoch": 330.97, "learning_rate": 1.3922285714285715e-05, "loss": 0.2815, "step": 23830 }, { "epoch": 331.0, "eval_loss": 0.6368274092674255, "eval_runtime": 130.2238, "eval_samples_per_second": 4.085, "eval_steps_per_second": 0.514, "eval_wer": 0.21777977759208073, "step": 23832 }, { "epoch": 331.11, "learning_rate": 1.3910857142857143e-05, "loss": 0.274, "step": 23840 }, { "epoch": 331.25, "learning_rate": 1.3899428571428573e-05, "loss": 0.2757, "step": 23850 }, { "epoch": 331.39, "learning_rate": 1.3888000000000002e-05, "loss": 0.2772, "step": 23860 }, { "epoch": 331.53, "learning_rate": 1.387657142857143e-05, "loss": 0.2854, "step": 23870 }, { "epoch": 331.66, "learning_rate": 1.3865142857142858e-05, "loss": 0.2768, "step": 23880 }, { "epoch": 331.8, "learning_rate": 1.3853714285714285e-05, "loss": 0.2798, "step": 23890 }, { "epoch": 331.94, "learning_rate": 1.3842285714285715e-05, "loss": 0.2823, "step": 23900 }, { "epoch": 332.0, "eval_loss": 0.6373156309127808, "eval_runtime": 130.7116, "eval_samples_per_second": 4.07, "eval_steps_per_second": 0.513, "eval_wer": 0.219708169955647, "step": 23904 }, { "epoch": 332.08, "learning_rate": 1.3830857142857144e-05, "loss": 0.2894, "step": 23910 }, { "epoch": 332.22, "learning_rate": 1.3819428571428572e-05, "loss": 0.2784, "step": 23920 }, { "epoch": 332.36, "learning_rate": 1.3808e-05, "loss": 0.267, "step": 23930 }, { "epoch": 332.5, "learning_rate": 1.379657142857143e-05, "loss": 0.2837, "step": 23940 }, { "epoch": 332.64, "learning_rate": 1.378514285714286e-05, "loss": 0.272, "step": 23950 }, { "epoch": 332.78, "learning_rate": 1.3773714285714286e-05, "loss": 0.26, "step": 23960 }, { "epoch": 332.91, "learning_rate": 1.3762285714285714e-05, "loss": 0.2885, "step": 23970 }, { "epoch": 333.0, "eval_loss": 0.6352220177650452, "eval_runtime": 130.1826, "eval_samples_per_second": 4.087, "eval_steps_per_second": 0.515, "eval_wer": 0.22002956868290802, "step": 23976 }, { "epoch": 333.06, "learning_rate": 1.3750857142857143e-05, "loss": 0.2955, "step": 23980 }, { "epoch": 333.19, "learning_rate": 1.3739428571428573e-05, "loss": 0.2813, "step": 23990 }, { "epoch": 333.33, "learning_rate": 1.3728000000000001e-05, "loss": 0.2741, "step": 24000 }, { "epoch": 333.47, "learning_rate": 1.371657142857143e-05, "loss": 0.2734, "step": 24010 }, { "epoch": 333.61, "learning_rate": 1.3705142857142858e-05, "loss": 0.2599, "step": 24020 }, { "epoch": 333.75, "learning_rate": 1.3693714285714285e-05, "loss": 0.2833, "step": 24030 }, { "epoch": 333.89, "learning_rate": 1.3682285714285715e-05, "loss": 0.2751, "step": 24040 }, { "epoch": 334.0, "eval_loss": 0.6430666446685791, "eval_runtime": 130.2303, "eval_samples_per_second": 4.085, "eval_steps_per_second": 0.514, "eval_wer": 0.2158513852285145, "step": 24048 }, { "epoch": 334.03, "learning_rate": 1.3670857142857144e-05, "loss": 0.2786, "step": 24050 }, { "epoch": 334.17, "learning_rate": 1.3659428571428572e-05, "loss": 0.2717, "step": 24060 }, { "epoch": 334.3, "learning_rate": 1.3648e-05, "loss": 0.2763, "step": 24070 }, { "epoch": 334.44, "learning_rate": 1.363657142857143e-05, "loss": 0.2837, "step": 24080 }, { "epoch": 334.58, "learning_rate": 1.3625142857142859e-05, "loss": 0.281, "step": 24090 }, { "epoch": 334.72, "learning_rate": 1.3613714285714287e-05, "loss": 0.2776, "step": 24100 }, { "epoch": 334.86, "learning_rate": 1.3602285714285714e-05, "loss": 0.2593, "step": 24110 }, { "epoch": 335.0, "learning_rate": 1.3590857142857143e-05, "loss": 0.2717, "step": 24120 }, { "epoch": 335.0, "eval_loss": 0.6339147090911865, "eval_runtime": 132.1075, "eval_samples_per_second": 4.027, "eval_steps_per_second": 0.507, "eval_wer": 0.22125088384649996, "step": 24120 }, { "epoch": 335.14, "learning_rate": 1.3579428571428573e-05, "loss": 0.2713, "step": 24130 }, { "epoch": 335.28, "learning_rate": 1.3568000000000001e-05, "loss": 0.27, "step": 24140 }, { "epoch": 335.42, "learning_rate": 1.355657142857143e-05, "loss": 0.2694, "step": 24150 }, { "epoch": 335.55, "learning_rate": 1.3545142857142858e-05, "loss": 0.2784, "step": 24160 }, { "epoch": 335.69, "learning_rate": 1.3533714285714288e-05, "loss": 0.2729, "step": 24170 }, { "epoch": 335.83, "learning_rate": 1.3522285714285715e-05, "loss": 0.2675, "step": 24180 }, { "epoch": 335.97, "learning_rate": 1.3510857142857143e-05, "loss": 0.286, "step": 24190 }, { "epoch": 336.0, "eval_loss": 0.6566382646560669, "eval_runtime": 131.0264, "eval_samples_per_second": 4.06, "eval_steps_per_second": 0.511, "eval_wer": 0.22452915086456257, "step": 24192 }, { "epoch": 336.11, "learning_rate": 1.3499428571428572e-05, "loss": 0.2722, "step": 24200 }, { "epoch": 336.25, "learning_rate": 1.3488e-05, "loss": 0.2756, "step": 24210 }, { "epoch": 336.39, "learning_rate": 1.347657142857143e-05, "loss": 0.2682, "step": 24220 }, { "epoch": 336.53, "learning_rate": 1.3465142857142859e-05, "loss": 0.2853, "step": 24230 }, { "epoch": 336.66, "learning_rate": 1.3453714285714287e-05, "loss": 0.2789, "step": 24240 }, { "epoch": 336.8, "learning_rate": 1.3442285714285714e-05, "loss": 0.2718, "step": 24250 }, { "epoch": 336.94, "learning_rate": 1.3430857142857142e-05, "loss": 0.2678, "step": 24260 }, { "epoch": 337.0, "eval_loss": 0.6442694067955017, "eval_runtime": 129.9647, "eval_samples_per_second": 4.093, "eval_steps_per_second": 0.516, "eval_wer": 0.21938677122838593, "step": 24264 }, { "epoch": 337.08, "learning_rate": 1.3419428571428573e-05, "loss": 0.2659, "step": 24270 }, { "epoch": 337.22, "learning_rate": 1.3408000000000001e-05, "loss": 0.28, "step": 24280 }, { "epoch": 337.36, "learning_rate": 1.339657142857143e-05, "loss": 0.2629, "step": 24290 }, { "epoch": 337.5, "learning_rate": 1.3385142857142858e-05, "loss": 0.271, "step": 24300 }, { "epoch": 337.64, "learning_rate": 1.3373714285714288e-05, "loss": 0.2669, "step": 24310 }, { "epoch": 337.78, "learning_rate": 1.3362285714285715e-05, "loss": 0.2677, "step": 24320 }, { "epoch": 337.91, "learning_rate": 1.3350857142857143e-05, "loss": 0.2692, "step": 24330 }, { "epoch": 338.0, "eval_loss": 0.6351694464683533, "eval_runtime": 130.6029, "eval_samples_per_second": 4.073, "eval_steps_per_second": 0.513, "eval_wer": 0.22253647875554414, "step": 24336 }, { "epoch": 338.06, "learning_rate": 1.3339428571428572e-05, "loss": 0.2808, "step": 24340 }, { "epoch": 338.19, "learning_rate": 1.3328e-05, "loss": 0.2703, "step": 24350 }, { "epoch": 338.33, "learning_rate": 1.331657142857143e-05, "loss": 0.2734, "step": 24360 }, { "epoch": 338.47, "learning_rate": 1.3305142857142859e-05, "loss": 0.2771, "step": 24370 }, { "epoch": 338.61, "learning_rate": 1.3293714285714287e-05, "loss": 0.266, "step": 24380 }, { "epoch": 338.75, "learning_rate": 1.3282285714285717e-05, "loss": 0.2649, "step": 24390 }, { "epoch": 338.89, "learning_rate": 1.3270857142857142e-05, "loss": 0.273, "step": 24400 }, { "epoch": 339.0, "eval_loss": 0.6496888399124146, "eval_runtime": 130.4288, "eval_samples_per_second": 4.079, "eval_steps_per_second": 0.514, "eval_wer": 0.21874397377386384, "step": 24408 }, { "epoch": 339.03, "learning_rate": 1.3259428571428572e-05, "loss": 0.2782, "step": 24410 }, { "epoch": 339.17, "learning_rate": 1.3248000000000001e-05, "loss": 0.264, "step": 24420 }, { "epoch": 339.3, "learning_rate": 1.323657142857143e-05, "loss": 0.2731, "step": 24430 }, { "epoch": 339.44, "learning_rate": 1.3225142857142858e-05, "loss": 0.2677, "step": 24440 }, { "epoch": 339.58, "learning_rate": 1.3214857142857145e-05, "loss": 0.2758, "step": 24450 }, { "epoch": 339.72, "learning_rate": 1.3203428571428572e-05, "loss": 0.2778, "step": 24460 }, { "epoch": 339.86, "learning_rate": 1.3192e-05, "loss": 0.2619, "step": 24470 }, { "epoch": 340.0, "learning_rate": 1.3180571428571429e-05, "loss": 0.2686, "step": 24480 }, { "epoch": 340.0, "eval_loss": 0.678778886795044, "eval_runtime": 130.2876, "eval_samples_per_second": 4.083, "eval_steps_per_second": 0.514, "eval_wer": 0.2213794433374044, "step": 24480 }, { "epoch": 340.14, "learning_rate": 1.3169142857142859e-05, "loss": 0.2805, "step": 24490 }, { "epoch": 340.28, "learning_rate": 1.3157714285714287e-05, "loss": 0.2675, "step": 24500 }, { "epoch": 340.42, "learning_rate": 1.3146285714285716e-05, "loss": 0.2788, "step": 24510 }, { "epoch": 340.55, "learning_rate": 1.3134857142857144e-05, "loss": 0.2681, "step": 24520 }, { "epoch": 340.69, "learning_rate": 1.312342857142857e-05, "loss": 0.2642, "step": 24530 }, { "epoch": 340.83, "learning_rate": 1.3112e-05, "loss": 0.2594, "step": 24540 }, { "epoch": 340.97, "learning_rate": 1.310057142857143e-05, "loss": 0.2699, "step": 24550 }, { "epoch": 341.0, "eval_loss": 0.661529004573822, "eval_runtime": 130.2322, "eval_samples_per_second": 4.085, "eval_steps_per_second": 0.514, "eval_wer": 0.2198367294465514, "step": 24552 }, { "epoch": 341.11, "learning_rate": 1.3089142857142858e-05, "loss": 0.2746, "step": 24560 }, { "epoch": 341.25, "learning_rate": 1.3077714285714286e-05, "loss": 0.2683, "step": 24570 }, { "epoch": 341.39, "learning_rate": 1.3066285714285716e-05, "loss": 0.2623, "step": 24580 }, { "epoch": 341.53, "learning_rate": 1.3054857142857145e-05, "loss": 0.2615, "step": 24590 }, { "epoch": 341.66, "learning_rate": 1.3043428571428573e-05, "loss": 0.277, "step": 24600 }, { "epoch": 341.8, "learning_rate": 1.3032e-05, "loss": 0.2663, "step": 24610 }, { "epoch": 341.94, "learning_rate": 1.3020571428571428e-05, "loss": 0.2636, "step": 24620 }, { "epoch": 342.0, "eval_loss": 0.6765093207359314, "eval_runtime": 130.3296, "eval_samples_per_second": 4.082, "eval_steps_per_second": 0.514, "eval_wer": 0.21957961046474256, "step": 24624 }, { "epoch": 342.08, "learning_rate": 1.3009142857142858e-05, "loss": 0.2723, "step": 24630 }, { "epoch": 342.22, "learning_rate": 1.2997714285714287e-05, "loss": 0.2743, "step": 24640 }, { "epoch": 342.36, "learning_rate": 1.2986285714285715e-05, "loss": 0.2605, "step": 24650 }, { "epoch": 342.5, "learning_rate": 1.2974857142857144e-05, "loss": 0.2726, "step": 24660 }, { "epoch": 342.64, "learning_rate": 1.2963428571428574e-05, "loss": 0.2576, "step": 24670 }, { "epoch": 342.78, "learning_rate": 1.2952e-05, "loss": 0.2607, "step": 24680 }, { "epoch": 342.91, "learning_rate": 1.2940571428571429e-05, "loss": 0.2545, "step": 24690 }, { "epoch": 343.0, "eval_loss": 0.673693835735321, "eval_runtime": 130.0495, "eval_samples_per_second": 4.091, "eval_steps_per_second": 0.515, "eval_wer": 0.22022240791926465, "step": 24696 }, { "epoch": 343.06, "learning_rate": 1.2929142857142858e-05, "loss": 0.2748, "step": 24700 }, { "epoch": 343.19, "learning_rate": 1.2917714285714286e-05, "loss": 0.2679, "step": 24710 }, { "epoch": 343.33, "learning_rate": 1.2906285714285716e-05, "loss": 0.2571, "step": 24720 }, { "epoch": 343.47, "learning_rate": 1.2894857142857145e-05, "loss": 0.2775, "step": 24730 }, { "epoch": 343.61, "learning_rate": 1.2883428571428573e-05, "loss": 0.265, "step": 24740 }, { "epoch": 343.75, "learning_rate": 1.2872e-05, "loss": 0.2731, "step": 24750 }, { "epoch": 343.89, "learning_rate": 1.2860571428571428e-05, "loss": 0.2612, "step": 24760 }, { "epoch": 344.0, "eval_loss": 0.6890807151794434, "eval_runtime": 129.7723, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.2239506331554927, "step": 24768 }, { "epoch": 344.03, "learning_rate": 1.2849142857142858e-05, "loss": 0.2802, "step": 24770 }, { "epoch": 344.17, "learning_rate": 1.2837714285714287e-05, "loss": 0.2619, "step": 24780 }, { "epoch": 344.3, "learning_rate": 1.2826285714285715e-05, "loss": 0.2592, "step": 24790 }, { "epoch": 344.44, "learning_rate": 1.2814857142857144e-05, "loss": 0.2735, "step": 24800 }, { "epoch": 344.58, "learning_rate": 1.2803428571428574e-05, "loss": 0.2672, "step": 24810 }, { "epoch": 344.72, "learning_rate": 1.2792e-05, "loss": 0.2691, "step": 24820 }, { "epoch": 344.86, "learning_rate": 1.2780571428571429e-05, "loss": 0.2592, "step": 24830 }, { "epoch": 345.0, "learning_rate": 1.2769142857142857e-05, "loss": 0.2705, "step": 24840 }, { "epoch": 345.0, "eval_loss": 0.6550489068031311, "eval_runtime": 130.2014, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.22035096741016905, "step": 24840 }, { "epoch": 345.14, "learning_rate": 1.2757714285714286e-05, "loss": 0.2638, "step": 24850 }, { "epoch": 345.28, "learning_rate": 1.2746285714285716e-05, "loss": 0.2732, "step": 24860 }, { "epoch": 345.42, "learning_rate": 1.2734857142857144e-05, "loss": 0.2717, "step": 24870 }, { "epoch": 345.55, "learning_rate": 1.2723428571428573e-05, "loss": 0.2574, "step": 24880 }, { "epoch": 345.69, "learning_rate": 1.2712000000000001e-05, "loss": 0.2664, "step": 24890 }, { "epoch": 345.83, "learning_rate": 1.2700571428571428e-05, "loss": 0.2663, "step": 24900 }, { "epoch": 345.97, "learning_rate": 1.2689142857142858e-05, "loss": 0.2658, "step": 24910 }, { "epoch": 346.0, "eval_loss": 0.6591129302978516, "eval_runtime": 130.1248, "eval_samples_per_second": 4.088, "eval_steps_per_second": 0.515, "eval_wer": 0.21996528893745582, "step": 24912 }, { "epoch": 346.11, "learning_rate": 1.2677714285714287e-05, "loss": 0.261, "step": 24920 }, { "epoch": 346.25, "learning_rate": 1.2666285714285715e-05, "loss": 0.2718, "step": 24930 }, { "epoch": 346.39, "learning_rate": 1.2654857142857143e-05, "loss": 0.2621, "step": 24940 }, { "epoch": 346.53, "learning_rate": 1.2643428571428574e-05, "loss": 0.2708, "step": 24950 }, { "epoch": 346.66, "learning_rate": 1.2632000000000002e-05, "loss": 0.2652, "step": 24960 }, { "epoch": 346.8, "learning_rate": 1.2620571428571429e-05, "loss": 0.2526, "step": 24970 }, { "epoch": 346.94, "learning_rate": 1.2609142857142857e-05, "loss": 0.2701, "step": 24980 }, { "epoch": 347.0, "eval_loss": 0.6222058534622192, "eval_runtime": 129.9237, "eval_samples_per_second": 4.095, "eval_steps_per_second": 0.516, "eval_wer": 0.22157228257376102, "step": 24984 }, { "epoch": 347.08, "learning_rate": 1.2597714285714286e-05, "loss": 0.2623, "step": 24990 }, { "epoch": 347.22, "learning_rate": 1.2586285714285716e-05, "loss": 0.2584, "step": 25000 }, { "epoch": 347.36, "learning_rate": 1.2574857142857144e-05, "loss": 0.2514, "step": 25010 }, { "epoch": 347.5, "learning_rate": 1.2563428571428573e-05, "loss": 0.2741, "step": 25020 }, { "epoch": 347.64, "learning_rate": 1.2552000000000001e-05, "loss": 0.2741, "step": 25030 }, { "epoch": 347.78, "learning_rate": 1.2540571428571428e-05, "loss": 0.2645, "step": 25040 }, { "epoch": 347.91, "learning_rate": 1.2529142857142858e-05, "loss": 0.2743, "step": 25050 }, { "epoch": 348.0, "eval_loss": 0.6263449192047119, "eval_runtime": 130.2831, "eval_samples_per_second": 4.083, "eval_steps_per_second": 0.514, "eval_wer": 0.21855113453750724, "step": 25056 }, { "epoch": 348.06, "learning_rate": 1.2517714285714286e-05, "loss": 0.2738, "step": 25060 }, { "epoch": 348.19, "learning_rate": 1.2506285714285715e-05, "loss": 0.2708, "step": 25070 }, { "epoch": 348.33, "learning_rate": 1.2494857142857143e-05, "loss": 0.2623, "step": 25080 }, { "epoch": 348.47, "learning_rate": 1.2483428571428573e-05, "loss": 0.2666, "step": 25090 }, { "epoch": 348.61, "learning_rate": 1.2472000000000002e-05, "loss": 0.2718, "step": 25100 }, { "epoch": 348.75, "learning_rate": 1.2460571428571429e-05, "loss": 0.2694, "step": 25110 }, { "epoch": 348.89, "learning_rate": 1.2449142857142857e-05, "loss": 0.2657, "step": 25120 }, { "epoch": 349.0, "eval_loss": 0.6509300470352173, "eval_runtime": 129.9501, "eval_samples_per_second": 4.094, "eval_steps_per_second": 0.516, "eval_wer": 0.21855113453750724, "step": 25128 }, { "epoch": 349.03, "learning_rate": 1.2437714285714286e-05, "loss": 0.2862, "step": 25130 }, { "epoch": 349.17, "learning_rate": 1.2426285714285716e-05, "loss": 0.2648, "step": 25140 }, { "epoch": 349.3, "learning_rate": 1.2414857142857144e-05, "loss": 0.2646, "step": 25150 }, { "epoch": 349.44, "learning_rate": 1.2403428571428573e-05, "loss": 0.2764, "step": 25160 }, { "epoch": 349.58, "learning_rate": 1.2392000000000003e-05, "loss": 0.2596, "step": 25170 }, { "epoch": 349.72, "learning_rate": 1.2380571428571431e-05, "loss": 0.276, "step": 25180 }, { "epoch": 349.86, "learning_rate": 1.2369142857142858e-05, "loss": 0.2626, "step": 25190 }, { "epoch": 350.0, "learning_rate": 1.2357714285714286e-05, "loss": 0.2635, "step": 25200 }, { "epoch": 350.0, "eval_loss": 0.6570056676864624, "eval_runtime": 130.7454, "eval_samples_per_second": 4.069, "eval_steps_per_second": 0.512, "eval_wer": 0.2206723661374301, "step": 25200 }, { "epoch": 350.14, "learning_rate": 1.2346285714285715e-05, "loss": 0.2729, "step": 25210 }, { "epoch": 350.28, "learning_rate": 1.2334857142857143e-05, "loss": 0.2745, "step": 25220 }, { "epoch": 350.42, "learning_rate": 1.2323428571428573e-05, "loss": 0.2716, "step": 25230 }, { "epoch": 350.55, "learning_rate": 1.2312000000000002e-05, "loss": 0.2571, "step": 25240 }, { "epoch": 350.69, "learning_rate": 1.230057142857143e-05, "loss": 0.2823, "step": 25250 }, { "epoch": 350.83, "learning_rate": 1.2289142857142857e-05, "loss": 0.2756, "step": 25260 }, { "epoch": 350.97, "learning_rate": 1.2277714285714285e-05, "loss": 0.2601, "step": 25270 }, { "epoch": 351.0, "eval_loss": 0.6495571136474609, "eval_runtime": 129.8963, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.21546570675580123, "step": 25272 }, { "epoch": 351.11, "learning_rate": 1.2266285714285715e-05, "loss": 0.2714, "step": 25280 }, { "epoch": 351.25, "learning_rate": 1.2254857142857144e-05, "loss": 0.2775, "step": 25290 }, { "epoch": 351.39, "learning_rate": 1.2243428571428572e-05, "loss": 0.272, "step": 25300 }, { "epoch": 351.53, "learning_rate": 1.2232000000000002e-05, "loss": 0.2621, "step": 25310 }, { "epoch": 351.66, "learning_rate": 1.2220571428571431e-05, "loss": 0.2685, "step": 25320 }, { "epoch": 351.8, "learning_rate": 1.2209142857142858e-05, "loss": 0.2654, "step": 25330 }, { "epoch": 351.94, "learning_rate": 1.2197714285714286e-05, "loss": 0.2695, "step": 25340 }, { "epoch": 352.0, "eval_loss": 0.6305015683174133, "eval_runtime": 131.0557, "eval_samples_per_second": 4.059, "eval_steps_per_second": 0.511, "eval_wer": 0.21694414090120204, "step": 25344 }, { "epoch": 352.08, "learning_rate": 1.2186285714285715e-05, "loss": 0.2762, "step": 25350 }, { "epoch": 352.22, "learning_rate": 1.2174857142857143e-05, "loss": 0.2689, "step": 25360 }, { "epoch": 352.36, "learning_rate": 1.2163428571428573e-05, "loss": 0.2618, "step": 25370 }, { "epoch": 352.5, "learning_rate": 1.2152000000000002e-05, "loss": 0.2685, "step": 25380 }, { "epoch": 352.64, "learning_rate": 1.214057142857143e-05, "loss": 0.2726, "step": 25390 }, { "epoch": 352.78, "learning_rate": 1.2129142857142857e-05, "loss": 0.2598, "step": 25400 }, { "epoch": 352.91, "learning_rate": 1.2117714285714285e-05, "loss": 0.2586, "step": 25410 }, { "epoch": 353.0, "eval_loss": 0.6268894076347351, "eval_runtime": 130.607, "eval_samples_per_second": 4.073, "eval_steps_per_second": 0.513, "eval_wer": 0.2222793597737353, "step": 25416 }, { "epoch": 353.06, "learning_rate": 1.2106285714285715e-05, "loss": 0.2688, "step": 25420 }, { "epoch": 353.19, "learning_rate": 1.2094857142857144e-05, "loss": 0.2628, "step": 25430 }, { "epoch": 353.33, "learning_rate": 1.2083428571428572e-05, "loss": 0.2558, "step": 25440 }, { "epoch": 353.47, "learning_rate": 1.2072000000000002e-05, "loss": 0.2729, "step": 25450 }, { "epoch": 353.61, "learning_rate": 1.206057142857143e-05, "loss": 0.2649, "step": 25460 }, { "epoch": 353.75, "learning_rate": 1.2049142857142858e-05, "loss": 0.2666, "step": 25470 }, { "epoch": 353.89, "learning_rate": 1.2037714285714286e-05, "loss": 0.2529, "step": 25480 }, { "epoch": 354.0, "eval_loss": 0.6417762637138367, "eval_runtime": 132.0505, "eval_samples_per_second": 4.029, "eval_steps_per_second": 0.507, "eval_wer": 0.22041524715562127, "step": 25488 }, { "epoch": 354.03, "learning_rate": 1.2026285714285714e-05, "loss": 0.2779, "step": 25490 }, { "epoch": 354.17, "learning_rate": 1.2014857142857143e-05, "loss": 0.2673, "step": 25500 }, { "epoch": 354.3, "learning_rate": 1.2003428571428573e-05, "loss": 0.2697, "step": 25510 }, { "epoch": 354.44, "learning_rate": 1.1992000000000001e-05, "loss": 0.2707, "step": 25520 }, { "epoch": 354.58, "learning_rate": 1.198057142857143e-05, "loss": 0.276, "step": 25530 }, { "epoch": 354.72, "learning_rate": 1.196914285714286e-05, "loss": 0.2695, "step": 25540 }, { "epoch": 354.86, "learning_rate": 1.1957714285714285e-05, "loss": 0.264, "step": 25550 }, { "epoch": 355.0, "learning_rate": 1.1946285714285715e-05, "loss": 0.2739, "step": 25560 }, { "epoch": 355.0, "eval_loss": 0.6471614837646484, "eval_runtime": 131.378, "eval_samples_per_second": 4.049, "eval_steps_per_second": 0.51, "eval_wer": 0.2174583788648197, "step": 25560 }, { "epoch": 355.14, "learning_rate": 1.1934857142857144e-05, "loss": 0.2724, "step": 25570 }, { "epoch": 355.28, "learning_rate": 1.1923428571428572e-05, "loss": 0.2821, "step": 25580 }, { "epoch": 355.42, "learning_rate": 1.1912000000000002e-05, "loss": 0.2801, "step": 25590 }, { "epoch": 355.55, "learning_rate": 1.190057142857143e-05, "loss": 0.2575, "step": 25600 }, { "epoch": 355.69, "learning_rate": 1.1889142857142859e-05, "loss": 0.2692, "step": 25610 }, { "epoch": 355.83, "learning_rate": 1.1877714285714286e-05, "loss": 0.2615, "step": 25620 }, { "epoch": 355.97, "learning_rate": 1.1866285714285714e-05, "loss": 0.2738, "step": 25630 }, { "epoch": 356.0, "eval_loss": 0.6416028738021851, "eval_runtime": 131.7037, "eval_samples_per_second": 4.039, "eval_steps_per_second": 0.509, "eval_wer": 0.21867969402841164, "step": 25632 }, { "epoch": 356.11, "learning_rate": 1.1854857142857143e-05, "loss": 0.278, "step": 25640 }, { "epoch": 356.25, "learning_rate": 1.1843428571428573e-05, "loss": 0.2673, "step": 25650 }, { "epoch": 356.39, "learning_rate": 1.1832000000000001e-05, "loss": 0.2639, "step": 25660 }, { "epoch": 356.53, "learning_rate": 1.182057142857143e-05, "loss": 0.2678, "step": 25670 }, { "epoch": 356.66, "learning_rate": 1.180914285714286e-05, "loss": 0.2668, "step": 25680 }, { "epoch": 356.8, "learning_rate": 1.1797714285714285e-05, "loss": 0.2654, "step": 25690 }, { "epoch": 356.94, "learning_rate": 1.1786285714285715e-05, "loss": 0.2775, "step": 25700 }, { "epoch": 357.0, "eval_loss": 0.6470057964324951, "eval_runtime": 131.655, "eval_samples_per_second": 4.041, "eval_steps_per_second": 0.509, "eval_wer": 0.2208009256283345, "step": 25704 }, { "epoch": 357.08, "learning_rate": 1.1774857142857143e-05, "loss": 0.2792, "step": 25710 }, { "epoch": 357.22, "learning_rate": 1.1763428571428572e-05, "loss": 0.2665, "step": 25720 }, { "epoch": 357.36, "learning_rate": 1.1752000000000002e-05, "loss": 0.2556, "step": 25730 }, { "epoch": 357.5, "learning_rate": 1.174057142857143e-05, "loss": 0.2684, "step": 25740 }, { "epoch": 357.64, "learning_rate": 1.1729142857142859e-05, "loss": 0.2791, "step": 25750 }, { "epoch": 357.78, "learning_rate": 1.1717714285714286e-05, "loss": 0.2638, "step": 25760 }, { "epoch": 357.91, "learning_rate": 1.1706285714285714e-05, "loss": 0.2775, "step": 25770 }, { "epoch": 358.0, "eval_loss": 0.6483216881752014, "eval_runtime": 131.7531, "eval_samples_per_second": 4.038, "eval_steps_per_second": 0.509, "eval_wer": 0.22009384842836022, "step": 25776 }, { "epoch": 358.06, "learning_rate": 1.1694857142857144e-05, "loss": 0.2711, "step": 25780 }, { "epoch": 358.19, "learning_rate": 1.1683428571428573e-05, "loss": 0.2604, "step": 25790 }, { "epoch": 358.33, "learning_rate": 1.1672000000000001e-05, "loss": 0.2721, "step": 25800 }, { "epoch": 358.47, "learning_rate": 1.166057142857143e-05, "loss": 0.2771, "step": 25810 }, { "epoch": 358.61, "learning_rate": 1.164914285714286e-05, "loss": 0.2671, "step": 25820 }, { "epoch": 358.75, "learning_rate": 1.1637714285714288e-05, "loss": 0.2688, "step": 25830 }, { "epoch": 358.89, "learning_rate": 1.1626285714285715e-05, "loss": 0.2622, "step": 25840 }, { "epoch": 359.0, "eval_loss": 0.6232872009277344, "eval_runtime": 131.8106, "eval_samples_per_second": 4.036, "eval_steps_per_second": 0.508, "eval_wer": 0.21642990293758438, "step": 25848 }, { "epoch": 359.03, "learning_rate": 1.1614857142857143e-05, "loss": 0.2771, "step": 25850 }, { "epoch": 359.17, "learning_rate": 1.1603428571428572e-05, "loss": 0.2685, "step": 25860 }, { "epoch": 359.3, "learning_rate": 1.1592000000000002e-05, "loss": 0.264, "step": 25870 }, { "epoch": 359.44, "learning_rate": 1.158057142857143e-05, "loss": 0.2816, "step": 25880 }, { "epoch": 359.58, "learning_rate": 1.1569142857142859e-05, "loss": 0.2719, "step": 25890 }, { "epoch": 359.72, "learning_rate": 1.1557714285714287e-05, "loss": 0.2667, "step": 25900 }, { "epoch": 359.86, "learning_rate": 1.1546285714285714e-05, "loss": 0.2515, "step": 25910 }, { "epoch": 360.0, "learning_rate": 1.1534857142857144e-05, "loss": 0.2727, "step": 25920 }, { "epoch": 360.0, "eval_loss": 0.6437734961509705, "eval_runtime": 131.7584, "eval_samples_per_second": 4.038, "eval_steps_per_second": 0.509, "eval_wer": 0.21777977759208073, "step": 25920 }, { "epoch": 360.14, "learning_rate": 1.1523428571428572e-05, "loss": 0.2602, "step": 25930 }, { "epoch": 360.28, "learning_rate": 1.1512000000000001e-05, "loss": 0.2649, "step": 25940 }, { "epoch": 360.42, "learning_rate": 1.150057142857143e-05, "loss": 0.2563, "step": 25950 }, { "epoch": 360.55, "learning_rate": 1.148914285714286e-05, "loss": 0.2638, "step": 25960 }, { "epoch": 360.69, "learning_rate": 1.1477714285714288e-05, "loss": 0.2728, "step": 25970 }, { "epoch": 360.83, "learning_rate": 1.1466285714285715e-05, "loss": 0.2622, "step": 25980 }, { "epoch": 360.97, "learning_rate": 1.1454857142857143e-05, "loss": 0.275, "step": 25990 }, { "epoch": 361.0, "eval_loss": 0.6459194421768188, "eval_runtime": 132.3578, "eval_samples_per_second": 4.019, "eval_steps_per_second": 0.506, "eval_wer": 0.22221508002828308, "step": 25992 }, { "epoch": 361.11, "learning_rate": 1.1443428571428572e-05, "loss": 0.2707, "step": 26000 }, { "epoch": 361.25, "learning_rate": 1.1432000000000002e-05, "loss": 0.2713, "step": 26010 }, { "epoch": 361.39, "learning_rate": 1.142057142857143e-05, "loss": 0.2638, "step": 26020 }, { "epoch": 361.53, "learning_rate": 1.1409142857142859e-05, "loss": 0.2743, "step": 26030 }, { "epoch": 361.66, "learning_rate": 1.1397714285714287e-05, "loss": 0.2644, "step": 26040 }, { "epoch": 361.8, "learning_rate": 1.1386285714285714e-05, "loss": 0.2612, "step": 26050 }, { "epoch": 361.94, "learning_rate": 1.1374857142857144e-05, "loss": 0.2688, "step": 26060 }, { "epoch": 362.0, "eval_loss": 0.6329224109649658, "eval_runtime": 131.9157, "eval_samples_per_second": 4.033, "eval_steps_per_second": 0.508, "eval_wer": 0.21880825351931607, "step": 26064 }, { "epoch": 362.08, "learning_rate": 1.1363428571428572e-05, "loss": 0.2809, "step": 26070 }, { "epoch": 362.22, "learning_rate": 1.1352e-05, "loss": 0.2718, "step": 26080 }, { "epoch": 362.36, "learning_rate": 1.134057142857143e-05, "loss": 0.2633, "step": 26090 }, { "epoch": 362.5, "learning_rate": 1.132914285714286e-05, "loss": 0.265, "step": 26100 }, { "epoch": 362.64, "learning_rate": 1.1317714285714288e-05, "loss": 0.2549, "step": 26110 }, { "epoch": 362.78, "learning_rate": 1.1306285714285716e-05, "loss": 0.2751, "step": 26120 }, { "epoch": 362.91, "learning_rate": 1.1294857142857143e-05, "loss": 0.2658, "step": 26130 }, { "epoch": 363.0, "eval_loss": 0.6482300758361816, "eval_runtime": 129.6143, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.2207366458828823, "step": 26136 }, { "epoch": 363.06, "learning_rate": 1.1283428571428571e-05, "loss": 0.2748, "step": 26140 }, { "epoch": 363.19, "learning_rate": 1.1272000000000002e-05, "loss": 0.276, "step": 26150 }, { "epoch": 363.33, "learning_rate": 1.126057142857143e-05, "loss": 0.2613, "step": 26160 }, { "epoch": 363.47, "learning_rate": 1.1249142857142858e-05, "loss": 0.2668, "step": 26170 }, { "epoch": 363.61, "learning_rate": 1.1237714285714287e-05, "loss": 0.2593, "step": 26180 }, { "epoch": 363.75, "learning_rate": 1.1226285714285717e-05, "loss": 0.2761, "step": 26190 }, { "epoch": 363.89, "learning_rate": 1.1214857142857144e-05, "loss": 0.2693, "step": 26200 }, { "epoch": 364.0, "eval_loss": 0.6337394714355469, "eval_runtime": 130.3655, "eval_samples_per_second": 4.081, "eval_steps_per_second": 0.514, "eval_wer": 0.21938677122838593, "step": 26208 }, { "epoch": 364.03, "learning_rate": 1.1203428571428572e-05, "loss": 0.2688, "step": 26210 }, { "epoch": 364.17, "learning_rate": 1.1192e-05, "loss": 0.2747, "step": 26220 }, { "epoch": 364.3, "learning_rate": 1.1180571428571429e-05, "loss": 0.2707, "step": 26230 }, { "epoch": 364.44, "learning_rate": 1.116914285714286e-05, "loss": 0.2714, "step": 26240 }, { "epoch": 364.58, "learning_rate": 1.1157714285714288e-05, "loss": 0.2606, "step": 26250 }, { "epoch": 364.72, "learning_rate": 1.1146285714285716e-05, "loss": 0.266, "step": 26260 }, { "epoch": 364.86, "learning_rate": 1.1134857142857143e-05, "loss": 0.2588, "step": 26270 }, { "epoch": 365.0, "learning_rate": 1.1123428571428571e-05, "loss": 0.2599, "step": 26280 }, { "epoch": 365.0, "eval_loss": 0.6458225250244141, "eval_runtime": 130.1146, "eval_samples_per_second": 4.089, "eval_steps_per_second": 0.515, "eval_wer": 0.21887253326476827, "step": 26280 }, { "epoch": 365.14, "learning_rate": 1.1112000000000001e-05, "loss": 0.2731, "step": 26290 }, { "epoch": 365.28, "learning_rate": 1.110057142857143e-05, "loss": 0.268, "step": 26300 }, { "epoch": 365.42, "learning_rate": 1.1089142857142858e-05, "loss": 0.2594, "step": 26310 }, { "epoch": 365.55, "learning_rate": 1.1077714285714287e-05, "loss": 0.2582, "step": 26320 }, { "epoch": 365.69, "learning_rate": 1.1066285714285717e-05, "loss": 0.2668, "step": 26330 }, { "epoch": 365.83, "learning_rate": 1.1054857142857144e-05, "loss": 0.2576, "step": 26340 }, { "epoch": 365.97, "learning_rate": 1.1043428571428572e-05, "loss": 0.2683, "step": 26350 }, { "epoch": 366.0, "eval_loss": 0.6483390927314758, "eval_runtime": 130.1117, "eval_samples_per_second": 4.089, "eval_steps_per_second": 0.515, "eval_wer": 0.22125088384649996, "step": 26352 }, { "epoch": 366.11, "learning_rate": 1.1032e-05, "loss": 0.27, "step": 26360 }, { "epoch": 366.25, "learning_rate": 1.1020571428571429e-05, "loss": 0.2744, "step": 26370 }, { "epoch": 366.39, "learning_rate": 1.1009142857142859e-05, "loss": 0.257, "step": 26380 }, { "epoch": 366.53, "learning_rate": 1.0997714285714287e-05, "loss": 0.2558, "step": 26390 }, { "epoch": 366.66, "learning_rate": 1.0986285714285716e-05, "loss": 0.2599, "step": 26400 }, { "epoch": 366.8, "learning_rate": 1.0974857142857143e-05, "loss": 0.2566, "step": 26410 }, { "epoch": 366.94, "learning_rate": 1.0963428571428571e-05, "loss": 0.2665, "step": 26420 }, { "epoch": 367.0, "eval_loss": 0.6575628519058228, "eval_runtime": 129.9589, "eval_samples_per_second": 4.094, "eval_steps_per_second": 0.516, "eval_wer": 0.22028668766471685, "step": 26424 }, { "epoch": 367.08, "learning_rate": 1.0952000000000001e-05, "loss": 0.2671, "step": 26430 }, { "epoch": 367.22, "learning_rate": 1.094057142857143e-05, "loss": 0.2762, "step": 26440 }, { "epoch": 367.36, "learning_rate": 1.0929142857142858e-05, "loss": 0.2518, "step": 26450 }, { "epoch": 367.5, "learning_rate": 1.0917714285714287e-05, "loss": 0.2642, "step": 26460 }, { "epoch": 367.64, "learning_rate": 1.0906285714285717e-05, "loss": 0.2557, "step": 26470 }, { "epoch": 367.78, "learning_rate": 1.0894857142857145e-05, "loss": 0.2527, "step": 26480 }, { "epoch": 367.91, "learning_rate": 1.0883428571428572e-05, "loss": 0.2529, "step": 26490 }, { "epoch": 368.0, "eval_loss": 0.6629326939582825, "eval_runtime": 130.163, "eval_samples_per_second": 4.087, "eval_steps_per_second": 0.515, "eval_wer": 0.22002956868290802, "step": 26496 }, { "epoch": 368.06, "learning_rate": 1.0872e-05, "loss": 0.2657, "step": 26500 }, { "epoch": 368.19, "learning_rate": 1.0860571428571429e-05, "loss": 0.2644, "step": 26510 }, { "epoch": 368.33, "learning_rate": 1.0849142857142859e-05, "loss": 0.2552, "step": 26520 }, { "epoch": 368.47, "learning_rate": 1.0837714285714287e-05, "loss": 0.2614, "step": 26530 }, { "epoch": 368.61, "learning_rate": 1.0826285714285716e-05, "loss": 0.2613, "step": 26540 }, { "epoch": 368.75, "learning_rate": 1.0814857142857144e-05, "loss": 0.2649, "step": 26550 }, { "epoch": 368.89, "learning_rate": 1.0803428571428571e-05, "loss": 0.2536, "step": 26560 }, { "epoch": 369.0, "eval_loss": 0.6664714217185974, "eval_runtime": 129.8663, "eval_samples_per_second": 4.097, "eval_steps_per_second": 0.516, "eval_wer": 0.2208009256283345, "step": 26568 }, { "epoch": 369.03, "learning_rate": 1.0792000000000001e-05, "loss": 0.2691, "step": 26570 }, { "epoch": 369.17, "learning_rate": 1.078057142857143e-05, "loss": 0.2552, "step": 26580 }, { "epoch": 369.3, "learning_rate": 1.0769142857142858e-05, "loss": 0.2608, "step": 26590 }, { "epoch": 369.44, "learning_rate": 1.0757714285714286e-05, "loss": 0.2691, "step": 26600 }, { "epoch": 369.58, "learning_rate": 1.0746285714285716e-05, "loss": 0.2539, "step": 26610 }, { "epoch": 369.72, "learning_rate": 1.0734857142857145e-05, "loss": 0.2625, "step": 26620 }, { "epoch": 369.86, "learning_rate": 1.0723428571428572e-05, "loss": 0.2626, "step": 26630 }, { "epoch": 370.0, "learning_rate": 1.0712e-05, "loss": 0.2562, "step": 26640 }, { "epoch": 370.0, "eval_loss": 0.654497504234314, "eval_runtime": 129.5258, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.21713698013755867, "step": 26640 }, { "epoch": 370.14, "learning_rate": 1.0700571428571429e-05, "loss": 0.2682, "step": 26650 }, { "epoch": 370.28, "learning_rate": 1.0689142857142859e-05, "loss": 0.262, "step": 26660 }, { "epoch": 370.42, "learning_rate": 1.0677714285714287e-05, "loss": 0.249, "step": 26670 }, { "epoch": 370.55, "learning_rate": 1.0666285714285716e-05, "loss": 0.2536, "step": 26680 }, { "epoch": 370.69, "learning_rate": 1.0654857142857144e-05, "loss": 0.2621, "step": 26690 }, { "epoch": 370.83, "learning_rate": 1.064342857142857e-05, "loss": 0.2602, "step": 26700 }, { "epoch": 370.97, "learning_rate": 1.0632000000000001e-05, "loss": 0.2713, "step": 26710 }, { "epoch": 371.0, "eval_loss": 0.6432551145553589, "eval_runtime": 130.1924, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.223114996464614, "step": 26712 }, { "epoch": 371.11, "learning_rate": 1.062057142857143e-05, "loss": 0.2473, "step": 26720 }, { "epoch": 371.25, "learning_rate": 1.0609142857142858e-05, "loss": 0.2674, "step": 26730 }, { "epoch": 371.39, "learning_rate": 1.0597714285714286e-05, "loss": 0.2548, "step": 26740 }, { "epoch": 371.53, "learning_rate": 1.0586285714285716e-05, "loss": 0.2535, "step": 26750 }, { "epoch": 371.66, "learning_rate": 1.0574857142857145e-05, "loss": 0.2641, "step": 26760 }, { "epoch": 371.8, "learning_rate": 1.0563428571428573e-05, "loss": 0.2564, "step": 26770 }, { "epoch": 371.94, "learning_rate": 1.0552e-05, "loss": 0.2545, "step": 26780 }, { "epoch": 372.0, "eval_loss": 0.6329887509346008, "eval_runtime": 130.0727, "eval_samples_per_second": 4.09, "eval_steps_per_second": 0.515, "eval_wer": 0.22015812817381245, "step": 26784 }, { "epoch": 372.08, "learning_rate": 1.0540571428571428e-05, "loss": 0.2591, "step": 26790 }, { "epoch": 372.22, "learning_rate": 1.0529142857142859e-05, "loss": 0.2691, "step": 26800 }, { "epoch": 372.36, "learning_rate": 1.0517714285714287e-05, "loss": 0.2438, "step": 26810 }, { "epoch": 372.5, "learning_rate": 1.0506285714285715e-05, "loss": 0.2608, "step": 26820 }, { "epoch": 372.64, "learning_rate": 1.0494857142857144e-05, "loss": 0.2572, "step": 26830 }, { "epoch": 372.78, "learning_rate": 1.0483428571428574e-05, "loss": 0.2548, "step": 26840 }, { "epoch": 372.91, "learning_rate": 1.0472e-05, "loss": 0.2513, "step": 26850 }, { "epoch": 373.0, "eval_loss": 0.647386372089386, "eval_runtime": 129.472, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.21540142701034903, "step": 26856 }, { "epoch": 373.06, "learning_rate": 1.0460571428571429e-05, "loss": 0.259, "step": 26860 }, { "epoch": 373.19, "learning_rate": 1.0449142857142858e-05, "loss": 0.2551, "step": 26870 }, { "epoch": 373.33, "learning_rate": 1.0437714285714286e-05, "loss": 0.2526, "step": 26880 }, { "epoch": 373.47, "learning_rate": 1.0426285714285716e-05, "loss": 0.2518, "step": 26890 }, { "epoch": 373.61, "learning_rate": 1.0414857142857145e-05, "loss": 0.2475, "step": 26900 }, { "epoch": 373.75, "learning_rate": 1.0403428571428573e-05, "loss": 0.2579, "step": 26910 }, { "epoch": 373.89, "learning_rate": 1.0392e-05, "loss": 0.2564, "step": 26920 }, { "epoch": 374.0, "eval_loss": 0.6519069671630859, "eval_runtime": 129.6819, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2190653725011249, "step": 26928 }, { "epoch": 374.03, "learning_rate": 1.0380571428571428e-05, "loss": 0.2602, "step": 26930 }, { "epoch": 374.17, "learning_rate": 1.0369142857142858e-05, "loss": 0.2635, "step": 26940 }, { "epoch": 374.3, "learning_rate": 1.0357714285714287e-05, "loss": 0.255, "step": 26950 }, { "epoch": 374.44, "learning_rate": 1.0346285714285715e-05, "loss": 0.2495, "step": 26960 }, { "epoch": 374.58, "learning_rate": 1.0334857142857144e-05, "loss": 0.252, "step": 26970 }, { "epoch": 374.72, "learning_rate": 1.0323428571428574e-05, "loss": 0.2608, "step": 26980 }, { "epoch": 374.86, "learning_rate": 1.0312e-05, "loss": 0.2497, "step": 26990 }, { "epoch": 375.0, "learning_rate": 1.0300571428571429e-05, "loss": 0.266, "step": 27000 }, { "epoch": 375.0, "eval_loss": 0.6577351689338684, "eval_runtime": 129.9806, "eval_samples_per_second": 4.093, "eval_steps_per_second": 0.515, "eval_wer": 0.2199010091920036, "step": 27000 }, { "epoch": 375.14, "learning_rate": 1.0289142857142857e-05, "loss": 0.2595, "step": 27010 }, { "epoch": 375.28, "learning_rate": 1.0277714285714286e-05, "loss": 0.2525, "step": 27020 }, { "epoch": 375.42, "learning_rate": 1.0266285714285716e-05, "loss": 0.2664, "step": 27030 }, { "epoch": 375.55, "learning_rate": 1.0254857142857144e-05, "loss": 0.2579, "step": 27040 }, { "epoch": 375.69, "learning_rate": 1.0243428571428573e-05, "loss": 0.2566, "step": 27050 }, { "epoch": 375.83, "learning_rate": 1.0232000000000001e-05, "loss": 0.2525, "step": 27060 }, { "epoch": 375.97, "learning_rate": 1.0220571428571428e-05, "loss": 0.2623, "step": 27070 }, { "epoch": 376.0, "eval_loss": 0.6508190035820007, "eval_runtime": 129.6401, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.21874397377386384, "step": 27072 }, { "epoch": 376.11, "learning_rate": 1.0209142857142858e-05, "loss": 0.2564, "step": 27080 }, { "epoch": 376.25, "learning_rate": 1.0197714285714287e-05, "loss": 0.2564, "step": 27090 }, { "epoch": 376.39, "learning_rate": 1.0186285714285715e-05, "loss": 0.2517, "step": 27100 }, { "epoch": 376.53, "learning_rate": 1.0174857142857144e-05, "loss": 0.2424, "step": 27110 }, { "epoch": 376.66, "learning_rate": 1.0163428571428574e-05, "loss": 0.2558, "step": 27120 }, { "epoch": 376.8, "learning_rate": 1.0152000000000002e-05, "loss": 0.2469, "step": 27130 }, { "epoch": 376.94, "learning_rate": 1.0140571428571429e-05, "loss": 0.2666, "step": 27140 }, { "epoch": 377.0, "eval_loss": 0.6358464360237122, "eval_runtime": 129.4556, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.21707270039210644, "step": 27144 }, { "epoch": 377.08, "learning_rate": 1.0129142857142857e-05, "loss": 0.263, "step": 27150 }, { "epoch": 377.22, "learning_rate": 1.0117714285714286e-05, "loss": 0.2574, "step": 27160 }, { "epoch": 377.36, "learning_rate": 1.0106285714285716e-05, "loss": 0.2421, "step": 27170 }, { "epoch": 377.5, "learning_rate": 1.0094857142857144e-05, "loss": 0.2567, "step": 27180 }, { "epoch": 377.64, "learning_rate": 1.0083428571428573e-05, "loss": 0.2509, "step": 27190 }, { "epoch": 377.78, "learning_rate": 1.0072000000000001e-05, "loss": 0.26, "step": 27200 }, { "epoch": 377.91, "learning_rate": 1.0060571428571428e-05, "loss": 0.2503, "step": 27210 }, { "epoch": 378.0, "eval_loss": 0.6514796018600464, "eval_runtime": 129.9664, "eval_samples_per_second": 4.093, "eval_steps_per_second": 0.516, "eval_wer": 0.21945105097383813, "step": 27216 }, { "epoch": 378.06, "learning_rate": 1.0049142857142858e-05, "loss": 0.2619, "step": 27220 }, { "epoch": 378.19, "learning_rate": 1.0037714285714286e-05, "loss": 0.2647, "step": 27230 }, { "epoch": 378.33, "learning_rate": 1.0026285714285715e-05, "loss": 0.2531, "step": 27240 }, { "epoch": 378.47, "learning_rate": 1.0014857142857143e-05, "loss": 0.2626, "step": 27250 }, { "epoch": 378.61, "learning_rate": 1.0003428571428573e-05, "loss": 0.254, "step": 27260 }, { "epoch": 378.75, "learning_rate": 9.992e-06, "loss": 0.2536, "step": 27270 }, { "epoch": 378.89, "learning_rate": 9.980571428571429e-06, "loss": 0.252, "step": 27280 }, { "epoch": 379.0, "eval_loss": 0.6478943228721619, "eval_runtime": 129.2879, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22208652053737868, "step": 27288 }, { "epoch": 379.03, "learning_rate": 9.969142857142859e-06, "loss": 0.2661, "step": 27290 }, { "epoch": 379.17, "learning_rate": 9.957714285714286e-06, "loss": 0.254, "step": 27300 }, { "epoch": 379.3, "learning_rate": 9.946285714285716e-06, "loss": 0.2493, "step": 27310 }, { "epoch": 379.44, "learning_rate": 9.934857142857144e-06, "loss": 0.2662, "step": 27320 }, { "epoch": 379.58, "learning_rate": 9.923428571428573e-06, "loss": 0.2525, "step": 27330 }, { "epoch": 379.72, "learning_rate": 9.912000000000001e-06, "loss": 0.255, "step": 27340 }, { "epoch": 379.86, "learning_rate": 9.90057142857143e-06, "loss": 0.2544, "step": 27350 }, { "epoch": 380.0, "learning_rate": 9.890285714285715e-06, "loss": 0.2558, "step": 27360 }, { "epoch": 380.0, "eval_loss": 0.6343653798103333, "eval_runtime": 129.729, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.22028668766471685, "step": 27360 }, { "epoch": 380.14, "learning_rate": 9.878857142857143e-06, "loss": 0.2513, "step": 27370 }, { "epoch": 380.28, "learning_rate": 9.867428571428572e-06, "loss": 0.2582, "step": 27380 }, { "epoch": 380.42, "learning_rate": 9.856000000000002e-06, "loss": 0.2615, "step": 27390 }, { "epoch": 380.55, "learning_rate": 9.844571428571429e-06, "loss": 0.255, "step": 27400 }, { "epoch": 380.69, "learning_rate": 9.833142857142857e-06, "loss": 0.261, "step": 27410 }, { "epoch": 380.83, "learning_rate": 9.821714285714287e-06, "loss": 0.2552, "step": 27420 }, { "epoch": 380.97, "learning_rate": 9.810285714285716e-06, "loss": 0.2673, "step": 27430 }, { "epoch": 381.0, "eval_loss": 0.671670138835907, "eval_runtime": 129.7298, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.21964389021019476, "step": 27432 }, { "epoch": 381.11, "learning_rate": 9.798857142857144e-06, "loss": 0.2554, "step": 27440 }, { "epoch": 381.25, "learning_rate": 9.787428571428572e-06, "loss": 0.2736, "step": 27450 }, { "epoch": 381.39, "learning_rate": 9.776000000000001e-06, "loss": 0.2605, "step": 27460 }, { "epoch": 381.53, "learning_rate": 9.76457142857143e-06, "loss": 0.2546, "step": 27470 }, { "epoch": 381.66, "learning_rate": 9.753142857142858e-06, "loss": 0.2527, "step": 27480 }, { "epoch": 381.8, "learning_rate": 9.741714285714286e-06, "loss": 0.2455, "step": 27490 }, { "epoch": 381.94, "learning_rate": 9.730285714285715e-06, "loss": 0.2615, "step": 27500 }, { "epoch": 382.0, "eval_loss": 0.6392806172370911, "eval_runtime": 130.3791, "eval_samples_per_second": 4.08, "eval_steps_per_second": 0.514, "eval_wer": 0.21777977759208073, "step": 27504 }, { "epoch": 382.08, "learning_rate": 9.718857142857143e-06, "loss": 0.2528, "step": 27510 }, { "epoch": 382.22, "learning_rate": 9.707428571428572e-06, "loss": 0.2538, "step": 27520 }, { "epoch": 382.36, "learning_rate": 9.696000000000002e-06, "loss": 0.2474, "step": 27530 }, { "epoch": 382.5, "learning_rate": 9.68457142857143e-06, "loss": 0.2507, "step": 27540 }, { "epoch": 382.64, "learning_rate": 9.673142857142857e-06, "loss": 0.2596, "step": 27550 }, { "epoch": 382.78, "learning_rate": 9.661714285714287e-06, "loss": 0.2566, "step": 27560 }, { "epoch": 382.91, "learning_rate": 9.650285714285715e-06, "loss": 0.2603, "step": 27570 }, { "epoch": 383.0, "eval_loss": 0.6375032663345337, "eval_runtime": 130.3268, "eval_samples_per_second": 4.082, "eval_steps_per_second": 0.514, "eval_wer": 0.2166870219193932, "step": 27576 }, { "epoch": 383.06, "learning_rate": 9.638857142857144e-06, "loss": 0.2657, "step": 27580 }, { "epoch": 383.19, "learning_rate": 9.627428571428572e-06, "loss": 0.2573, "step": 27590 }, { "epoch": 383.33, "learning_rate": 9.616e-06, "loss": 0.2574, "step": 27600 }, { "epoch": 383.47, "learning_rate": 9.60457142857143e-06, "loss": 0.263, "step": 27610 }, { "epoch": 383.61, "learning_rate": 9.593142857142858e-06, "loss": 0.2513, "step": 27620 }, { "epoch": 383.75, "learning_rate": 9.581714285714286e-06, "loss": 0.2606, "step": 27630 }, { "epoch": 383.89, "learning_rate": 9.570285714285715e-06, "loss": 0.2522, "step": 27640 }, { "epoch": 384.0, "eval_loss": 0.6380506753921509, "eval_runtime": 129.4449, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.21951533071929036, "step": 27648 }, { "epoch": 384.03, "learning_rate": 9.558857142857145e-06, "loss": 0.259, "step": 27650 }, { "epoch": 384.17, "learning_rate": 9.547428571428571e-06, "loss": 0.272, "step": 27660 }, { "epoch": 384.3, "learning_rate": 9.536000000000002e-06, "loss": 0.2524, "step": 27670 }, { "epoch": 384.44, "learning_rate": 9.52457142857143e-06, "loss": 0.2541, "step": 27680 }, { "epoch": 384.58, "learning_rate": 9.513142857142857e-06, "loss": 0.2465, "step": 27690 }, { "epoch": 384.72, "learning_rate": 9.501714285714287e-06, "loss": 0.2559, "step": 27700 }, { "epoch": 384.86, "learning_rate": 9.490285714285715e-06, "loss": 0.2589, "step": 27710 }, { "epoch": 385.0, "learning_rate": 9.478857142857144e-06, "loss": 0.2532, "step": 27720 }, { "epoch": 385.0, "eval_loss": 0.6566269993782043, "eval_runtime": 129.8222, "eval_samples_per_second": 4.098, "eval_steps_per_second": 0.516, "eval_wer": 0.22092948511923893, "step": 27720 }, { "epoch": 385.14, "learning_rate": 9.467428571428572e-06, "loss": 0.2574, "step": 27730 }, { "epoch": 385.28, "learning_rate": 9.456e-06, "loss": 0.2518, "step": 27740 }, { "epoch": 385.42, "learning_rate": 9.444571428571429e-06, "loss": 0.2632, "step": 27750 }, { "epoch": 385.55, "learning_rate": 9.433142857142857e-06, "loss": 0.2542, "step": 27760 }, { "epoch": 385.69, "learning_rate": 9.421714285714286e-06, "loss": 0.2493, "step": 27770 }, { "epoch": 385.83, "learning_rate": 9.410285714285714e-06, "loss": 0.2572, "step": 27780 }, { "epoch": 385.97, "learning_rate": 9.398857142857144e-06, "loss": 0.2544, "step": 27790 }, { "epoch": 386.0, "eval_loss": 0.6639662981033325, "eval_runtime": 130.0418, "eval_samples_per_second": 4.091, "eval_steps_per_second": 0.515, "eval_wer": 0.223114996464614, "step": 27792 }, { "epoch": 386.11, "learning_rate": 9.387428571428571e-06, "loss": 0.2537, "step": 27800 }, { "epoch": 386.25, "learning_rate": 9.376000000000001e-06, "loss": 0.246, "step": 27810 }, { "epoch": 386.39, "learning_rate": 9.36457142857143e-06, "loss": 0.2468, "step": 27820 }, { "epoch": 386.53, "learning_rate": 9.353142857142858e-06, "loss": 0.2568, "step": 27830 }, { "epoch": 386.66, "learning_rate": 9.341714285714287e-06, "loss": 0.2531, "step": 27840 }, { "epoch": 386.8, "learning_rate": 9.330285714285715e-06, "loss": 0.25, "step": 27850 }, { "epoch": 386.94, "learning_rate": 9.318857142857144e-06, "loss": 0.2529, "step": 27860 }, { "epoch": 387.0, "eval_loss": 0.6531180739402771, "eval_runtime": 129.7768, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.2207366458828823, "step": 27864 }, { "epoch": 387.08, "learning_rate": 9.307428571428572e-06, "loss": 0.2555, "step": 27870 }, { "epoch": 387.22, "learning_rate": 9.296e-06, "loss": 0.2587, "step": 27880 }, { "epoch": 387.36, "learning_rate": 9.284571428571429e-06, "loss": 0.2508, "step": 27890 }, { "epoch": 387.5, "learning_rate": 9.273142857142859e-06, "loss": 0.2608, "step": 27900 }, { "epoch": 387.64, "learning_rate": 9.261714285714286e-06, "loss": 0.2538, "step": 27910 }, { "epoch": 387.78, "learning_rate": 9.250285714285714e-06, "loss": 0.2547, "step": 27920 }, { "epoch": 387.91, "learning_rate": 9.238857142857144e-06, "loss": 0.2578, "step": 27930 }, { "epoch": 388.0, "eval_loss": 0.6914970278739929, "eval_runtime": 129.8906, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.22015812817381245, "step": 27936 }, { "epoch": 388.06, "learning_rate": 9.227428571428573e-06, "loss": 0.2517, "step": 27940 }, { "epoch": 388.19, "learning_rate": 9.216000000000001e-06, "loss": 0.2504, "step": 27950 }, { "epoch": 388.33, "learning_rate": 9.20457142857143e-06, "loss": 0.255, "step": 27960 }, { "epoch": 388.47, "learning_rate": 9.193142857142858e-06, "loss": 0.2656, "step": 27970 }, { "epoch": 388.61, "learning_rate": 9.181714285714287e-06, "loss": 0.2436, "step": 27980 }, { "epoch": 388.75, "learning_rate": 9.170285714285715e-06, "loss": 0.2537, "step": 27990 }, { "epoch": 388.89, "learning_rate": 9.158857142857143e-06, "loss": 0.2517, "step": 28000 }, { "epoch": 389.0, "eval_loss": 0.6902373433113098, "eval_runtime": 129.9569, "eval_samples_per_second": 4.094, "eval_steps_per_second": 0.516, "eval_wer": 0.22382207366458828, "step": 28008 }, { "epoch": 389.03, "learning_rate": 9.147428571428572e-06, "loss": 0.2696, "step": 28010 }, { "epoch": 389.17, "learning_rate": 9.136e-06, "loss": 0.2596, "step": 28020 }, { "epoch": 389.3, "learning_rate": 9.124571428571429e-06, "loss": 0.2537, "step": 28030 }, { "epoch": 389.44, "learning_rate": 9.113142857142859e-06, "loss": 0.2599, "step": 28040 }, { "epoch": 389.58, "learning_rate": 9.101714285714286e-06, "loss": 0.2403, "step": 28050 }, { "epoch": 389.72, "learning_rate": 9.090285714285714e-06, "loss": 0.2612, "step": 28060 }, { "epoch": 389.86, "learning_rate": 9.078857142857144e-06, "loss": 0.2617, "step": 28070 }, { "epoch": 390.0, "learning_rate": 9.067428571428573e-06, "loss": 0.2453, "step": 28080 }, { "epoch": 390.0, "eval_loss": 0.6727211475372314, "eval_runtime": 130.2932, "eval_samples_per_second": 4.083, "eval_steps_per_second": 0.514, "eval_wer": 0.22485054959182363, "step": 28080 }, { "epoch": 390.14, "learning_rate": 9.056000000000001e-06, "loss": 0.2556, "step": 28090 }, { "epoch": 390.28, "learning_rate": 9.04457142857143e-06, "loss": 0.2669, "step": 28100 }, { "epoch": 390.42, "learning_rate": 9.033142857142858e-06, "loss": 0.2536, "step": 28110 }, { "epoch": 390.55, "learning_rate": 9.021714285714286e-06, "loss": 0.2529, "step": 28120 }, { "epoch": 390.69, "learning_rate": 9.010285714285715e-06, "loss": 0.2587, "step": 28130 }, { "epoch": 390.83, "learning_rate": 8.998857142857143e-06, "loss": 0.2549, "step": 28140 }, { "epoch": 390.97, "learning_rate": 8.987428571428572e-06, "loss": 0.2634, "step": 28150 }, { "epoch": 391.0, "eval_loss": 0.6666874289512634, "eval_runtime": 129.2636, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.22350067493732725, "step": 28152 }, { "epoch": 391.11, "learning_rate": 8.976e-06, "loss": 0.2482, "step": 28160 }, { "epoch": 391.25, "learning_rate": 8.964571428571429e-06, "loss": 0.2563, "step": 28170 }, { "epoch": 391.39, "learning_rate": 8.953142857142859e-06, "loss": 0.2513, "step": 28180 }, { "epoch": 391.53, "learning_rate": 8.941714285714287e-06, "loss": 0.2536, "step": 28190 }, { "epoch": 391.66, "learning_rate": 8.930285714285714e-06, "loss": 0.2545, "step": 28200 }, { "epoch": 391.8, "learning_rate": 8.918857142857144e-06, "loss": 0.242, "step": 28210 }, { "epoch": 391.94, "learning_rate": 8.907428571428572e-06, "loss": 0.2515, "step": 28220 }, { "epoch": 392.0, "eval_loss": 0.6553586721420288, "eval_runtime": 129.7533, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.22118660410104776, "step": 28224 }, { "epoch": 392.08, "learning_rate": 8.896000000000001e-06, "loss": 0.2411, "step": 28230 }, { "epoch": 392.22, "learning_rate": 8.88457142857143e-06, "loss": 0.258, "step": 28240 }, { "epoch": 392.36, "learning_rate": 8.873142857142858e-06, "loss": 0.2467, "step": 28250 }, { "epoch": 392.5, "learning_rate": 8.861714285714286e-06, "loss": 0.2471, "step": 28260 }, { "epoch": 392.64, "learning_rate": 8.850285714285715e-06, "loss": 0.2503, "step": 28270 }, { "epoch": 392.78, "learning_rate": 8.838857142857143e-06, "loss": 0.2445, "step": 28280 }, { "epoch": 392.91, "learning_rate": 8.827428571428572e-06, "loss": 0.249, "step": 28290 }, { "epoch": 393.0, "eval_loss": 0.6671547293663025, "eval_runtime": 130.329, "eval_samples_per_second": 4.082, "eval_steps_per_second": 0.514, "eval_wer": 0.2213794433374044, "step": 28296 }, { "epoch": 393.06, "learning_rate": 8.816000000000002e-06, "loss": 0.2556, "step": 28300 }, { "epoch": 393.19, "learning_rate": 8.804571428571428e-06, "loss": 0.2631, "step": 28310 }, { "epoch": 393.33, "learning_rate": 8.793142857142859e-06, "loss": 0.2469, "step": 28320 }, { "epoch": 393.47, "learning_rate": 8.781714285714287e-06, "loss": 0.2525, "step": 28330 }, { "epoch": 393.61, "learning_rate": 8.770285714285714e-06, "loss": 0.249, "step": 28340 }, { "epoch": 393.75, "learning_rate": 8.758857142857144e-06, "loss": 0.2489, "step": 28350 }, { "epoch": 393.89, "learning_rate": 8.747428571428572e-06, "loss": 0.2524, "step": 28360 }, { "epoch": 394.0, "eval_loss": 0.6693130135536194, "eval_runtime": 129.6887, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.21642990293758438, "step": 28368 }, { "epoch": 394.03, "learning_rate": 8.736e-06, "loss": 0.2712, "step": 28370 }, { "epoch": 394.17, "learning_rate": 8.72457142857143e-06, "loss": 0.2597, "step": 28380 }, { "epoch": 394.3, "learning_rate": 8.713142857142858e-06, "loss": 0.2507, "step": 28390 }, { "epoch": 394.44, "learning_rate": 8.701714285714286e-06, "loss": 0.245, "step": 28400 }, { "epoch": 394.58, "learning_rate": 8.690285714285716e-06, "loss": 0.2482, "step": 28410 }, { "epoch": 394.72, "learning_rate": 8.678857142857143e-06, "loss": 0.2603, "step": 28420 }, { "epoch": 394.86, "learning_rate": 8.667428571428571e-06, "loss": 0.2503, "step": 28430 }, { "epoch": 395.0, "learning_rate": 8.656000000000001e-06, "loss": 0.2529, "step": 28440 }, { "epoch": 395.0, "eval_loss": 0.6571841835975647, "eval_runtime": 129.9168, "eval_samples_per_second": 4.095, "eval_steps_per_second": 0.516, "eval_wer": 0.21861541428295944, "step": 28440 }, { "epoch": 395.14, "learning_rate": 8.644571428571428e-06, "loss": 0.263, "step": 28450 }, { "epoch": 395.28, "learning_rate": 8.633142857142858e-06, "loss": 0.2533, "step": 28460 }, { "epoch": 395.42, "learning_rate": 8.621714285714287e-06, "loss": 0.2524, "step": 28470 }, { "epoch": 395.55, "learning_rate": 8.610285714285715e-06, "loss": 0.2531, "step": 28480 }, { "epoch": 395.69, "learning_rate": 8.598857142857144e-06, "loss": 0.2531, "step": 28490 }, { "epoch": 395.83, "learning_rate": 8.587428571428572e-06, "loss": 0.2449, "step": 28500 }, { "epoch": 395.97, "learning_rate": 8.576e-06, "loss": 0.256, "step": 28510 }, { "epoch": 396.0, "eval_loss": 0.6419864892959595, "eval_runtime": 129.5944, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.21707270039210644, "step": 28512 }, { "epoch": 396.11, "learning_rate": 8.564571428571429e-06, "loss": 0.2492, "step": 28520 }, { "epoch": 396.25, "learning_rate": 8.553142857142857e-06, "loss": 0.2507, "step": 28530 }, { "epoch": 396.39, "learning_rate": 8.541714285714286e-06, "loss": 0.2478, "step": 28540 }, { "epoch": 396.53, "learning_rate": 8.530285714285716e-06, "loss": 0.2467, "step": 28550 }, { "epoch": 396.66, "learning_rate": 8.518857142857143e-06, "loss": 0.2588, "step": 28560 }, { "epoch": 396.8, "learning_rate": 8.507428571428571e-06, "loss": 0.2488, "step": 28570 }, { "epoch": 396.94, "learning_rate": 8.496000000000001e-06, "loss": 0.2498, "step": 28580 }, { "epoch": 397.0, "eval_loss": 0.6711761355400085, "eval_runtime": 129.4421, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.2168155814102976, "step": 28584 }, { "epoch": 397.08, "learning_rate": 8.48457142857143e-06, "loss": 0.2568, "step": 28590 }, { "epoch": 397.22, "learning_rate": 8.473142857142858e-06, "loss": 0.2615, "step": 28600 }, { "epoch": 397.36, "learning_rate": 8.461714285714287e-06, "loss": 0.2436, "step": 28610 }, { "epoch": 397.5, "learning_rate": 8.450285714285715e-06, "loss": 0.2541, "step": 28620 }, { "epoch": 397.64, "learning_rate": 8.438857142857144e-06, "loss": 0.2434, "step": 28630 }, { "epoch": 397.78, "learning_rate": 8.427428571428572e-06, "loss": 0.2535, "step": 28640 }, { "epoch": 397.91, "learning_rate": 8.416e-06, "loss": 0.2565, "step": 28650 }, { "epoch": 398.0, "eval_loss": 0.6890328526496887, "eval_runtime": 130.273, "eval_samples_per_second": 4.084, "eval_steps_per_second": 0.514, "eval_wer": 0.2175226586102719, "step": 28656 }, { "epoch": 398.06, "learning_rate": 8.40457142857143e-06, "loss": 0.2539, "step": 28660 }, { "epoch": 398.19, "learning_rate": 8.393142857142857e-06, "loss": 0.2512, "step": 28670 }, { "epoch": 398.33, "learning_rate": 8.381714285714286e-06, "loss": 0.242, "step": 28680 }, { "epoch": 398.47, "learning_rate": 8.370285714285716e-06, "loss": 0.2524, "step": 28690 }, { "epoch": 398.61, "learning_rate": 8.358857142857143e-06, "loss": 0.2473, "step": 28700 }, { "epoch": 398.75, "learning_rate": 8.347428571428573e-06, "loss": 0.2474, "step": 28710 }, { "epoch": 398.89, "learning_rate": 8.336000000000001e-06, "loss": 0.2477, "step": 28720 }, { "epoch": 399.0, "eval_loss": 0.690473198890686, "eval_runtime": 129.785, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.218486854792055, "step": 28728 }, { "epoch": 399.03, "learning_rate": 8.32457142857143e-06, "loss": 0.2537, "step": 28730 }, { "epoch": 399.17, "learning_rate": 8.313142857142858e-06, "loss": 0.2481, "step": 28740 }, { "epoch": 399.3, "learning_rate": 8.301714285714286e-06, "loss": 0.2424, "step": 28750 }, { "epoch": 399.44, "learning_rate": 8.290285714285715e-06, "loss": 0.2514, "step": 28760 }, { "epoch": 399.58, "learning_rate": 8.278857142857143e-06, "loss": 0.2415, "step": 28770 }, { "epoch": 399.72, "learning_rate": 8.267428571428572e-06, "loss": 0.2547, "step": 28780 }, { "epoch": 399.86, "learning_rate": 8.256e-06, "loss": 0.2451, "step": 28790 }, { "epoch": 400.0, "learning_rate": 8.24457142857143e-06, "loss": 0.2486, "step": 28800 }, { "epoch": 400.0, "eval_loss": 0.7009914517402649, "eval_runtime": 129.6901, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2190653725011249, "step": 28800 }, { "epoch": 400.14, "learning_rate": 8.233142857142857e-06, "loss": 0.2506, "step": 28810 }, { "epoch": 400.28, "learning_rate": 8.221714285714286e-06, "loss": 0.2462, "step": 28820 }, { "epoch": 400.42, "learning_rate": 8.210285714285716e-06, "loss": 0.2441, "step": 28830 }, { "epoch": 400.55, "learning_rate": 8.198857142857144e-06, "loss": 0.2555, "step": 28840 }, { "epoch": 400.69, "learning_rate": 8.187428571428573e-06, "loss": 0.2561, "step": 28850 }, { "epoch": 400.83, "learning_rate": 8.176000000000001e-06, "loss": 0.2508, "step": 28860 }, { "epoch": 400.97, "learning_rate": 8.16457142857143e-06, "loss": 0.259, "step": 28870 }, { "epoch": 401.0, "eval_loss": 0.6982916593551636, "eval_runtime": 130.3878, "eval_samples_per_second": 4.08, "eval_steps_per_second": 0.514, "eval_wer": 0.21694414090120204, "step": 28872 }, { "epoch": 401.11, "learning_rate": 8.153142857142858e-06, "loss": 0.2518, "step": 28880 }, { "epoch": 401.25, "learning_rate": 8.141714285714286e-06, "loss": 0.2487, "step": 28890 }, { "epoch": 401.39, "learning_rate": 8.130285714285715e-06, "loss": 0.2557, "step": 28900 }, { "epoch": 401.53, "learning_rate": 8.118857142857143e-06, "loss": 0.2593, "step": 28910 }, { "epoch": 401.66, "learning_rate": 8.107428571428572e-06, "loss": 0.2571, "step": 28920 }, { "epoch": 401.8, "learning_rate": 8.096e-06, "loss": 0.2502, "step": 28930 }, { "epoch": 401.94, "learning_rate": 8.08457142857143e-06, "loss": 0.2555, "step": 28940 }, { "epoch": 402.0, "eval_loss": 0.6877124905586243, "eval_runtime": 130.0205, "eval_samples_per_second": 4.092, "eval_steps_per_second": 0.515, "eval_wer": 0.21887253326476827, "step": 28944 }, { "epoch": 402.08, "learning_rate": 8.073142857142859e-06, "loss": 0.2494, "step": 28950 }, { "epoch": 402.22, "learning_rate": 8.061714285714285e-06, "loss": 0.2549, "step": 28960 }, { "epoch": 402.36, "learning_rate": 8.050285714285716e-06, "loss": 0.2405, "step": 28970 }, { "epoch": 402.5, "learning_rate": 8.038857142857144e-06, "loss": 0.2575, "step": 28980 }, { "epoch": 402.64, "learning_rate": 8.027428571428572e-06, "loss": 0.2401, "step": 28990 }, { "epoch": 402.78, "learning_rate": 8.016e-06, "loss": 0.2463, "step": 29000 }, { "epoch": 402.91, "learning_rate": 8.00457142857143e-06, "loss": 0.2579, "step": 29010 }, { "epoch": 403.0, "eval_loss": 0.6864159107208252, "eval_runtime": 130.3177, "eval_samples_per_second": 4.082, "eval_steps_per_second": 0.514, "eval_wer": 0.21880825351931607, "step": 29016 }, { "epoch": 403.06, "learning_rate": 7.993142857142858e-06, "loss": 0.2519, "step": 29020 }, { "epoch": 403.19, "learning_rate": 7.981714285714286e-06, "loss": 0.2559, "step": 29030 }, { "epoch": 403.33, "learning_rate": 7.970285714285715e-06, "loss": 0.2527, "step": 29040 }, { "epoch": 403.47, "learning_rate": 7.958857142857143e-06, "loss": 0.2462, "step": 29050 }, { "epoch": 403.61, "learning_rate": 7.947428571428573e-06, "loss": 0.2453, "step": 29060 }, { "epoch": 403.75, "learning_rate": 7.936e-06, "loss": 0.2519, "step": 29070 }, { "epoch": 403.89, "learning_rate": 7.92457142857143e-06, "loss": 0.2421, "step": 29080 }, { "epoch": 404.0, "eval_loss": 0.6603102087974548, "eval_runtime": 129.8266, "eval_samples_per_second": 4.098, "eval_steps_per_second": 0.516, "eval_wer": 0.2174583788648197, "step": 29088 }, { "epoch": 404.03, "learning_rate": 7.913142857142858e-06, "loss": 0.2522, "step": 29090 }, { "epoch": 404.17, "learning_rate": 7.901714285714285e-06, "loss": 0.2334, "step": 29100 }, { "epoch": 404.3, "learning_rate": 7.890285714285715e-06, "loss": 0.2452, "step": 29110 }, { "epoch": 404.44, "learning_rate": 7.878857142857144e-06, "loss": 0.2522, "step": 29120 }, { "epoch": 404.58, "learning_rate": 7.867428571428572e-06, "loss": 0.2412, "step": 29130 }, { "epoch": 404.72, "learning_rate": 7.856e-06, "loss": 0.2449, "step": 29140 }, { "epoch": 404.86, "learning_rate": 7.844571428571429e-06, "loss": 0.2381, "step": 29150 }, { "epoch": 405.0, "learning_rate": 7.833142857142858e-06, "loss": 0.2531, "step": 29160 }, { "epoch": 405.0, "eval_loss": 0.6881992816925049, "eval_runtime": 129.4749, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.2222793597737353, "step": 29160 }, { "epoch": 405.14, "learning_rate": 7.821714285714286e-06, "loss": 0.2534, "step": 29170 }, { "epoch": 405.28, "learning_rate": 7.810285714285714e-06, "loss": 0.2563, "step": 29180 }, { "epoch": 405.42, "learning_rate": 7.798857142857143e-06, "loss": 0.2443, "step": 29190 }, { "epoch": 405.55, "learning_rate": 7.787428571428573e-06, "loss": 0.2491, "step": 29200 }, { "epoch": 405.69, "learning_rate": 7.776e-06, "loss": 0.249, "step": 29210 }, { "epoch": 405.83, "learning_rate": 7.76457142857143e-06, "loss": 0.2542, "step": 29220 }, { "epoch": 405.97, "learning_rate": 7.754285714285715e-06, "loss": 0.254, "step": 29230 }, { "epoch": 406.0, "eval_loss": 0.6813198328018188, "eval_runtime": 129.6131, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.22092948511923893, "step": 29232 }, { "epoch": 406.11, "learning_rate": 7.742857142857144e-06, "loss": 0.2446, "step": 29240 }, { "epoch": 406.25, "learning_rate": 7.731428571428572e-06, "loss": 0.2471, "step": 29250 }, { "epoch": 406.39, "learning_rate": 7.72e-06, "loss": 0.2462, "step": 29260 }, { "epoch": 406.53, "learning_rate": 7.708571428571429e-06, "loss": 0.2566, "step": 29270 }, { "epoch": 406.66, "learning_rate": 7.697142857142858e-06, "loss": 0.2536, "step": 29280 }, { "epoch": 406.8, "learning_rate": 7.685714285714286e-06, "loss": 0.2457, "step": 29290 }, { "epoch": 406.94, "learning_rate": 7.674285714285714e-06, "loss": 0.2517, "step": 29300 }, { "epoch": 407.0, "eval_loss": 0.6707356572151184, "eval_runtime": 129.4546, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.22054380664652568, "step": 29304 }, { "epoch": 407.08, "learning_rate": 7.662857142857143e-06, "loss": 0.2553, "step": 29310 }, { "epoch": 407.22, "learning_rate": 7.651428571428571e-06, "loss": 0.2495, "step": 29320 }, { "epoch": 407.36, "learning_rate": 7.640000000000001e-06, "loss": 0.246, "step": 29330 }, { "epoch": 407.5, "learning_rate": 7.62857142857143e-06, "loss": 0.2443, "step": 29340 }, { "epoch": 407.64, "learning_rate": 7.617142857142857e-06, "loss": 0.2424, "step": 29350 }, { "epoch": 407.78, "learning_rate": 7.605714285714286e-06, "loss": 0.2488, "step": 29360 }, { "epoch": 407.91, "learning_rate": 7.594285714285715e-06, "loss": 0.2521, "step": 29370 }, { "epoch": 408.0, "eval_loss": 0.6835159659385681, "eval_runtime": 129.6284, "eval_samples_per_second": 4.104, "eval_steps_per_second": 0.517, "eval_wer": 0.22337211544642283, "step": 29376 }, { "epoch": 408.06, "learning_rate": 7.5828571428571444e-06, "loss": 0.2529, "step": 29380 }, { "epoch": 408.19, "learning_rate": 7.571428571428572e-06, "loss": 0.2515, "step": 29390 }, { "epoch": 408.33, "learning_rate": 7.5600000000000005e-06, "loss": 0.2492, "step": 29400 }, { "epoch": 408.47, "learning_rate": 7.54857142857143e-06, "loss": 0.2552, "step": 29410 }, { "epoch": 408.61, "learning_rate": 7.537142857142857e-06, "loss": 0.2407, "step": 29420 }, { "epoch": 408.75, "learning_rate": 7.525714285714286e-06, "loss": 0.2442, "step": 29430 }, { "epoch": 408.89, "learning_rate": 7.514285714285715e-06, "loss": 0.2494, "step": 29440 }, { "epoch": 409.0, "eval_loss": 0.6896212100982666, "eval_runtime": 129.4861, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.22163656231921322, "step": 29448 }, { "epoch": 409.03, "learning_rate": 7.502857142857144e-06, "loss": 0.2489, "step": 29450 }, { "epoch": 409.17, "learning_rate": 7.491428571428572e-06, "loss": 0.2486, "step": 29460 }, { "epoch": 409.3, "learning_rate": 7.48e-06, "loss": 0.2489, "step": 29470 }, { "epoch": 409.44, "learning_rate": 7.46857142857143e-06, "loss": 0.2519, "step": 29480 }, { "epoch": 409.58, "learning_rate": 7.457142857142857e-06, "loss": 0.2452, "step": 29490 }, { "epoch": 409.72, "learning_rate": 7.445714285714286e-06, "loss": 0.2417, "step": 29500 }, { "epoch": 409.86, "learning_rate": 7.434285714285715e-06, "loss": 0.2361, "step": 29510 }, { "epoch": 410.0, "learning_rate": 7.422857142857144e-06, "loss": 0.2516, "step": 29520 }, { "epoch": 410.0, "eval_loss": 0.6759763956069946, "eval_runtime": 129.9723, "eval_samples_per_second": 4.093, "eval_steps_per_second": 0.515, "eval_wer": 0.22182940155556985, "step": 29520 }, { "epoch": 410.14, "learning_rate": 7.411428571428572e-06, "loss": 0.2425, "step": 29530 }, { "epoch": 410.28, "learning_rate": 7.4e-06, "loss": 0.2537, "step": 29540 }, { "epoch": 410.42, "learning_rate": 7.38857142857143e-06, "loss": 0.2496, "step": 29550 }, { "epoch": 410.55, "learning_rate": 7.377142857142858e-06, "loss": 0.2457, "step": 29560 }, { "epoch": 410.69, "learning_rate": 7.365714285714286e-06, "loss": 0.2528, "step": 29570 }, { "epoch": 410.83, "learning_rate": 7.354285714285715e-06, "loss": 0.2512, "step": 29580 }, { "epoch": 410.97, "learning_rate": 7.342857142857144e-06, "loss": 0.2605, "step": 29590 }, { "epoch": 411.0, "eval_loss": 0.7055128812789917, "eval_runtime": 129.8522, "eval_samples_per_second": 4.097, "eval_steps_per_second": 0.516, "eval_wer": 0.2206723661374301, "step": 29592 }, { "epoch": 411.11, "learning_rate": 7.331428571428572e-06, "loss": 0.2437, "step": 29600 }, { "epoch": 411.25, "learning_rate": 7.32e-06, "loss": 0.2398, "step": 29610 }, { "epoch": 411.39, "learning_rate": 7.3085714285714295e-06, "loss": 0.2465, "step": 29620 }, { "epoch": 411.53, "learning_rate": 7.297142857142858e-06, "loss": 0.2539, "step": 29630 }, { "epoch": 411.66, "learning_rate": 7.285714285714286e-06, "loss": 0.2453, "step": 29640 }, { "epoch": 411.8, "learning_rate": 7.274285714285715e-06, "loss": 0.2514, "step": 29650 }, { "epoch": 411.94, "learning_rate": 7.262857142857144e-06, "loss": 0.2514, "step": 29660 }, { "epoch": 412.0, "eval_loss": 0.6706816554069519, "eval_runtime": 130.0494, "eval_samples_per_second": 4.091, "eval_steps_per_second": 0.515, "eval_wer": 0.22324355595551842, "step": 29664 }, { "epoch": 412.08, "learning_rate": 7.251428571428572e-06, "loss": 0.2461, "step": 29670 }, { "epoch": 412.22, "learning_rate": 7.24e-06, "loss": 0.2426, "step": 29680 }, { "epoch": 412.36, "learning_rate": 7.2285714285714294e-06, "loss": 0.2393, "step": 29690 }, { "epoch": 412.5, "learning_rate": 7.217142857142858e-06, "loss": 0.2509, "step": 29700 }, { "epoch": 412.64, "learning_rate": 7.205714285714286e-06, "loss": 0.2497, "step": 29710 }, { "epoch": 412.78, "learning_rate": 7.194285714285715e-06, "loss": 0.2478, "step": 29720 }, { "epoch": 412.91, "learning_rate": 7.182857142857144e-06, "loss": 0.242, "step": 29730 }, { "epoch": 413.0, "eval_loss": 0.6853117942810059, "eval_runtime": 129.5551, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.2182940155556984, "step": 29736 }, { "epoch": 413.06, "learning_rate": 7.1714285714285725e-06, "loss": 0.248, "step": 29740 }, { "epoch": 413.19, "learning_rate": 7.16e-06, "loss": 0.2494, "step": 29750 }, { "epoch": 413.33, "learning_rate": 7.148571428571429e-06, "loss": 0.2393, "step": 29760 }, { "epoch": 413.47, "learning_rate": 7.137142857142858e-06, "loss": 0.252, "step": 29770 }, { "epoch": 413.61, "learning_rate": 7.125714285714286e-06, "loss": 0.2466, "step": 29780 }, { "epoch": 413.75, "learning_rate": 7.114285714285715e-06, "loss": 0.2545, "step": 29790 }, { "epoch": 413.89, "learning_rate": 7.102857142857144e-06, "loss": 0.2505, "step": 29800 }, { "epoch": 414.0, "eval_loss": 0.6869497895240784, "eval_runtime": 130.1983, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.22324355595551842, "step": 29808 }, { "epoch": 414.03, "learning_rate": 7.091428571428572e-06, "loss": 0.2527, "step": 29810 }, { "epoch": 414.17, "learning_rate": 7.08e-06, "loss": 0.2613, "step": 29820 }, { "epoch": 414.3, "learning_rate": 7.068571428571429e-06, "loss": 0.2561, "step": 29830 }, { "epoch": 414.44, "learning_rate": 7.057142857142858e-06, "loss": 0.2546, "step": 29840 }, { "epoch": 414.58, "learning_rate": 7.045714285714287e-06, "loss": 0.2459, "step": 29850 }, { "epoch": 414.72, "learning_rate": 7.034285714285715e-06, "loss": 0.2573, "step": 29860 }, { "epoch": 414.86, "learning_rate": 7.022857142857144e-06, "loss": 0.2483, "step": 29870 }, { "epoch": 415.0, "learning_rate": 7.011428571428572e-06, "loss": 0.2398, "step": 29880 }, { "epoch": 415.0, "eval_loss": 0.6732475161552429, "eval_runtime": 129.681, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.22279359773735297, "step": 29880 }, { "epoch": 415.14, "learning_rate": 7e-06, "loss": 0.2589, "step": 29890 }, { "epoch": 415.28, "learning_rate": 6.988571428571429e-06, "loss": 0.2534, "step": 29900 }, { "epoch": 415.42, "learning_rate": 6.977142857142858e-06, "loss": 0.259, "step": 29910 }, { "epoch": 415.55, "learning_rate": 6.965714285714287e-06, "loss": 0.2467, "step": 29920 }, { "epoch": 415.69, "learning_rate": 6.9542857142857145e-06, "loss": 0.255, "step": 29930 }, { "epoch": 415.83, "learning_rate": 6.942857142857144e-06, "loss": 0.2447, "step": 29940 }, { "epoch": 415.97, "learning_rate": 6.931428571428572e-06, "loss": 0.2549, "step": 29950 }, { "epoch": 416.0, "eval_loss": 0.6558857560157776, "eval_runtime": 129.7861, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.22221508002828308, "step": 29952 }, { "epoch": 416.11, "learning_rate": 6.92e-06, "loss": 0.2482, "step": 29960 }, { "epoch": 416.25, "learning_rate": 6.908571428571429e-06, "loss": 0.2584, "step": 29970 }, { "epoch": 416.39, "learning_rate": 6.8971428571428575e-06, "loss": 0.2465, "step": 29980 }, { "epoch": 416.53, "learning_rate": 6.885714285714287e-06, "loss": 0.2496, "step": 29990 }, { "epoch": 416.66, "learning_rate": 6.874285714285714e-06, "loss": 0.2567, "step": 30000 }, { "epoch": 416.8, "learning_rate": 6.862857142857144e-06, "loss": 0.2453, "step": 30010 }, { "epoch": 416.94, "learning_rate": 6.851428571428572e-06, "loss": 0.2496, "step": 30020 }, { "epoch": 417.0, "eval_loss": 0.6674957275390625, "eval_runtime": 129.7036, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2231792762100662, "step": 30024 }, { "epoch": 417.08, "learning_rate": 6.8400000000000014e-06, "loss": 0.2499, "step": 30030 }, { "epoch": 417.22, "learning_rate": 6.828571428571429e-06, "loss": 0.2571, "step": 30040 }, { "epoch": 417.36, "learning_rate": 6.8171428571428575e-06, "loss": 0.2337, "step": 30050 }, { "epoch": 417.5, "learning_rate": 6.805714285714287e-06, "loss": 0.2533, "step": 30060 }, { "epoch": 417.64, "learning_rate": 6.794285714285714e-06, "loss": 0.2448, "step": 30070 }, { "epoch": 417.78, "learning_rate": 6.782857142857144e-06, "loss": 0.2485, "step": 30080 }, { "epoch": 417.91, "learning_rate": 6.771428571428572e-06, "loss": 0.2538, "step": 30090 }, { "epoch": 418.0, "eval_loss": 0.6694636344909668, "eval_runtime": 129.8776, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.2239506331554927, "step": 30096 }, { "epoch": 418.06, "learning_rate": 6.760000000000001e-06, "loss": 0.253, "step": 30100 }, { "epoch": 418.19, "learning_rate": 6.748571428571429e-06, "loss": 0.2528, "step": 30110 }, { "epoch": 418.33, "learning_rate": 6.737142857142857e-06, "loss": 0.2379, "step": 30120 }, { "epoch": 418.47, "learning_rate": 6.725714285714287e-06, "loss": 0.2484, "step": 30130 }, { "epoch": 418.61, "learning_rate": 6.714285714285714e-06, "loss": 0.2451, "step": 30140 }, { "epoch": 418.75, "learning_rate": 6.7028571428571435e-06, "loss": 0.2565, "step": 30150 }, { "epoch": 418.89, "learning_rate": 6.691428571428572e-06, "loss": 0.246, "step": 30160 }, { "epoch": 419.0, "eval_loss": 0.6917106509208679, "eval_runtime": 129.9987, "eval_samples_per_second": 4.092, "eval_steps_per_second": 0.515, "eval_wer": 0.22684322170084206, "step": 30168 }, { "epoch": 419.03, "learning_rate": 6.680000000000001e-06, "loss": 0.2443, "step": 30170 }, { "epoch": 419.17, "learning_rate": 6.668571428571429e-06, "loss": 0.2549, "step": 30180 }, { "epoch": 419.3, "learning_rate": 6.657142857142857e-06, "loss": 0.245, "step": 30190 }, { "epoch": 419.44, "learning_rate": 6.645714285714287e-06, "loss": 0.2573, "step": 30200 }, { "epoch": 419.58, "learning_rate": 6.634285714285715e-06, "loss": 0.245, "step": 30210 }, { "epoch": 419.72, "learning_rate": 6.6228571428571435e-06, "loss": 0.2542, "step": 30220 }, { "epoch": 419.86, "learning_rate": 6.611428571428572e-06, "loss": 0.2483, "step": 30230 }, { "epoch": 420.0, "learning_rate": 6.600000000000001e-06, "loss": 0.2462, "step": 30240 }, { "epoch": 420.0, "eval_loss": 0.6842324733734131, "eval_runtime": 129.9543, "eval_samples_per_second": 4.094, "eval_steps_per_second": 0.516, "eval_wer": 0.2287716140644083, "step": 30240 }, { "epoch": 420.14, "learning_rate": 6.588571428571429e-06, "loss": 0.2597, "step": 30250 }, { "epoch": 420.28, "learning_rate": 6.577142857142857e-06, "loss": 0.2496, "step": 30260 }, { "epoch": 420.42, "learning_rate": 6.5657142857142865e-06, "loss": 0.2465, "step": 30270 }, { "epoch": 420.55, "learning_rate": 6.554285714285715e-06, "loss": 0.2554, "step": 30280 }, { "epoch": 420.69, "learning_rate": 6.542857142857143e-06, "loss": 0.2514, "step": 30290 }, { "epoch": 420.83, "learning_rate": 6.531428571428572e-06, "loss": 0.2455, "step": 30300 }, { "epoch": 420.97, "learning_rate": 6.520000000000001e-06, "loss": 0.2527, "step": 30310 }, { "epoch": 421.0, "eval_loss": 0.6627729535102844, "eval_runtime": 130.3292, "eval_samples_per_second": 4.082, "eval_steps_per_second": 0.514, "eval_wer": 0.2207366458828823, "step": 30312 }, { "epoch": 421.11, "learning_rate": 6.5085714285714295e-06, "loss": 0.247, "step": 30320 }, { "epoch": 421.25, "learning_rate": 6.497142857142857e-06, "loss": 0.2522, "step": 30330 }, { "epoch": 421.39, "learning_rate": 6.485714285714286e-06, "loss": 0.2464, "step": 30340 }, { "epoch": 421.53, "learning_rate": 6.474285714285715e-06, "loss": 0.2481, "step": 30350 }, { "epoch": 421.66, "learning_rate": 6.462857142857143e-06, "loss": 0.2501, "step": 30360 }, { "epoch": 421.8, "learning_rate": 6.451428571428572e-06, "loss": 0.2353, "step": 30370 }, { "epoch": 421.94, "learning_rate": 6.440000000000001e-06, "loss": 0.2469, "step": 30380 }, { "epoch": 422.0, "eval_loss": 0.6683416962623596, "eval_runtime": 129.4685, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.518, "eval_wer": 0.2224721990100919, "step": 30384 }, { "epoch": 422.08, "learning_rate": 6.4285714285714295e-06, "loss": 0.2439, "step": 30390 }, { "epoch": 422.22, "learning_rate": 6.417142857142857e-06, "loss": 0.2479, "step": 30400 }, { "epoch": 422.36, "learning_rate": 6.405714285714286e-06, "loss": 0.248, "step": 30410 }, { "epoch": 422.5, "learning_rate": 6.394285714285715e-06, "loss": 0.2419, "step": 30420 }, { "epoch": 422.64, "learning_rate": 6.382857142857143e-06, "loss": 0.2524, "step": 30430 }, { "epoch": 422.78, "learning_rate": 6.371428571428572e-06, "loss": 0.2432, "step": 30440 }, { "epoch": 422.91, "learning_rate": 6.360000000000001e-06, "loss": 0.2493, "step": 30450 }, { "epoch": 423.0, "eval_loss": 0.6632475852966309, "eval_runtime": 130.7693, "eval_samples_per_second": 4.068, "eval_steps_per_second": 0.512, "eval_wer": 0.21887253326476827, "step": 30456 }, { "epoch": 423.06, "learning_rate": 6.348571428571429e-06, "loss": 0.2421, "step": 30460 }, { "epoch": 423.19, "learning_rate": 6.337142857142857e-06, "loss": 0.2507, "step": 30470 }, { "epoch": 423.33, "learning_rate": 6.325714285714286e-06, "loss": 0.2447, "step": 30480 }, { "epoch": 423.47, "learning_rate": 6.314285714285715e-06, "loss": 0.254, "step": 30490 }, { "epoch": 423.61, "learning_rate": 6.302857142857144e-06, "loss": 0.2323, "step": 30500 }, { "epoch": 423.75, "learning_rate": 6.2914285714285716e-06, "loss": 0.2505, "step": 30510 }, { "epoch": 423.89, "learning_rate": 6.280000000000001e-06, "loss": 0.239, "step": 30520 }, { "epoch": 424.0, "eval_loss": 0.6848077774047852, "eval_runtime": 131.0805, "eval_samples_per_second": 4.059, "eval_steps_per_second": 0.511, "eval_wer": 0.2197724497010992, "step": 30528 }, { "epoch": 424.03, "learning_rate": 6.268571428571429e-06, "loss": 0.2457, "step": 30530 }, { "epoch": 424.17, "learning_rate": 6.257142857142857e-06, "loss": 0.2461, "step": 30540 }, { "epoch": 424.3, "learning_rate": 6.245714285714286e-06, "loss": 0.2379, "step": 30550 }, { "epoch": 424.44, "learning_rate": 6.234285714285715e-06, "loss": 0.2493, "step": 30560 }, { "epoch": 424.58, "learning_rate": 6.222857142857144e-06, "loss": 0.2403, "step": 30570 }, { "epoch": 424.72, "learning_rate": 6.2114285714285715e-06, "loss": 0.2461, "step": 30580 }, { "epoch": 424.86, "learning_rate": 6.200000000000001e-06, "loss": 0.2383, "step": 30590 }, { "epoch": 425.0, "learning_rate": 6.188571428571429e-06, "loss": 0.2373, "step": 30600 }, { "epoch": 425.0, "eval_loss": 0.6833525896072388, "eval_runtime": 130.5966, "eval_samples_per_second": 4.074, "eval_steps_per_second": 0.513, "eval_wer": 0.2223436395191875, "step": 30600 }, { "epoch": 425.14, "learning_rate": 6.177142857142857e-06, "loss": 0.2404, "step": 30610 }, { "epoch": 425.28, "learning_rate": 6.165714285714286e-06, "loss": 0.2458, "step": 30620 }, { "epoch": 425.42, "learning_rate": 6.1542857142857145e-06, "loss": 0.239, "step": 30630 }, { "epoch": 425.55, "learning_rate": 6.142857142857144e-06, "loss": 0.2344, "step": 30640 }, { "epoch": 425.69, "learning_rate": 6.131428571428571e-06, "loss": 0.2529, "step": 30650 }, { "epoch": 425.83, "learning_rate": 6.120000000000001e-06, "loss": 0.2365, "step": 30660 }, { "epoch": 425.97, "learning_rate": 6.108571428571429e-06, "loss": 0.245, "step": 30670 }, { "epoch": 426.0, "eval_loss": 0.6901674270629883, "eval_runtime": 131.588, "eval_samples_per_second": 4.043, "eval_steps_per_second": 0.509, "eval_wer": 0.22510766857363246, "step": 30672 }, { "epoch": 426.11, "learning_rate": 6.097142857142858e-06, "loss": 0.2489, "step": 30680 }, { "epoch": 426.25, "learning_rate": 6.085714285714286e-06, "loss": 0.2377, "step": 30690 }, { "epoch": 426.39, "learning_rate": 6.0742857142857145e-06, "loss": 0.2371, "step": 30700 }, { "epoch": 426.53, "learning_rate": 6.062857142857144e-06, "loss": 0.2483, "step": 30710 }, { "epoch": 426.66, "learning_rate": 6.051428571428571e-06, "loss": 0.2421, "step": 30720 }, { "epoch": 426.8, "learning_rate": 6.040000000000001e-06, "loss": 0.2445, "step": 30730 }, { "epoch": 426.94, "learning_rate": 6.028571428571429e-06, "loss": 0.239, "step": 30740 }, { "epoch": 427.0, "eval_loss": 0.6916705965995789, "eval_runtime": 129.5053, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.2223436395191875, "step": 30744 }, { "epoch": 427.08, "learning_rate": 6.017142857142858e-06, "loss": 0.2466, "step": 30750 }, { "epoch": 427.22, "learning_rate": 6.005714285714286e-06, "loss": 0.2602, "step": 30760 }, { "epoch": 427.36, "learning_rate": 5.994285714285714e-06, "loss": 0.229, "step": 30770 }, { "epoch": 427.5, "learning_rate": 5.982857142857144e-06, "loss": 0.2461, "step": 30780 }, { "epoch": 427.64, "learning_rate": 5.971428571428572e-06, "loss": 0.2327, "step": 30790 }, { "epoch": 427.78, "learning_rate": 5.9600000000000005e-06, "loss": 0.2326, "step": 30800 }, { "epoch": 427.91, "learning_rate": 5.948571428571429e-06, "loss": 0.2441, "step": 30810 }, { "epoch": 428.0, "eval_loss": 0.6858615875244141, "eval_runtime": 130.0566, "eval_samples_per_second": 4.091, "eval_steps_per_second": 0.515, "eval_wer": 0.22324355595551842, "step": 30816 }, { "epoch": 428.06, "learning_rate": 5.937142857142858e-06, "loss": 0.2468, "step": 30820 }, { "epoch": 428.19, "learning_rate": 5.925714285714286e-06, "loss": 0.2507, "step": 30830 }, { "epoch": 428.33, "learning_rate": 5.914285714285714e-06, "loss": 0.2463, "step": 30840 }, { "epoch": 428.47, "learning_rate": 5.9028571428571436e-06, "loss": 0.2513, "step": 30850 }, { "epoch": 428.61, "learning_rate": 5.891428571428572e-06, "loss": 0.2329, "step": 30860 }, { "epoch": 428.75, "learning_rate": 5.8800000000000005e-06, "loss": 0.2449, "step": 30870 }, { "epoch": 428.89, "learning_rate": 5.868571428571429e-06, "loss": 0.2306, "step": 30880 }, { "epoch": 429.0, "eval_loss": 0.6843674778938293, "eval_runtime": 129.7058, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2208009256283345, "step": 30888 }, { "epoch": 429.03, "learning_rate": 5.857142857142858e-06, "loss": 0.2384, "step": 30890 }, { "epoch": 429.17, "learning_rate": 5.845714285714286e-06, "loss": 0.2536, "step": 30900 }, { "epoch": 429.3, "learning_rate": 5.834285714285714e-06, "loss": 0.2461, "step": 30910 }, { "epoch": 429.44, "learning_rate": 5.8228571428571435e-06, "loss": 0.2508, "step": 30920 }, { "epoch": 429.58, "learning_rate": 5.811428571428572e-06, "loss": 0.243, "step": 30930 }, { "epoch": 429.72, "learning_rate": 5.8e-06, "loss": 0.244, "step": 30940 }, { "epoch": 429.86, "learning_rate": 5.788571428571429e-06, "loss": 0.2375, "step": 30950 }, { "epoch": 430.0, "learning_rate": 5.777142857142858e-06, "loss": 0.2373, "step": 30960 }, { "epoch": 430.0, "eval_loss": 0.6740304231643677, "eval_runtime": 129.8193, "eval_samples_per_second": 4.098, "eval_steps_per_second": 0.516, "eval_wer": 0.218486854792055, "step": 30960 }, { "epoch": 430.14, "learning_rate": 5.7657142857142865e-06, "loss": 0.244, "step": 30970 }, { "epoch": 430.28, "learning_rate": 5.754285714285714e-06, "loss": 0.2495, "step": 30980 }, { "epoch": 430.42, "learning_rate": 5.742857142857143e-06, "loss": 0.2444, "step": 30990 }, { "epoch": 430.55, "learning_rate": 5.731428571428572e-06, "loss": 0.238, "step": 31000 }, { "epoch": 430.69, "learning_rate": 5.72e-06, "loss": 0.2431, "step": 31010 }, { "epoch": 430.83, "learning_rate": 5.708571428571429e-06, "loss": 0.2346, "step": 31020 }, { "epoch": 430.97, "learning_rate": 5.697142857142858e-06, "loss": 0.2495, "step": 31030 }, { "epoch": 431.0, "eval_loss": 0.6822530627250671, "eval_runtime": 129.3213, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2214437230828566, "step": 31032 }, { "epoch": 431.11, "learning_rate": 5.6857142857142865e-06, "loss": 0.2405, "step": 31040 }, { "epoch": 431.25, "learning_rate": 5.674285714285714e-06, "loss": 0.2307, "step": 31050 }, { "epoch": 431.39, "learning_rate": 5.662857142857143e-06, "loss": 0.2432, "step": 31060 }, { "epoch": 431.53, "learning_rate": 5.651428571428572e-06, "loss": 0.2413, "step": 31070 }, { "epoch": 431.66, "learning_rate": 5.64e-06, "loss": 0.2423, "step": 31080 }, { "epoch": 431.8, "learning_rate": 5.628571428571429e-06, "loss": 0.2447, "step": 31090 }, { "epoch": 431.94, "learning_rate": 5.617142857142858e-06, "loss": 0.2457, "step": 31100 }, { "epoch": 432.0, "eval_loss": 0.6686000823974609, "eval_runtime": 130.2131, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.515, "eval_wer": 0.22189368130102205, "step": 31104 }, { "epoch": 432.08, "learning_rate": 5.605714285714286e-06, "loss": 0.2342, "step": 31110 }, { "epoch": 432.22, "learning_rate": 5.594285714285714e-06, "loss": 0.2438, "step": 31120 }, { "epoch": 432.36, "learning_rate": 5.582857142857143e-06, "loss": 0.2398, "step": 31130 }, { "epoch": 432.5, "learning_rate": 5.571428571428572e-06, "loss": 0.2419, "step": 31140 }, { "epoch": 432.64, "learning_rate": 5.560000000000001e-06, "loss": 0.2339, "step": 31150 }, { "epoch": 432.78, "learning_rate": 5.5485714285714286e-06, "loss": 0.2508, "step": 31160 }, { "epoch": 432.91, "learning_rate": 5.537142857142858e-06, "loss": 0.2474, "step": 31170 }, { "epoch": 433.0, "eval_loss": 0.6856159567832947, "eval_runtime": 129.9234, "eval_samples_per_second": 4.095, "eval_steps_per_second": 0.516, "eval_wer": 0.2215080028283088, "step": 31176 }, { "epoch": 433.06, "learning_rate": 5.525714285714286e-06, "loss": 0.2475, "step": 31180 }, { "epoch": 433.19, "learning_rate": 5.514285714285714e-06, "loss": 0.2533, "step": 31190 }, { "epoch": 433.33, "learning_rate": 5.502857142857143e-06, "loss": 0.2338, "step": 31200 }, { "epoch": 433.47, "learning_rate": 5.491428571428572e-06, "loss": 0.2392, "step": 31210 }, { "epoch": 433.61, "learning_rate": 5.480000000000001e-06, "loss": 0.2291, "step": 31220 }, { "epoch": 433.75, "learning_rate": 5.4685714285714285e-06, "loss": 0.2387, "step": 31230 }, { "epoch": 433.89, "learning_rate": 5.457142857142858e-06, "loss": 0.2434, "step": 31240 }, { "epoch": 434.0, "eval_loss": 0.687577486038208, "eval_runtime": 129.6817, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2199010091920036, "step": 31248 }, { "epoch": 434.03, "learning_rate": 5.445714285714286e-06, "loss": 0.2405, "step": 31250 }, { "epoch": 434.17, "learning_rate": 5.4342857142857155e-06, "loss": 0.2397, "step": 31260 }, { "epoch": 434.3, "learning_rate": 5.422857142857143e-06, "loss": 0.2351, "step": 31270 }, { "epoch": 434.44, "learning_rate": 5.4114285714285715e-06, "loss": 0.2446, "step": 31280 }, { "epoch": 434.58, "learning_rate": 5.400000000000001e-06, "loss": 0.2329, "step": 31290 }, { "epoch": 434.72, "learning_rate": 5.388571428571428e-06, "loss": 0.2451, "step": 31300 }, { "epoch": 434.86, "learning_rate": 5.377142857142858e-06, "loss": 0.2426, "step": 31310 }, { "epoch": 435.0, "learning_rate": 5.365714285714286e-06, "loss": 0.2377, "step": 31320 }, { "epoch": 435.0, "eval_loss": 0.6826874613761902, "eval_runtime": 130.0923, "eval_samples_per_second": 4.089, "eval_steps_per_second": 0.515, "eval_wer": 0.22337211544642283, "step": 31320 }, { "epoch": 435.14, "learning_rate": 5.354285714285715e-06, "loss": 0.2484, "step": 31330 }, { "epoch": 435.28, "learning_rate": 5.342857142857143e-06, "loss": 0.2458, "step": 31340 }, { "epoch": 435.42, "learning_rate": 5.3314285714285714e-06, "loss": 0.2436, "step": 31350 }, { "epoch": 435.55, "learning_rate": 5.320000000000001e-06, "loss": 0.2353, "step": 31360 }, { "epoch": 435.69, "learning_rate": 5.308571428571428e-06, "loss": 0.244, "step": 31370 }, { "epoch": 435.83, "learning_rate": 5.297142857142858e-06, "loss": 0.2265, "step": 31380 }, { "epoch": 435.97, "learning_rate": 5.285714285714286e-06, "loss": 0.2566, "step": 31390 }, { "epoch": 436.0, "eval_loss": 0.6920022368431091, "eval_runtime": 129.5338, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22131516359195216, "step": 31392 }, { "epoch": 436.11, "learning_rate": 5.274285714285715e-06, "loss": 0.2551, "step": 31400 }, { "epoch": 436.25, "learning_rate": 5.262857142857143e-06, "loss": 0.2349, "step": 31410 }, { "epoch": 436.39, "learning_rate": 5.251428571428571e-06, "loss": 0.2365, "step": 31420 }, { "epoch": 436.53, "learning_rate": 5.240000000000001e-06, "loss": 0.2419, "step": 31430 }, { "epoch": 436.66, "learning_rate": 5.22857142857143e-06, "loss": 0.2475, "step": 31440 }, { "epoch": 436.8, "learning_rate": 5.2171428571428575e-06, "loss": 0.2413, "step": 31450 }, { "epoch": 436.94, "learning_rate": 5.205714285714286e-06, "loss": 0.2384, "step": 31460 }, { "epoch": 437.0, "eval_loss": 0.6733819246292114, "eval_runtime": 144.8944, "eval_samples_per_second": 3.672, "eval_steps_per_second": 0.462, "eval_wer": 0.22337211544642283, "step": 31464 }, { "epoch": 437.08, "learning_rate": 5.194285714285715e-06, "loss": 0.2291, "step": 31470 }, { "epoch": 437.22, "learning_rate": 5.182857142857143e-06, "loss": 0.234, "step": 31480 }, { "epoch": 437.36, "learning_rate": 5.171428571428571e-06, "loss": 0.2382, "step": 31490 }, { "epoch": 437.5, "learning_rate": 5.1600000000000006e-06, "loss": 0.2403, "step": 31500 }, { "epoch": 437.64, "learning_rate": 5.14857142857143e-06, "loss": 0.2435, "step": 31510 }, { "epoch": 437.78, "learning_rate": 5.1371428571428574e-06, "loss": 0.2442, "step": 31520 }, { "epoch": 437.91, "learning_rate": 5.125714285714286e-06, "loss": 0.2477, "step": 31530 }, { "epoch": 438.0, "eval_loss": 0.699192225933075, "eval_runtime": 159.2166, "eval_samples_per_second": 3.341, "eval_steps_per_second": 0.421, "eval_wer": 0.22420775213730154, "step": 31536 }, { "epoch": 438.06, "learning_rate": 5.114285714285715e-06, "loss": 0.2458, "step": 31540 }, { "epoch": 438.19, "learning_rate": 5.102857142857143e-06, "loss": 0.2548, "step": 31550 }, { "epoch": 438.33, "learning_rate": 5.091428571428571e-06, "loss": 0.2373, "step": 31560 }, { "epoch": 438.47, "learning_rate": 5.0800000000000005e-06, "loss": 0.2549, "step": 31570 }, { "epoch": 438.61, "learning_rate": 5.06857142857143e-06, "loss": 0.2307, "step": 31580 }, { "epoch": 438.75, "learning_rate": 5.057142857142857e-06, "loss": 0.2382, "step": 31590 }, { "epoch": 438.89, "learning_rate": 5.045714285714286e-06, "loss": 0.2347, "step": 31600 }, { "epoch": 439.0, "eval_loss": 0.6836819648742676, "eval_runtime": 158.8674, "eval_samples_per_second": 3.349, "eval_steps_per_second": 0.422, "eval_wer": 0.22170084206466542, "step": 31608 }, { "epoch": 439.03, "learning_rate": 5.034285714285715e-06, "loss": 0.2503, "step": 31610 }, { "epoch": 439.17, "learning_rate": 5.0228571428571435e-06, "loss": 0.2492, "step": 31620 }, { "epoch": 439.3, "learning_rate": 5.011428571428571e-06, "loss": 0.2366, "step": 31630 }, { "epoch": 439.44, "learning_rate": 5e-06, "loss": 0.2422, "step": 31640 }, { "epoch": 439.58, "learning_rate": 4.988571428571429e-06, "loss": 0.2381, "step": 31650 }, { "epoch": 439.72, "learning_rate": 4.977142857142857e-06, "loss": 0.2454, "step": 31660 }, { "epoch": 439.86, "learning_rate": 4.965714285714286e-06, "loss": 0.2369, "step": 31670 }, { "epoch": 440.0, "learning_rate": 4.954285714285715e-06, "loss": 0.2345, "step": 31680 }, { "epoch": 440.0, "eval_loss": 0.6851758360862732, "eval_runtime": 157.8303, "eval_samples_per_second": 3.371, "eval_steps_per_second": 0.425, "eval_wer": 0.22215080028283088, "step": 31680 }, { "epoch": 440.14, "learning_rate": 4.9428571428571435e-06, "loss": 0.2462, "step": 31690 }, { "epoch": 440.28, "learning_rate": 4.931428571428572e-06, "loss": 0.2359, "step": 31700 }, { "epoch": 440.42, "learning_rate": 4.92e-06, "loss": 0.2444, "step": 31710 }, { "epoch": 440.55, "learning_rate": 4.90857142857143e-06, "loss": 0.2416, "step": 31720 }, { "epoch": 440.69, "learning_rate": 4.897142857142857e-06, "loss": 0.2446, "step": 31730 }, { "epoch": 440.83, "learning_rate": 4.885714285714286e-06, "loss": 0.2396, "step": 31740 }, { "epoch": 440.97, "learning_rate": 4.874285714285715e-06, "loss": 0.2457, "step": 31750 }, { "epoch": 441.0, "eval_loss": 0.6891138553619385, "eval_runtime": 157.0837, "eval_samples_per_second": 3.387, "eval_steps_per_second": 0.427, "eval_wer": 0.2229864369737096, "step": 31752 }, { "epoch": 441.11, "learning_rate": 4.862857142857143e-06, "loss": 0.2465, "step": 31760 }, { "epoch": 441.25, "learning_rate": 4.851428571428572e-06, "loss": 0.2406, "step": 31770 }, { "epoch": 441.39, "learning_rate": 4.84e-06, "loss": 0.2374, "step": 31780 }, { "epoch": 441.53, "learning_rate": 4.8285714285714295e-06, "loss": 0.2389, "step": 31790 }, { "epoch": 441.66, "learning_rate": 4.817142857142857e-06, "loss": 0.2377, "step": 31800 }, { "epoch": 441.8, "learning_rate": 4.805714285714286e-06, "loss": 0.2462, "step": 31810 }, { "epoch": 441.94, "learning_rate": 4.794285714285715e-06, "loss": 0.2512, "step": 31820 }, { "epoch": 442.0, "eval_loss": 0.6975857615470886, "eval_runtime": 157.8169, "eval_samples_per_second": 3.371, "eval_steps_per_second": 0.425, "eval_wer": 0.2262647039917722, "step": 31824 }, { "epoch": 442.08, "learning_rate": 4.782857142857143e-06, "loss": 0.2451, "step": 31830 }, { "epoch": 442.22, "learning_rate": 4.771428571428572e-06, "loss": 0.2401, "step": 31840 }, { "epoch": 442.36, "learning_rate": 4.76e-06, "loss": 0.2309, "step": 31850 }, { "epoch": 442.5, "learning_rate": 4.7485714285714295e-06, "loss": 0.2374, "step": 31860 }, { "epoch": 442.64, "learning_rate": 4.737142857142857e-06, "loss": 0.2367, "step": 31870 }, { "epoch": 442.78, "learning_rate": 4.725714285714286e-06, "loss": 0.2473, "step": 31880 }, { "epoch": 442.91, "learning_rate": 4.714285714285715e-06, "loss": 0.25, "step": 31890 }, { "epoch": 443.0, "eval_loss": 0.6889477372169495, "eval_runtime": 156.6752, "eval_samples_per_second": 3.396, "eval_steps_per_second": 0.428, "eval_wer": 0.22324355595551842, "step": 31896 }, { "epoch": 443.06, "learning_rate": 4.702857142857143e-06, "loss": 0.2432, "step": 31900 }, { "epoch": 443.19, "learning_rate": 4.691428571428572e-06, "loss": 0.2417, "step": 31910 }, { "epoch": 443.33, "learning_rate": 4.680000000000001e-06, "loss": 0.2228, "step": 31920 }, { "epoch": 443.47, "learning_rate": 4.668571428571429e-06, "loss": 0.249, "step": 31930 }, { "epoch": 443.61, "learning_rate": 4.657142857142857e-06, "loss": 0.2304, "step": 31940 }, { "epoch": 443.75, "learning_rate": 4.645714285714286e-06, "loss": 0.2348, "step": 31950 }, { "epoch": 443.89, "learning_rate": 4.634285714285715e-06, "loss": 0.2341, "step": 31960 }, { "epoch": 444.0, "eval_loss": 0.6840574145317078, "eval_runtime": 156.9765, "eval_samples_per_second": 3.389, "eval_steps_per_second": 0.427, "eval_wer": 0.22658610271903323, "step": 31968 }, { "epoch": 444.03, "learning_rate": 4.622857142857143e-06, "loss": 0.2571, "step": 31970 }, { "epoch": 444.17, "learning_rate": 4.6114285714285716e-06, "loss": 0.2452, "step": 31980 }, { "epoch": 444.3, "learning_rate": 4.600000000000001e-06, "loss": 0.2508, "step": 31990 }, { "epoch": 444.44, "learning_rate": 4.588571428571429e-06, "loss": 0.2375, "step": 32000 }, { "epoch": 444.58, "learning_rate": 4.577142857142858e-06, "loss": 0.2291, "step": 32010 }, { "epoch": 444.72, "learning_rate": 4.565714285714286e-06, "loss": 0.2496, "step": 32020 }, { "epoch": 444.86, "learning_rate": 4.554285714285715e-06, "loss": 0.2289, "step": 32030 }, { "epoch": 445.0, "learning_rate": 4.542857142857143e-06, "loss": 0.252, "step": 32040 }, { "epoch": 445.0, "eval_loss": 0.6980647444725037, "eval_runtime": 157.0447, "eval_samples_per_second": 3.388, "eval_steps_per_second": 0.427, "eval_wer": 0.22491482933727583, "step": 32040 }, { "epoch": 445.14, "learning_rate": 4.5314285714285715e-06, "loss": 0.2483, "step": 32050 }, { "epoch": 445.28, "learning_rate": 4.520000000000001e-06, "loss": 0.24, "step": 32060 }, { "epoch": 445.42, "learning_rate": 4.508571428571429e-06, "loss": 0.2349, "step": 32070 }, { "epoch": 445.55, "learning_rate": 4.497142857142858e-06, "loss": 0.2352, "step": 32080 }, { "epoch": 445.69, "learning_rate": 4.485714285714286e-06, "loss": 0.2486, "step": 32090 }, { "epoch": 445.83, "learning_rate": 4.4742857142857145e-06, "loss": 0.231, "step": 32100 }, { "epoch": 445.97, "learning_rate": 4.462857142857143e-06, "loss": 0.2486, "step": 32110 }, { "epoch": 446.0, "eval_loss": 0.6958192586898804, "eval_runtime": 158.2493, "eval_samples_per_second": 3.362, "eval_steps_per_second": 0.423, "eval_wer": 0.22812881660988624, "step": 32112 }, { "epoch": 446.11, "learning_rate": 4.451428571428571e-06, "loss": 0.2414, "step": 32120 }, { "epoch": 446.25, "learning_rate": 4.440000000000001e-06, "loss": 0.2436, "step": 32130 }, { "epoch": 446.39, "learning_rate": 4.428571428571429e-06, "loss": 0.241, "step": 32140 }, { "epoch": 446.53, "learning_rate": 4.4171428571428576e-06, "loss": 0.2456, "step": 32150 }, { "epoch": 446.66, "learning_rate": 4.405714285714286e-06, "loss": 0.2412, "step": 32160 }, { "epoch": 446.8, "learning_rate": 4.3942857142857144e-06, "loss": 0.2371, "step": 32170 }, { "epoch": 446.94, "learning_rate": 4.382857142857143e-06, "loss": 0.2402, "step": 32180 }, { "epoch": 447.0, "eval_loss": 0.6826456189155579, "eval_runtime": 129.4539, "eval_samples_per_second": 4.11, "eval_steps_per_second": 0.518, "eval_wer": 0.22491482933727583, "step": 32184 }, { "epoch": 447.08, "learning_rate": 4.371428571428572e-06, "loss": 0.2442, "step": 32190 }, { "epoch": 447.22, "learning_rate": 4.360000000000001e-06, "loss": 0.2369, "step": 32200 }, { "epoch": 447.36, "learning_rate": 4.348571428571429e-06, "loss": 0.2318, "step": 32210 }, { "epoch": 447.5, "learning_rate": 4.3371428571428575e-06, "loss": 0.2364, "step": 32220 }, { "epoch": 447.64, "learning_rate": 4.325714285714286e-06, "loss": 0.2303, "step": 32230 }, { "epoch": 447.78, "learning_rate": 4.314285714285714e-06, "loss": 0.2378, "step": 32240 }, { "epoch": 447.91, "learning_rate": 4.302857142857143e-06, "loss": 0.2477, "step": 32250 }, { "epoch": 448.0, "eval_loss": 0.686671257019043, "eval_runtime": 129.3046, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2247219901009192, "step": 32256 }, { "epoch": 448.06, "learning_rate": 4.291428571428572e-06, "loss": 0.2435, "step": 32260 }, { "epoch": 448.19, "learning_rate": 4.2800000000000005e-06, "loss": 0.2444, "step": 32270 }, { "epoch": 448.33, "learning_rate": 4.268571428571429e-06, "loss": 0.2347, "step": 32280 }, { "epoch": 448.47, "learning_rate": 4.257142857142857e-06, "loss": 0.2443, "step": 32290 }, { "epoch": 448.61, "learning_rate": 4.245714285714286e-06, "loss": 0.2313, "step": 32300 }, { "epoch": 448.75, "learning_rate": 4.234285714285714e-06, "loss": 0.2304, "step": 32310 }, { "epoch": 448.89, "learning_rate": 4.222857142857143e-06, "loss": 0.2304, "step": 32320 }, { "epoch": 449.0, "eval_loss": 0.7022036910057068, "eval_runtime": 129.7669, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.22427203188275374, "step": 32328 }, { "epoch": 449.03, "learning_rate": 4.211428571428572e-06, "loss": 0.2453, "step": 32330 }, { "epoch": 449.17, "learning_rate": 4.2000000000000004e-06, "loss": 0.2402, "step": 32340 }, { "epoch": 449.3, "learning_rate": 4.188571428571429e-06, "loss": 0.2349, "step": 32350 }, { "epoch": 449.44, "learning_rate": 4.177142857142857e-06, "loss": 0.2298, "step": 32360 }, { "epoch": 449.58, "learning_rate": 4.165714285714287e-06, "loss": 0.2338, "step": 32370 }, { "epoch": 449.72, "learning_rate": 4.154285714285714e-06, "loss": 0.2453, "step": 32380 }, { "epoch": 449.86, "learning_rate": 4.1428571428571435e-06, "loss": 0.237, "step": 32390 }, { "epoch": 450.0, "learning_rate": 4.131428571428572e-06, "loss": 0.2376, "step": 32400 }, { "epoch": 450.0, "eval_loss": 0.6948400735855103, "eval_runtime": 131.0358, "eval_samples_per_second": 4.06, "eval_steps_per_second": 0.511, "eval_wer": 0.22221508002828308, "step": 32400 }, { "epoch": 450.14, "learning_rate": 4.12e-06, "loss": 0.241, "step": 32410 }, { "epoch": 450.28, "learning_rate": 4.108571428571429e-06, "loss": 0.2358, "step": 32420 }, { "epoch": 450.42, "learning_rate": 4.097142857142857e-06, "loss": 0.238, "step": 32430 }, { "epoch": 450.55, "learning_rate": 4.0857142857142865e-06, "loss": 0.2373, "step": 32440 }, { "epoch": 450.69, "learning_rate": 4.074285714285714e-06, "loss": 0.2428, "step": 32450 }, { "epoch": 450.83, "learning_rate": 4.062857142857143e-06, "loss": 0.2398, "step": 32460 }, { "epoch": 450.97, "learning_rate": 4.051428571428572e-06, "loss": 0.2388, "step": 32470 }, { "epoch": 451.0, "eval_loss": 0.6771290302276611, "eval_runtime": 129.5354, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22208652053737868, "step": 32472 }, { "epoch": 451.11, "learning_rate": 4.04e-06, "loss": 0.2413, "step": 32480 }, { "epoch": 451.25, "learning_rate": 4.028571428571429e-06, "loss": 0.2371, "step": 32490 }, { "epoch": 451.39, "learning_rate": 4.017142857142857e-06, "loss": 0.2327, "step": 32500 }, { "epoch": 451.53, "learning_rate": 4.0057142857142864e-06, "loss": 0.2352, "step": 32510 }, { "epoch": 451.66, "learning_rate": 3.994285714285714e-06, "loss": 0.2328, "step": 32520 }, { "epoch": 451.8, "learning_rate": 3.982857142857143e-06, "loss": 0.2322, "step": 32530 }, { "epoch": 451.94, "learning_rate": 3.971428571428572e-06, "loss": 0.2544, "step": 32540 }, { "epoch": 452.0, "eval_loss": 0.6840674877166748, "eval_runtime": 130.564, "eval_samples_per_second": 4.075, "eval_steps_per_second": 0.513, "eval_wer": 0.22485054959182363, "step": 32544 }, { "epoch": 452.08, "learning_rate": 3.96e-06, "loss": 0.2459, "step": 32550 }, { "epoch": 452.22, "learning_rate": 3.948571428571429e-06, "loss": 0.2464, "step": 32560 }, { "epoch": 452.36, "learning_rate": 3.937142857142858e-06, "loss": 0.2288, "step": 32570 }, { "epoch": 452.5, "learning_rate": 3.925714285714286e-06, "loss": 0.2386, "step": 32580 }, { "epoch": 452.64, "learning_rate": 3.914285714285714e-06, "loss": 0.2415, "step": 32590 }, { "epoch": 452.78, "learning_rate": 3.902857142857143e-06, "loss": 0.2221, "step": 32600 }, { "epoch": 452.91, "learning_rate": 3.891428571428572e-06, "loss": 0.2428, "step": 32610 }, { "epoch": 453.0, "eval_loss": 0.6885955929756165, "eval_runtime": 129.5434, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22195796104647425, "step": 32616 }, { "epoch": 453.06, "learning_rate": 3.88e-06, "loss": 0.2355, "step": 32620 }, { "epoch": 453.19, "learning_rate": 3.8685714285714286e-06, "loss": 0.2443, "step": 32630 }, { "epoch": 453.33, "learning_rate": 3.857142857142858e-06, "loss": 0.2397, "step": 32640 }, { "epoch": 453.47, "learning_rate": 3.845714285714286e-06, "loss": 0.24, "step": 32650 }, { "epoch": 453.61, "learning_rate": 3.834285714285715e-06, "loss": 0.2207, "step": 32660 }, { "epoch": 453.75, "learning_rate": 3.822857142857143e-06, "loss": 0.2402, "step": 32670 }, { "epoch": 453.89, "learning_rate": 3.8114285714285716e-06, "loss": 0.2438, "step": 32680 }, { "epoch": 454.0, "eval_loss": 0.6903324127197266, "eval_runtime": 129.3285, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.2214437230828566, "step": 32688 }, { "epoch": 454.03, "learning_rate": 3.8000000000000005e-06, "loss": 0.2363, "step": 32690 }, { "epoch": 454.17, "learning_rate": 3.7885714285714285e-06, "loss": 0.226, "step": 32700 }, { "epoch": 454.3, "learning_rate": 3.7771428571428578e-06, "loss": 0.2257, "step": 32710 }, { "epoch": 454.44, "learning_rate": 3.7657142857142858e-06, "loss": 0.2308, "step": 32720 }, { "epoch": 454.58, "learning_rate": 3.7542857142857146e-06, "loss": 0.2328, "step": 32730 }, { "epoch": 454.72, "learning_rate": 3.742857142857143e-06, "loss": 0.2402, "step": 32740 }, { "epoch": 454.86, "learning_rate": 3.731428571428572e-06, "loss": 0.2295, "step": 32750 }, { "epoch": 455.0, "learning_rate": 3.7200000000000004e-06, "loss": 0.2463, "step": 32760 }, { "epoch": 455.0, "eval_loss": 0.6781482100486755, "eval_runtime": 129.254, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.22189368130102205, "step": 32760 }, { "epoch": 455.14, "learning_rate": 3.7085714285714284e-06, "loss": 0.2305, "step": 32770 }, { "epoch": 455.28, "learning_rate": 3.6971428571428577e-06, "loss": 0.2303, "step": 32780 }, { "epoch": 455.42, "learning_rate": 3.6857142857142857e-06, "loss": 0.235, "step": 32790 }, { "epoch": 455.55, "learning_rate": 3.6742857142857146e-06, "loss": 0.2329, "step": 32800 }, { "epoch": 455.69, "learning_rate": 3.662857142857143e-06, "loss": 0.2331, "step": 32810 }, { "epoch": 455.83, "learning_rate": 3.651428571428572e-06, "loss": 0.2371, "step": 32820 }, { "epoch": 455.97, "learning_rate": 3.6400000000000003e-06, "loss": 0.2355, "step": 32830 }, { "epoch": 456.0, "eval_loss": 0.6783885359764099, "eval_runtime": 129.5364, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.2197724497010992, "step": 32832 }, { "epoch": 456.11, "learning_rate": 3.628571428571429e-06, "loss": 0.2355, "step": 32840 }, { "epoch": 456.25, "learning_rate": 3.6171428571428576e-06, "loss": 0.2331, "step": 32850 }, { "epoch": 456.39, "learning_rate": 3.6057142857142865e-06, "loss": 0.2335, "step": 32860 }, { "epoch": 456.53, "learning_rate": 3.5942857142857145e-06, "loss": 0.235, "step": 32870 }, { "epoch": 456.66, "learning_rate": 3.582857142857143e-06, "loss": 0.2327, "step": 32880 }, { "epoch": 456.8, "learning_rate": 3.5714285714285718e-06, "loss": 0.2269, "step": 32890 }, { "epoch": 456.94, "learning_rate": 3.5600000000000002e-06, "loss": 0.237, "step": 32900 }, { "epoch": 457.0, "eval_loss": 0.6848962903022766, "eval_runtime": 129.3531, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.223114996464614, "step": 32904 }, { "epoch": 457.08, "learning_rate": 3.548571428571429e-06, "loss": 0.2322, "step": 32910 }, { "epoch": 457.22, "learning_rate": 3.5371428571428575e-06, "loss": 0.2315, "step": 32920 }, { "epoch": 457.36, "learning_rate": 3.5257142857142864e-06, "loss": 0.2234, "step": 32930 }, { "epoch": 457.5, "learning_rate": 3.5142857142857144e-06, "loss": 0.2351, "step": 32940 }, { "epoch": 457.64, "learning_rate": 3.5028571428571433e-06, "loss": 0.2311, "step": 32950 }, { "epoch": 457.78, "learning_rate": 3.4914285714285717e-06, "loss": 0.2452, "step": 32960 }, { "epoch": 457.91, "learning_rate": 3.48e-06, "loss": 0.2381, "step": 32970 }, { "epoch": 458.0, "eval_loss": 0.6892480850219727, "eval_runtime": 129.314, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.22195796104647425, "step": 32976 }, { "epoch": 458.06, "learning_rate": 3.468571428571429e-06, "loss": 0.2403, "step": 32980 }, { "epoch": 458.19, "learning_rate": 3.4571428571428574e-06, "loss": 0.238, "step": 32990 }, { "epoch": 458.33, "learning_rate": 3.4457142857142863e-06, "loss": 0.2332, "step": 33000 }, { "epoch": 458.47, "learning_rate": 3.4342857142857143e-06, "loss": 0.241, "step": 33010 }, { "epoch": 458.61, "learning_rate": 3.422857142857143e-06, "loss": 0.2341, "step": 33020 }, { "epoch": 458.75, "learning_rate": 3.4114285714285716e-06, "loss": 0.2341, "step": 33030 }, { "epoch": 458.89, "learning_rate": 3.4000000000000005e-06, "loss": 0.23, "step": 33040 }, { "epoch": 459.0, "eval_loss": 0.6781776547431946, "eval_runtime": 129.9722, "eval_samples_per_second": 4.093, "eval_steps_per_second": 0.515, "eval_wer": 0.2206723661374301, "step": 33048 }, { "epoch": 459.03, "learning_rate": 3.388571428571429e-06, "loss": 0.2369, "step": 33050 }, { "epoch": 459.17, "learning_rate": 3.3771428571428574e-06, "loss": 0.2424, "step": 33060 }, { "epoch": 459.3, "learning_rate": 3.3657142857142862e-06, "loss": 0.2284, "step": 33070 }, { "epoch": 459.44, "learning_rate": 3.3542857142857142e-06, "loss": 0.24, "step": 33080 }, { "epoch": 459.58, "learning_rate": 3.342857142857143e-06, "loss": 0.2322, "step": 33090 }, { "epoch": 459.72, "learning_rate": 3.3314285714285715e-06, "loss": 0.2359, "step": 33100 }, { "epoch": 459.86, "learning_rate": 3.3200000000000004e-06, "loss": 0.2309, "step": 33110 }, { "epoch": 460.0, "learning_rate": 3.308571428571429e-06, "loss": 0.2359, "step": 33120 }, { "epoch": 460.0, "eval_loss": 0.6788826584815979, "eval_runtime": 129.3997, "eval_samples_per_second": 4.111, "eval_steps_per_second": 0.518, "eval_wer": 0.22375779391913608, "step": 33120 }, { "epoch": 460.14, "learning_rate": 3.2971428571428577e-06, "loss": 0.2341, "step": 33130 }, { "epoch": 460.28, "learning_rate": 3.285714285714286e-06, "loss": 0.2355, "step": 33140 }, { "epoch": 460.42, "learning_rate": 3.274285714285714e-06, "loss": 0.244, "step": 33150 }, { "epoch": 460.55, "learning_rate": 3.262857142857143e-06, "loss": 0.2331, "step": 33160 }, { "epoch": 460.69, "learning_rate": 3.2514285714285715e-06, "loss": 0.2252, "step": 33170 }, { "epoch": 460.83, "learning_rate": 3.2400000000000003e-06, "loss": 0.2325, "step": 33180 }, { "epoch": 460.97, "learning_rate": 3.2285714285714288e-06, "loss": 0.2382, "step": 33190 }, { "epoch": 461.0, "eval_loss": 0.6829156279563904, "eval_runtime": 129.7457, "eval_samples_per_second": 4.1, "eval_steps_per_second": 0.516, "eval_wer": 0.22362923442823165, "step": 33192 }, { "epoch": 461.11, "learning_rate": 3.2171428571428576e-06, "loss": 0.2321, "step": 33200 }, { "epoch": 461.25, "learning_rate": 3.205714285714286e-06, "loss": 0.2278, "step": 33210 }, { "epoch": 461.39, "learning_rate": 3.194285714285715e-06, "loss": 0.2363, "step": 33220 }, { "epoch": 461.53, "learning_rate": 3.182857142857143e-06, "loss": 0.2339, "step": 33230 }, { "epoch": 461.66, "learning_rate": 3.1714285714285714e-06, "loss": 0.2487, "step": 33240 }, { "epoch": 461.8, "learning_rate": 3.1600000000000002e-06, "loss": 0.2343, "step": 33250 }, { "epoch": 461.94, "learning_rate": 3.1485714285714287e-06, "loss": 0.2438, "step": 33260 }, { "epoch": 462.0, "eval_loss": 0.6927677989006042, "eval_runtime": 129.3067, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.22362923442823165, "step": 33264 }, { "epoch": 462.08, "learning_rate": 3.1371428571428575e-06, "loss": 0.2349, "step": 33270 }, { "epoch": 462.22, "learning_rate": 3.125714285714286e-06, "loss": 0.2291, "step": 33280 }, { "epoch": 462.36, "learning_rate": 3.114285714285715e-06, "loss": 0.2323, "step": 33290 }, { "epoch": 462.5, "learning_rate": 3.102857142857143e-06, "loss": 0.2353, "step": 33300 }, { "epoch": 462.64, "learning_rate": 3.0914285714285717e-06, "loss": 0.2308, "step": 33310 }, { "epoch": 462.78, "learning_rate": 3.08e-06, "loss": 0.243, "step": 33320 }, { "epoch": 462.91, "learning_rate": 3.068571428571429e-06, "loss": 0.233, "step": 33330 }, { "epoch": 463.0, "eval_loss": 0.6859675049781799, "eval_runtime": 129.5277, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22157228257376102, "step": 33336 }, { "epoch": 463.06, "learning_rate": 3.0571428571428575e-06, "loss": 0.2361, "step": 33340 }, { "epoch": 463.19, "learning_rate": 3.045714285714286e-06, "loss": 0.2428, "step": 33350 }, { "epoch": 463.33, "learning_rate": 3.0342857142857148e-06, "loss": 0.2261, "step": 33360 }, { "epoch": 463.47, "learning_rate": 3.0228571428571428e-06, "loss": 0.2254, "step": 33370 }, { "epoch": 463.61, "learning_rate": 3.0114285714285716e-06, "loss": 0.2214, "step": 33380 }, { "epoch": 463.75, "learning_rate": 3e-06, "loss": 0.2335, "step": 33390 }, { "epoch": 463.89, "learning_rate": 2.988571428571429e-06, "loss": 0.2358, "step": 33400 }, { "epoch": 464.0, "eval_loss": 0.6856800317764282, "eval_runtime": 129.895, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.22362923442823165, "step": 33408 }, { "epoch": 464.03, "learning_rate": 2.9771428571428574e-06, "loss": 0.2291, "step": 33410 }, { "epoch": 464.17, "learning_rate": 2.9657142857142862e-06, "loss": 0.2416, "step": 33420 }, { "epoch": 464.3, "learning_rate": 2.9542857142857147e-06, "loss": 0.2414, "step": 33430 }, { "epoch": 464.44, "learning_rate": 2.9428571428571427e-06, "loss": 0.2339, "step": 33440 }, { "epoch": 464.58, "learning_rate": 2.9314285714285716e-06, "loss": 0.2267, "step": 33450 }, { "epoch": 464.72, "learning_rate": 2.92e-06, "loss": 0.2339, "step": 33460 }, { "epoch": 464.86, "learning_rate": 2.908571428571429e-06, "loss": 0.2279, "step": 33470 }, { "epoch": 465.0, "learning_rate": 2.8971428571428573e-06, "loss": 0.2226, "step": 33480 }, { "epoch": 465.0, "eval_loss": 0.6818052530288696, "eval_runtime": 129.3205, "eval_samples_per_second": 4.114, "eval_steps_per_second": 0.518, "eval_wer": 0.22015812817381245, "step": 33480 }, { "epoch": 465.14, "learning_rate": 2.8868571428571427e-06, "loss": 0.2278, "step": 33490 }, { "epoch": 465.28, "learning_rate": 2.8754285714285716e-06, "loss": 0.2321, "step": 33500 }, { "epoch": 465.42, "learning_rate": 2.864e-06, "loss": 0.2288, "step": 33510 }, { "epoch": 465.55, "learning_rate": 2.852571428571429e-06, "loss": 0.2284, "step": 33520 }, { "epoch": 465.69, "learning_rate": 2.8411428571428573e-06, "loss": 0.2389, "step": 33530 }, { "epoch": 465.83, "learning_rate": 2.829714285714286e-06, "loss": 0.2339, "step": 33540 }, { "epoch": 465.97, "learning_rate": 2.8182857142857146e-06, "loss": 0.2478, "step": 33550 }, { "epoch": 466.0, "eval_loss": 0.6801430583000183, "eval_runtime": 128.9417, "eval_samples_per_second": 4.126, "eval_steps_per_second": 0.52, "eval_wer": 0.22221508002828308, "step": 33552 }, { "epoch": 466.11, "learning_rate": 2.8068571428571426e-06, "loss": 0.237, "step": 33560 }, { "epoch": 466.25, "learning_rate": 2.7954285714285715e-06, "loss": 0.2438, "step": 33570 }, { "epoch": 466.39, "learning_rate": 2.784e-06, "loss": 0.2254, "step": 33580 }, { "epoch": 466.53, "learning_rate": 2.772571428571429e-06, "loss": 0.234, "step": 33590 }, { "epoch": 466.66, "learning_rate": 2.7611428571428572e-06, "loss": 0.236, "step": 33600 }, { "epoch": 466.8, "learning_rate": 2.749714285714286e-06, "loss": 0.2204, "step": 33610 }, { "epoch": 466.94, "learning_rate": 2.7382857142857145e-06, "loss": 0.2274, "step": 33620 }, { "epoch": 467.0, "eval_loss": 0.6797326803207397, "eval_runtime": 129.8192, "eval_samples_per_second": 4.098, "eval_steps_per_second": 0.516, "eval_wer": 0.22028668766471685, "step": 33624 }, { "epoch": 467.08, "learning_rate": 2.7268571428571434e-06, "loss": 0.231, "step": 33630 }, { "epoch": 467.22, "learning_rate": 2.715428571428572e-06, "loss": 0.235, "step": 33640 }, { "epoch": 467.36, "learning_rate": 2.704e-06, "loss": 0.2176, "step": 33650 }, { "epoch": 467.5, "learning_rate": 2.6925714285714287e-06, "loss": 0.2317, "step": 33660 }, { "epoch": 467.64, "learning_rate": 2.681142857142857e-06, "loss": 0.2263, "step": 33670 }, { "epoch": 467.78, "learning_rate": 2.669714285714286e-06, "loss": 0.2374, "step": 33680 }, { "epoch": 467.91, "learning_rate": 2.6582857142857145e-06, "loss": 0.2339, "step": 33690 }, { "epoch": 468.0, "eval_loss": 0.6914926171302795, "eval_runtime": 129.0987, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.2224079192646397, "step": 33696 }, { "epoch": 468.06, "learning_rate": 2.6468571428571433e-06, "loss": 0.2389, "step": 33700 }, { "epoch": 468.19, "learning_rate": 2.6354285714285718e-06, "loss": 0.2379, "step": 33710 }, { "epoch": 468.33, "learning_rate": 2.6240000000000006e-06, "loss": 0.2328, "step": 33720 }, { "epoch": 468.47, "learning_rate": 2.6125714285714286e-06, "loss": 0.2399, "step": 33730 }, { "epoch": 468.61, "learning_rate": 2.601142857142857e-06, "loss": 0.2306, "step": 33740 }, { "epoch": 468.75, "learning_rate": 2.589714285714286e-06, "loss": 0.2268, "step": 33750 }, { "epoch": 468.89, "learning_rate": 2.5782857142857144e-06, "loss": 0.2259, "step": 33760 }, { "epoch": 469.0, "eval_loss": 0.6919407844543457, "eval_runtime": 129.6051, "eval_samples_per_second": 4.105, "eval_steps_per_second": 0.517, "eval_wer": 0.22202224079192645, "step": 33768 }, { "epoch": 469.03, "learning_rate": 2.5668571428571432e-06, "loss": 0.2325, "step": 33770 }, { "epoch": 469.17, "learning_rate": 2.5554285714285717e-06, "loss": 0.2373, "step": 33780 }, { "epoch": 469.3, "learning_rate": 2.5440000000000005e-06, "loss": 0.229, "step": 33790 }, { "epoch": 469.44, "learning_rate": 2.5325714285714286e-06, "loss": 0.231, "step": 33800 }, { "epoch": 469.58, "learning_rate": 2.5211428571428574e-06, "loss": 0.2254, "step": 33810 }, { "epoch": 469.72, "learning_rate": 2.509714285714286e-06, "loss": 0.241, "step": 33820 }, { "epoch": 469.86, "learning_rate": 2.4982857142857143e-06, "loss": 0.2292, "step": 33830 }, { "epoch": 470.0, "learning_rate": 2.486857142857143e-06, "loss": 0.2327, "step": 33840 }, { "epoch": 470.0, "eval_loss": 0.6877278685569763, "eval_runtime": 129.1466, "eval_samples_per_second": 4.119, "eval_steps_per_second": 0.519, "eval_wer": 0.22253647875554414, "step": 33840 }, { "epoch": 470.14, "learning_rate": 2.4754285714285716e-06, "loss": 0.2448, "step": 33850 }, { "epoch": 470.28, "learning_rate": 2.4640000000000005e-06, "loss": 0.2284, "step": 33860 }, { "epoch": 470.42, "learning_rate": 2.452571428571429e-06, "loss": 0.2358, "step": 33870 }, { "epoch": 470.55, "learning_rate": 2.4411428571428573e-06, "loss": 0.2308, "step": 33880 }, { "epoch": 470.69, "learning_rate": 2.4297142857142858e-06, "loss": 0.2301, "step": 33890 }, { "epoch": 470.83, "learning_rate": 2.4182857142857142e-06, "loss": 0.228, "step": 33900 }, { "epoch": 470.97, "learning_rate": 2.406857142857143e-06, "loss": 0.2341, "step": 33910 }, { "epoch": 471.0, "eval_loss": 0.689193844795227, "eval_runtime": 129.7264, "eval_samples_per_second": 4.101, "eval_steps_per_second": 0.516, "eval_wer": 0.22350067493732725, "step": 33912 }, { "epoch": 471.11, "learning_rate": 2.3954285714285715e-06, "loss": 0.2277, "step": 33920 }, { "epoch": 471.25, "learning_rate": 2.3840000000000004e-06, "loss": 0.2314, "step": 33930 }, { "epoch": 471.39, "learning_rate": 2.372571428571429e-06, "loss": 0.2334, "step": 33940 }, { "epoch": 471.53, "learning_rate": 2.3611428571428573e-06, "loss": 0.2363, "step": 33950 }, { "epoch": 471.66, "learning_rate": 2.349714285714286e-06, "loss": 0.2296, "step": 33960 }, { "epoch": 471.8, "learning_rate": 2.3382857142857146e-06, "loss": 0.2278, "step": 33970 }, { "epoch": 471.94, "learning_rate": 2.326857142857143e-06, "loss": 0.2502, "step": 33980 }, { "epoch": 472.0, "eval_loss": 0.6900443434715271, "eval_runtime": 131.1266, "eval_samples_per_second": 4.057, "eval_steps_per_second": 0.511, "eval_wer": 0.22272931799190074, "step": 33984 }, { "epoch": 472.08, "learning_rate": 2.3154285714285714e-06, "loss": 0.2396, "step": 33990 }, { "epoch": 472.22, "learning_rate": 2.3040000000000003e-06, "loss": 0.245, "step": 34000 }, { "epoch": 472.36, "learning_rate": 2.2925714285714287e-06, "loss": 0.2324, "step": 34010 }, { "epoch": 472.5, "learning_rate": 2.281142857142857e-06, "loss": 0.2296, "step": 34020 }, { "epoch": 472.64, "learning_rate": 2.269714285714286e-06, "loss": 0.2274, "step": 34030 }, { "epoch": 472.78, "learning_rate": 2.2582857142857145e-06, "loss": 0.246, "step": 34040 }, { "epoch": 472.91, "learning_rate": 2.246857142857143e-06, "loss": 0.234, "step": 34050 }, { "epoch": 473.0, "eval_loss": 0.6838749647140503, "eval_runtime": 129.2089, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.519, "eval_wer": 0.22420775213730154, "step": 34056 }, { "epoch": 473.06, "learning_rate": 2.2354285714285718e-06, "loss": 0.2314, "step": 34060 }, { "epoch": 473.19, "learning_rate": 2.2240000000000002e-06, "loss": 0.2389, "step": 34070 }, { "epoch": 473.33, "learning_rate": 2.2125714285714287e-06, "loss": 0.2246, "step": 34080 }, { "epoch": 473.47, "learning_rate": 2.201142857142857e-06, "loss": 0.2315, "step": 34090 }, { "epoch": 473.61, "learning_rate": 2.189714285714286e-06, "loss": 0.2371, "step": 34100 }, { "epoch": 473.75, "learning_rate": 2.1782857142857144e-06, "loss": 0.2279, "step": 34110 }, { "epoch": 473.89, "learning_rate": 2.166857142857143e-06, "loss": 0.2289, "step": 34120 }, { "epoch": 474.0, "eval_loss": 0.688453733921051, "eval_runtime": 129.5501, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22427203188275374, "step": 34128 }, { "epoch": 474.03, "learning_rate": 2.1554285714285717e-06, "loss": 0.2395, "step": 34130 }, { "epoch": 474.17, "learning_rate": 2.144e-06, "loss": 0.2383, "step": 34140 }, { "epoch": 474.3, "learning_rate": 2.132571428571429e-06, "loss": 0.2268, "step": 34150 }, { "epoch": 474.44, "learning_rate": 2.1211428571428574e-06, "loss": 0.2305, "step": 34160 }, { "epoch": 474.58, "learning_rate": 2.109714285714286e-06, "loss": 0.2134, "step": 34170 }, { "epoch": 474.72, "learning_rate": 2.0982857142857143e-06, "loss": 0.2349, "step": 34180 }, { "epoch": 474.86, "learning_rate": 2.086857142857143e-06, "loss": 0.2282, "step": 34190 }, { "epoch": 475.0, "learning_rate": 2.0754285714285716e-06, "loss": 0.2311, "step": 34200 }, { "epoch": 475.0, "eval_loss": 0.6911332011222839, "eval_runtime": 129.8903, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.223114996464614, "step": 34200 }, { "epoch": 475.14, "learning_rate": 2.064e-06, "loss": 0.2368, "step": 34210 }, { "epoch": 475.28, "learning_rate": 2.052571428571429e-06, "loss": 0.2262, "step": 34220 }, { "epoch": 475.42, "learning_rate": 2.0411428571428574e-06, "loss": 0.2275, "step": 34230 }, { "epoch": 475.55, "learning_rate": 2.029714285714286e-06, "loss": 0.2244, "step": 34240 }, { "epoch": 475.69, "learning_rate": 2.0182857142857147e-06, "loss": 0.2383, "step": 34250 }, { "epoch": 475.83, "learning_rate": 2.006857142857143e-06, "loss": 0.2241, "step": 34260 }, { "epoch": 475.97, "learning_rate": 1.9954285714285715e-06, "loss": 0.2374, "step": 34270 }, { "epoch": 476.0, "eval_loss": 0.6833502650260925, "eval_runtime": 129.5339, "eval_samples_per_second": 4.107, "eval_steps_per_second": 0.517, "eval_wer": 0.22337211544642283, "step": 34272 }, { "epoch": 476.11, "learning_rate": 1.984e-06, "loss": 0.2403, "step": 34280 }, { "epoch": 476.25, "learning_rate": 1.972571428571429e-06, "loss": 0.2253, "step": 34290 }, { "epoch": 476.39, "learning_rate": 1.9611428571428573e-06, "loss": 0.2277, "step": 34300 }, { "epoch": 476.53, "learning_rate": 1.9497142857142857e-06, "loss": 0.2326, "step": 34310 }, { "epoch": 476.66, "learning_rate": 1.9382857142857146e-06, "loss": 0.227, "step": 34320 }, { "epoch": 476.8, "learning_rate": 1.926857142857143e-06, "loss": 0.234, "step": 34330 }, { "epoch": 476.94, "learning_rate": 1.915428571428572e-06, "loss": 0.235, "step": 34340 }, { "epoch": 477.0, "eval_loss": 0.6789714694023132, "eval_runtime": 130.6375, "eval_samples_per_second": 4.072, "eval_steps_per_second": 0.513, "eval_wer": 0.2223436395191875, "step": 34344 }, { "epoch": 477.08, "learning_rate": 1.9040000000000003e-06, "loss": 0.2334, "step": 34350 }, { "epoch": 477.22, "learning_rate": 1.8925714285714285e-06, "loss": 0.2345, "step": 34360 }, { "epoch": 477.36, "learning_rate": 1.8811428571428572e-06, "loss": 0.218, "step": 34370 }, { "epoch": 477.5, "learning_rate": 1.8697142857142858e-06, "loss": 0.2315, "step": 34380 }, { "epoch": 477.64, "learning_rate": 1.8582857142857145e-06, "loss": 0.2413, "step": 34390 }, { "epoch": 477.78, "learning_rate": 1.846857142857143e-06, "loss": 0.23, "step": 34400 }, { "epoch": 477.91, "learning_rate": 1.8354285714285716e-06, "loss": 0.2292, "step": 34410 }, { "epoch": 478.0, "eval_loss": 0.685696005821228, "eval_runtime": 129.3584, "eval_samples_per_second": 4.113, "eval_steps_per_second": 0.518, "eval_wer": 0.22330783570097062, "step": 34416 }, { "epoch": 478.06, "learning_rate": 1.8240000000000002e-06, "loss": 0.2307, "step": 34420 }, { "epoch": 478.19, "learning_rate": 1.8125714285714289e-06, "loss": 0.2412, "step": 34430 }, { "epoch": 478.33, "learning_rate": 1.8011428571428573e-06, "loss": 0.2294, "step": 34440 }, { "epoch": 478.47, "learning_rate": 1.7897142857142858e-06, "loss": 0.2354, "step": 34450 }, { "epoch": 478.61, "learning_rate": 1.7782857142857144e-06, "loss": 0.2391, "step": 34460 }, { "epoch": 478.75, "learning_rate": 1.7668571428571429e-06, "loss": 0.2252, "step": 34470 }, { "epoch": 478.89, "learning_rate": 1.7554285714285715e-06, "loss": 0.2243, "step": 34480 }, { "epoch": 479.0, "eval_loss": 0.6737434267997742, "eval_runtime": 130.619, "eval_samples_per_second": 4.073, "eval_steps_per_second": 0.513, "eval_wer": 0.22427203188275374, "step": 34488 }, { "epoch": 479.03, "learning_rate": 1.7440000000000002e-06, "loss": 0.2377, "step": 34490 }, { "epoch": 479.17, "learning_rate": 1.7325714285714288e-06, "loss": 0.2418, "step": 34500 }, { "epoch": 479.3, "learning_rate": 1.7211428571428572e-06, "loss": 0.2254, "step": 34510 }, { "epoch": 479.44, "learning_rate": 1.709714285714286e-06, "loss": 0.2359, "step": 34520 }, { "epoch": 479.58, "learning_rate": 1.6982857142857145e-06, "loss": 0.2188, "step": 34530 }, { "epoch": 479.72, "learning_rate": 1.6868571428571428e-06, "loss": 0.2359, "step": 34540 }, { "epoch": 479.86, "learning_rate": 1.6754285714285714e-06, "loss": 0.2257, "step": 34550 }, { "epoch": 480.0, "learning_rate": 1.664e-06, "loss": 0.235, "step": 34560 }, { "epoch": 480.0, "eval_loss": 0.6831479072570801, "eval_runtime": 129.417, "eval_samples_per_second": 4.111, "eval_steps_per_second": 0.518, "eval_wer": 0.22215080028283088, "step": 34560 }, { "epoch": 480.14, "learning_rate": 1.6525714285714287e-06, "loss": 0.2363, "step": 34570 }, { "epoch": 480.28, "learning_rate": 1.6411428571428572e-06, "loss": 0.2322, "step": 34580 }, { "epoch": 480.42, "learning_rate": 1.6297142857142858e-06, "loss": 0.2409, "step": 34590 }, { "epoch": 480.55, "learning_rate": 1.6182857142857145e-06, "loss": 0.2252, "step": 34600 }, { "epoch": 480.69, "learning_rate": 1.6068571428571431e-06, "loss": 0.2422, "step": 34610 }, { "epoch": 480.83, "learning_rate": 1.5954285714285716e-06, "loss": 0.2223, "step": 34620 }, { "epoch": 480.97, "learning_rate": 1.5840000000000002e-06, "loss": 0.2337, "step": 34630 }, { "epoch": 481.0, "eval_loss": 0.6768653988838196, "eval_runtime": 129.7943, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.2206723661374301, "step": 34632 }, { "epoch": 481.11, "learning_rate": 1.5725714285714286e-06, "loss": 0.2369, "step": 34640 }, { "epoch": 481.25, "learning_rate": 1.561142857142857e-06, "loss": 0.2293, "step": 34650 }, { "epoch": 481.39, "learning_rate": 1.5497142857142857e-06, "loss": 0.2297, "step": 34660 }, { "epoch": 481.53, "learning_rate": 1.5382857142857144e-06, "loss": 0.2351, "step": 34670 }, { "epoch": 481.66, "learning_rate": 1.526857142857143e-06, "loss": 0.2383, "step": 34680 }, { "epoch": 481.8, "learning_rate": 1.5154285714285717e-06, "loss": 0.2304, "step": 34690 }, { "epoch": 481.94, "learning_rate": 1.5040000000000001e-06, "loss": 0.2258, "step": 34700 }, { "epoch": 482.0, "eval_loss": 0.6784033179283142, "eval_runtime": 129.5147, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.2231792762100662, "step": 34704 }, { "epoch": 482.08, "learning_rate": 1.4925714285714288e-06, "loss": 0.2262, "step": 34710 }, { "epoch": 482.22, "learning_rate": 1.4811428571428574e-06, "loss": 0.2374, "step": 34720 }, { "epoch": 482.36, "learning_rate": 1.4697142857142857e-06, "loss": 0.2193, "step": 34730 }, { "epoch": 482.5, "learning_rate": 1.4582857142857143e-06, "loss": 0.2276, "step": 34740 }, { "epoch": 482.64, "learning_rate": 1.446857142857143e-06, "loss": 0.2281, "step": 34750 }, { "epoch": 482.78, "learning_rate": 1.4354285714285716e-06, "loss": 0.226, "step": 34760 }, { "epoch": 482.91, "learning_rate": 1.424e-06, "loss": 0.2276, "step": 34770 }, { "epoch": 483.0, "eval_loss": 0.6917012333869934, "eval_runtime": 129.5158, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.22414347239184934, "step": 34776 }, { "epoch": 483.06, "learning_rate": 1.4125714285714287e-06, "loss": 0.2339, "step": 34780 }, { "epoch": 483.19, "learning_rate": 1.4011428571428573e-06, "loss": 0.2295, "step": 34790 }, { "epoch": 483.33, "learning_rate": 1.389714285714286e-06, "loss": 0.2333, "step": 34800 }, { "epoch": 483.47, "learning_rate": 1.3782857142857144e-06, "loss": 0.2343, "step": 34810 }, { "epoch": 483.61, "learning_rate": 1.366857142857143e-06, "loss": 0.2304, "step": 34820 }, { "epoch": 483.75, "learning_rate": 1.3554285714285715e-06, "loss": 0.2261, "step": 34830 }, { "epoch": 483.89, "learning_rate": 1.344e-06, "loss": 0.2379, "step": 34840 }, { "epoch": 484.0, "eval_loss": 0.6805532574653625, "eval_runtime": 129.1995, "eval_samples_per_second": 4.118, "eval_steps_per_second": 0.519, "eval_wer": 0.22510766857363246, "step": 34848 }, { "epoch": 484.03, "learning_rate": 1.3325714285714286e-06, "loss": 0.2192, "step": 34850 }, { "epoch": 484.17, "learning_rate": 1.3211428571428573e-06, "loss": 0.2267, "step": 34860 }, { "epoch": 484.3, "learning_rate": 1.309714285714286e-06, "loss": 0.2257, "step": 34870 }, { "epoch": 484.44, "learning_rate": 1.2982857142857144e-06, "loss": 0.2392, "step": 34880 }, { "epoch": 484.58, "learning_rate": 1.286857142857143e-06, "loss": 0.2307, "step": 34890 }, { "epoch": 484.72, "learning_rate": 1.2754285714285717e-06, "loss": 0.2383, "step": 34900 }, { "epoch": 484.86, "learning_rate": 1.2640000000000003e-06, "loss": 0.2368, "step": 34910 }, { "epoch": 485.0, "learning_rate": 1.2525714285714285e-06, "loss": 0.229, "step": 34920 }, { "epoch": 485.0, "eval_loss": 0.6859225034713745, "eval_runtime": 129.2507, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.2231792762100662, "step": 34920 }, { "epoch": 485.14, "learning_rate": 1.2411428571428572e-06, "loss": 0.232, "step": 34930 }, { "epoch": 485.28, "learning_rate": 1.2297142857142858e-06, "loss": 0.2237, "step": 34940 }, { "epoch": 485.42, "learning_rate": 1.2182857142857143e-06, "loss": 0.244, "step": 34950 }, { "epoch": 485.55, "learning_rate": 1.206857142857143e-06, "loss": 0.2229, "step": 34960 }, { "epoch": 485.69, "learning_rate": 1.1954285714285716e-06, "loss": 0.2337, "step": 34970 }, { "epoch": 485.83, "learning_rate": 1.1840000000000002e-06, "loss": 0.229, "step": 34980 }, { "epoch": 485.97, "learning_rate": 1.1725714285714287e-06, "loss": 0.2312, "step": 34990 }, { "epoch": 486.0, "eval_loss": 0.6850021481513977, "eval_runtime": 129.2072, "eval_samples_per_second": 4.117, "eval_steps_per_second": 0.519, "eval_wer": 0.22356495468277945, "step": 34992 }, { "epoch": 486.11, "learning_rate": 1.1611428571428573e-06, "loss": 0.2345, "step": 35000 }, { "epoch": 486.25, "learning_rate": 1.1497142857142858e-06, "loss": 0.234, "step": 35010 }, { "epoch": 486.39, "learning_rate": 1.1382857142857144e-06, "loss": 0.2247, "step": 35020 }, { "epoch": 486.53, "learning_rate": 1.126857142857143e-06, "loss": 0.2253, "step": 35030 }, { "epoch": 486.66, "learning_rate": 1.1154285714285715e-06, "loss": 0.241, "step": 35040 }, { "epoch": 486.8, "learning_rate": 1.1040000000000001e-06, "loss": 0.2241, "step": 35050 }, { "epoch": 486.94, "learning_rate": 1.0925714285714286e-06, "loss": 0.2412, "step": 35060 }, { "epoch": 487.0, "eval_loss": 0.6776268482208252, "eval_runtime": 129.6555, "eval_samples_per_second": 4.103, "eval_steps_per_second": 0.517, "eval_wer": 0.22208652053737868, "step": 35064 }, { "epoch": 487.08, "learning_rate": 1.0811428571428572e-06, "loss": 0.2366, "step": 35070 }, { "epoch": 487.22, "learning_rate": 1.0697142857142857e-06, "loss": 0.2277, "step": 35080 }, { "epoch": 487.36, "learning_rate": 1.0582857142857143e-06, "loss": 0.2322, "step": 35090 }, { "epoch": 487.5, "learning_rate": 1.046857142857143e-06, "loss": 0.226, "step": 35100 }, { "epoch": 487.64, "learning_rate": 1.0354285714285716e-06, "loss": 0.2282, "step": 35110 }, { "epoch": 487.78, "learning_rate": 1.024e-06, "loss": 0.2298, "step": 35120 }, { "epoch": 487.91, "learning_rate": 1.0125714285714285e-06, "loss": 0.2328, "step": 35130 }, { "epoch": 488.0, "eval_loss": 0.6834743618965149, "eval_runtime": 129.3844, "eval_samples_per_second": 4.112, "eval_steps_per_second": 0.518, "eval_wer": 0.2229864369737096, "step": 35136 }, { "epoch": 488.06, "learning_rate": 1.0011428571428572e-06, "loss": 0.2248, "step": 35140 }, { "epoch": 488.19, "learning_rate": 9.897142857142858e-07, "loss": 0.2326, "step": 35150 }, { "epoch": 488.33, "learning_rate": 9.782857142857145e-07, "loss": 0.2303, "step": 35160 }, { "epoch": 488.47, "learning_rate": 9.668571428571429e-07, "loss": 0.2338, "step": 35170 }, { "epoch": 488.61, "learning_rate": 9.554285714285715e-07, "loss": 0.2179, "step": 35180 }, { "epoch": 488.75, "learning_rate": 9.440000000000001e-07, "loss": 0.2297, "step": 35190 }, { "epoch": 488.89, "learning_rate": 9.325714285714286e-07, "loss": 0.2373, "step": 35200 }, { "epoch": 489.0, "eval_loss": 0.6878861784934998, "eval_runtime": 129.5008, "eval_samples_per_second": 4.108, "eval_steps_per_second": 0.517, "eval_wer": 0.22221508002828308, "step": 35208 }, { "epoch": 489.03, "learning_rate": 9.211428571428573e-07, "loss": 0.2324, "step": 35210 }, { "epoch": 489.17, "learning_rate": 9.097142857142858e-07, "loss": 0.2351, "step": 35220 }, { "epoch": 489.3, "learning_rate": 8.982857142857143e-07, "loss": 0.225, "step": 35230 }, { "epoch": 489.44, "learning_rate": 8.868571428571429e-07, "loss": 0.2321, "step": 35240 }, { "epoch": 489.58, "learning_rate": 8.754285714285716e-07, "loss": 0.2256, "step": 35250 }, { "epoch": 489.72, "learning_rate": 8.640000000000001e-07, "loss": 0.2393, "step": 35260 }, { "epoch": 489.86, "learning_rate": 8.525714285714286e-07, "loss": 0.2227, "step": 35270 }, { "epoch": 490.0, "learning_rate": 8.411428571428572e-07, "loss": 0.234, "step": 35280 }, { "epoch": 490.0, "eval_loss": 0.6867592930793762, "eval_runtime": 129.5569, "eval_samples_per_second": 4.106, "eval_steps_per_second": 0.517, "eval_wer": 0.2213794433374044, "step": 35280 }, { "epoch": 490.14, "learning_rate": 8.297142857142857e-07, "loss": 0.2393, "step": 35290 }, { "epoch": 490.28, "learning_rate": 8.182857142857144e-07, "loss": 0.2263, "step": 35300 }, { "epoch": 490.42, "learning_rate": 8.068571428571429e-07, "loss": 0.2338, "step": 35310 }, { "epoch": 490.55, "learning_rate": 7.954285714285715e-07, "loss": 0.2356, "step": 35320 }, { "epoch": 490.69, "learning_rate": 7.84e-07, "loss": 0.2318, "step": 35330 }, { "epoch": 490.83, "learning_rate": 7.725714285714287e-07, "loss": 0.2261, "step": 35340 }, { "epoch": 490.97, "learning_rate": 7.611428571428572e-07, "loss": 0.2274, "step": 35350 }, { "epoch": 491.0, "eval_loss": 0.6868891716003418, "eval_runtime": 129.8019, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.22221508002828308, "step": 35352 }, { "epoch": 491.11, "learning_rate": 7.497142857142859e-07, "loss": 0.2281, "step": 35360 }, { "epoch": 491.25, "learning_rate": 7.382857142857143e-07, "loss": 0.2343, "step": 35370 }, { "epoch": 491.39, "learning_rate": 7.268571428571429e-07, "loss": 0.2322, "step": 35380 }, { "epoch": 491.53, "learning_rate": 7.154285714285715e-07, "loss": 0.2291, "step": 35390 }, { "epoch": 491.66, "learning_rate": 7.040000000000001e-07, "loss": 0.2358, "step": 35400 }, { "epoch": 491.8, "learning_rate": 6.925714285714286e-07, "loss": 0.2218, "step": 35410 }, { "epoch": 491.94, "learning_rate": 6.811428571428571e-07, "loss": 0.2332, "step": 35420 }, { "epoch": 492.0, "eval_loss": 0.6861120462417603, "eval_runtime": 129.6847, "eval_samples_per_second": 4.102, "eval_steps_per_second": 0.517, "eval_wer": 0.2213794433374044, "step": 35424 }, { "epoch": 492.08, "learning_rate": 6.697142857142858e-07, "loss": 0.2303, "step": 35430 }, { "epoch": 492.22, "learning_rate": 6.582857142857143e-07, "loss": 0.2378, "step": 35440 }, { "epoch": 492.36, "learning_rate": 6.46857142857143e-07, "loss": 0.2252, "step": 35450 }, { "epoch": 492.5, "learning_rate": 6.354285714285714e-07, "loss": 0.2312, "step": 35460 }, { "epoch": 492.64, "learning_rate": 6.24e-07, "loss": 0.2218, "step": 35470 }, { "epoch": 492.78, "learning_rate": 6.125714285714286e-07, "loss": 0.2275, "step": 35480 }, { "epoch": 492.91, "learning_rate": 6.011428571428572e-07, "loss": 0.2291, "step": 35490 }, { "epoch": 493.0, "eval_loss": 0.6881063580513, "eval_runtime": 129.2943, "eval_samples_per_second": 4.115, "eval_steps_per_second": 0.518, "eval_wer": 0.22060808639197788, "step": 35496 }, { "epoch": 493.06, "learning_rate": 5.897142857142857e-07, "loss": 0.2446, "step": 35500 }, { "epoch": 493.19, "learning_rate": 5.782857142857144e-07, "loss": 0.2338, "step": 35510 }, { "epoch": 493.33, "learning_rate": 5.668571428571429e-07, "loss": 0.2184, "step": 35520 }, { "epoch": 493.47, "learning_rate": 5.554285714285715e-07, "loss": 0.2156, "step": 35530 }, { "epoch": 493.61, "learning_rate": 5.44e-07, "loss": 0.2213, "step": 35540 }, { "epoch": 493.75, "learning_rate": 5.325714285714287e-07, "loss": 0.2376, "step": 35550 }, { "epoch": 493.89, "learning_rate": 5.211428571428572e-07, "loss": 0.2301, "step": 35560 }, { "epoch": 494.0, "eval_loss": 0.6877050399780273, "eval_runtime": 129.0935, "eval_samples_per_second": 4.121, "eval_steps_per_second": 0.519, "eval_wer": 0.22047952690107347, "step": 35568 }, { "epoch": 494.03, "learning_rate": 5.097142857142857e-07, "loss": 0.228, "step": 35570 }, { "epoch": 494.17, "learning_rate": 4.982857142857144e-07, "loss": 0.2285, "step": 35580 }, { "epoch": 494.3, "learning_rate": 4.868571428571428e-07, "loss": 0.229, "step": 35590 }, { "epoch": 494.44, "learning_rate": 4.754285714285715e-07, "loss": 0.2352, "step": 35600 }, { "epoch": 494.58, "learning_rate": 4.651428571428572e-07, "loss": 0.2224, "step": 35610 }, { "epoch": 494.72, "learning_rate": 4.537142857142857e-07, "loss": 0.2329, "step": 35620 }, { "epoch": 494.86, "learning_rate": 4.422857142857143e-07, "loss": 0.2227, "step": 35630 }, { "epoch": 495.0, "learning_rate": 4.3085714285714286e-07, "loss": 0.2258, "step": 35640 }, { "epoch": 495.0, "eval_loss": 0.6897897720336914, "eval_runtime": 128.969, "eval_samples_per_second": 4.125, "eval_steps_per_second": 0.52, "eval_wer": 0.22028668766471685, "step": 35640 }, { "epoch": 495.14, "learning_rate": 4.1942857142857146e-07, "loss": 0.2399, "step": 35650 }, { "epoch": 495.28, "learning_rate": 4.0800000000000005e-07, "loss": 0.2218, "step": 35660 }, { "epoch": 495.42, "learning_rate": 3.965714285714286e-07, "loss": 0.2338, "step": 35670 }, { "epoch": 495.55, "learning_rate": 3.851428571428572e-07, "loss": 0.2202, "step": 35680 }, { "epoch": 495.69, "learning_rate": 3.7371428571428574e-07, "loss": 0.2253, "step": 35690 }, { "epoch": 495.83, "learning_rate": 3.6228571428571434e-07, "loss": 0.2344, "step": 35700 }, { "epoch": 495.97, "learning_rate": 3.5085714285714283e-07, "loss": 0.2351, "step": 35710 }, { "epoch": 496.0, "eval_loss": 0.6883332133293152, "eval_runtime": 129.7898, "eval_samples_per_second": 4.099, "eval_steps_per_second": 0.516, "eval_wer": 0.22118660410104776, "step": 35712 }, { "epoch": 496.11, "learning_rate": 3.394285714285715e-07, "loss": 0.2281, "step": 35720 }, { "epoch": 496.25, "learning_rate": 3.280000000000001e-07, "loss": 0.2236, "step": 35730 }, { "epoch": 496.39, "learning_rate": 3.1657142857142857e-07, "loss": 0.2178, "step": 35740 }, { "epoch": 496.53, "learning_rate": 3.0514285714285717e-07, "loss": 0.2341, "step": 35750 }, { "epoch": 496.66, "learning_rate": 2.9371428571428577e-07, "loss": 0.235, "step": 35760 }, { "epoch": 496.8, "learning_rate": 2.822857142857143e-07, "loss": 0.2271, "step": 35770 }, { "epoch": 496.94, "learning_rate": 2.7085714285714285e-07, "loss": 0.2345, "step": 35780 }, { "epoch": 497.0, "eval_loss": 0.6914933323860168, "eval_runtime": 129.4647, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.518, "eval_wer": 0.22125088384649996, "step": 35784 }, { "epoch": 497.08, "learning_rate": 2.5942857142857145e-07, "loss": 0.2253, "step": 35790 }, { "epoch": 497.22, "learning_rate": 2.48e-07, "loss": 0.2309, "step": 35800 }, { "epoch": 497.36, "learning_rate": 2.3657142857142857e-07, "loss": 0.2293, "step": 35810 }, { "epoch": 497.5, "learning_rate": 2.2514285714285717e-07, "loss": 0.2413, "step": 35820 }, { "epoch": 497.64, "learning_rate": 2.1371428571428574e-07, "loss": 0.2272, "step": 35830 }, { "epoch": 497.78, "learning_rate": 2.022857142857143e-07, "loss": 0.2265, "step": 35840 }, { "epoch": 497.91, "learning_rate": 1.9085714285714288e-07, "loss": 0.23, "step": 35850 }, { "epoch": 498.0, "eval_loss": 0.6921554207801819, "eval_runtime": 129.2534, "eval_samples_per_second": 4.116, "eval_steps_per_second": 0.518, "eval_wer": 0.22170084206466542, "step": 35856 }, { "epoch": 498.06, "learning_rate": 1.7942857142857145e-07, "loss": 0.2305, "step": 35860 }, { "epoch": 498.19, "learning_rate": 1.68e-07, "loss": 0.2347, "step": 35870 }, { "epoch": 498.33, "learning_rate": 1.5657142857142857e-07, "loss": 0.2279, "step": 35880 }, { "epoch": 498.47, "learning_rate": 1.4514285714285716e-07, "loss": 0.232, "step": 35890 }, { "epoch": 498.61, "learning_rate": 1.337142857142857e-07, "loss": 0.2285, "step": 35900 }, { "epoch": 498.75, "learning_rate": 1.222857142857143e-07, "loss": 0.2265, "step": 35910 }, { "epoch": 498.89, "learning_rate": 1.1085714285714286e-07, "loss": 0.2257, "step": 35920 }, { "epoch": 499.0, "eval_loss": 0.6925147175788879, "eval_runtime": 129.4724, "eval_samples_per_second": 4.109, "eval_steps_per_second": 0.517, "eval_wer": 0.22163656231921322, "step": 35928 }, { "epoch": 499.03, "learning_rate": 9.942857142857144e-08, "loss": 0.2367, "step": 35930 }, { "epoch": 499.17, "learning_rate": 8.800000000000001e-08, "loss": 0.2332, "step": 35940 }, { "epoch": 499.3, "learning_rate": 7.657142857142858e-08, "loss": 0.2284, "step": 35950 }, { "epoch": 499.44, "learning_rate": 6.514285714285715e-08, "loss": 0.2293, "step": 35960 }, { "epoch": 499.58, "learning_rate": 5.3714285714285714e-08, "loss": 0.2248, "step": 35970 }, { "epoch": 499.72, "learning_rate": 4.228571428571429e-08, "loss": 0.2357, "step": 35980 }, { "epoch": 499.86, "learning_rate": 3.085714285714286e-08, "loss": 0.2312, "step": 35990 }, { "epoch": 500.0, "learning_rate": 1.942857142857143e-08, "loss": 0.2273, "step": 36000 }, { "epoch": 500.0, "eval_loss": 0.6914485692977905, "eval_runtime": 129.8818, "eval_samples_per_second": 4.096, "eval_steps_per_second": 0.516, "eval_wer": 0.22054380664652568, "step": 36000 }, { "epoch": 500.0, "step": 36000, "total_flos": 1.360166857740454e+21, "train_loss": 0.3272103496922387, "train_runtime": 967187.3084, "train_samples_per_second": 2.387, "train_steps_per_second": 0.037 } ], "max_steps": 36000, "num_train_epochs": 500, "total_flos": 1.360166857740454e+21, "trial_name": null, "trial_params": null }