whisper-base-common_voice0502 / trainer_state.json
liushaowei's picture
Upload 10 files
5381af2
{
"best_metric": 64.97826497826497,
"best_model_checkpoint": "./whisper-base-common_voice0502/checkpoint-40000",
"epoch": 0.8670582879934103,
"global_step": 40000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 4.7000000000000005e-07,
"loss": 2.8561,
"step": 50
},
{
"epoch": 0.0,
"learning_rate": 9.7e-07,
"loss": 2.1277,
"step": 100
},
{
"epoch": 0.0,
"learning_rate": 1.4700000000000001e-06,
"loss": 1.5504,
"step": 150
},
{
"epoch": 0.0,
"learning_rate": 1.97e-06,
"loss": 1.5439,
"step": 200
},
{
"epoch": 0.01,
"learning_rate": 2.47e-06,
"loss": 1.4361,
"step": 250
},
{
"epoch": 0.01,
"learning_rate": 2.97e-06,
"loss": 1.3545,
"step": 300
},
{
"epoch": 0.01,
"learning_rate": 3.4700000000000002e-06,
"loss": 1.3984,
"step": 350
},
{
"epoch": 0.01,
"learning_rate": 3.97e-06,
"loss": 1.3189,
"step": 400
},
{
"epoch": 0.01,
"learning_rate": 4.47e-06,
"loss": 1.2998,
"step": 450
},
{
"epoch": 0.01,
"learning_rate": 4.970000000000001e-06,
"loss": 1.3097,
"step": 500
},
{
"epoch": 0.01,
"learning_rate": 5.470000000000001e-06,
"loss": 1.2081,
"step": 550
},
{
"epoch": 0.01,
"learning_rate": 5.9700000000000004e-06,
"loss": 1.3417,
"step": 600
},
{
"epoch": 0.01,
"learning_rate": 6.470000000000001e-06,
"loss": 1.3481,
"step": 650
},
{
"epoch": 0.02,
"learning_rate": 6.97e-06,
"loss": 1.3177,
"step": 700
},
{
"epoch": 0.02,
"learning_rate": 7.4700000000000005e-06,
"loss": 1.2098,
"step": 750
},
{
"epoch": 0.02,
"learning_rate": 7.970000000000002e-06,
"loss": 1.2517,
"step": 800
},
{
"epoch": 0.02,
"learning_rate": 8.47e-06,
"loss": 1.2763,
"step": 850
},
{
"epoch": 0.02,
"learning_rate": 8.97e-06,
"loss": 1.1962,
"step": 900
},
{
"epoch": 0.02,
"learning_rate": 9.47e-06,
"loss": 1.2287,
"step": 950
},
{
"epoch": 0.02,
"learning_rate": 9.970000000000001e-06,
"loss": 1.3095,
"step": 1000
},
{
"epoch": 0.02,
"learning_rate": 9.987948717948719e-06,
"loss": 1.1799,
"step": 1050
},
{
"epoch": 0.02,
"learning_rate": 9.975128205128205e-06,
"loss": 1.1543,
"step": 1100
},
{
"epoch": 0.02,
"learning_rate": 9.962307692307694e-06,
"loss": 1.1441,
"step": 1150
},
{
"epoch": 0.03,
"learning_rate": 9.94948717948718e-06,
"loss": 1.2167,
"step": 1200
},
{
"epoch": 0.03,
"learning_rate": 9.936666666666668e-06,
"loss": 1.2066,
"step": 1250
},
{
"epoch": 0.03,
"learning_rate": 9.923846153846154e-06,
"loss": 1.2142,
"step": 1300
},
{
"epoch": 0.03,
"learning_rate": 9.911025641025643e-06,
"loss": 1.2081,
"step": 1350
},
{
"epoch": 0.03,
"learning_rate": 9.89820512820513e-06,
"loss": 1.1554,
"step": 1400
},
{
"epoch": 0.03,
"learning_rate": 9.885384615384617e-06,
"loss": 1.1011,
"step": 1450
},
{
"epoch": 0.03,
"learning_rate": 9.872564102564103e-06,
"loss": 1.1765,
"step": 1500
},
{
"epoch": 0.03,
"learning_rate": 9.85974358974359e-06,
"loss": 1.1114,
"step": 1550
},
{
"epoch": 0.03,
"learning_rate": 9.846923076923077e-06,
"loss": 1.0983,
"step": 1600
},
{
"epoch": 0.04,
"learning_rate": 9.834102564102564e-06,
"loss": 1.1034,
"step": 1650
},
{
"epoch": 0.04,
"learning_rate": 9.821282051282052e-06,
"loss": 1.0933,
"step": 1700
},
{
"epoch": 0.04,
"learning_rate": 9.80846153846154e-06,
"loss": 1.1116,
"step": 1750
},
{
"epoch": 0.04,
"learning_rate": 9.795641025641026e-06,
"loss": 1.1245,
"step": 1800
},
{
"epoch": 0.04,
"learning_rate": 9.782820512820513e-06,
"loss": 1.0554,
"step": 1850
},
{
"epoch": 0.04,
"learning_rate": 9.770000000000001e-06,
"loss": 1.1102,
"step": 1900
},
{
"epoch": 0.04,
"learning_rate": 9.757179487179488e-06,
"loss": 1.16,
"step": 1950
},
{
"epoch": 0.04,
"learning_rate": 9.744358974358975e-06,
"loss": 1.0976,
"step": 2000
},
{
"epoch": 0.04,
"learning_rate": 9.731538461538462e-06,
"loss": 1.0537,
"step": 2050
},
{
"epoch": 0.05,
"learning_rate": 9.71871794871795e-06,
"loss": 1.0902,
"step": 2100
},
{
"epoch": 0.05,
"learning_rate": 9.705897435897437e-06,
"loss": 1.1244,
"step": 2150
},
{
"epoch": 0.05,
"learning_rate": 9.693076923076924e-06,
"loss": 1.1138,
"step": 2200
},
{
"epoch": 0.05,
"learning_rate": 9.68025641025641e-06,
"loss": 1.0549,
"step": 2250
},
{
"epoch": 0.05,
"learning_rate": 9.667435897435898e-06,
"loss": 1.0398,
"step": 2300
},
{
"epoch": 0.05,
"learning_rate": 9.654615384615386e-06,
"loss": 1.0726,
"step": 2350
},
{
"epoch": 0.05,
"learning_rate": 9.641794871794873e-06,
"loss": 1.0889,
"step": 2400
},
{
"epoch": 0.05,
"learning_rate": 9.62897435897436e-06,
"loss": 1.0773,
"step": 2450
},
{
"epoch": 0.05,
"learning_rate": 9.616410256410257e-06,
"loss": 1.0866,
"step": 2500
},
{
"epoch": 0.06,
"learning_rate": 9.603589743589744e-06,
"loss": 1.0817,
"step": 2550
},
{
"epoch": 0.06,
"learning_rate": 9.59076923076923e-06,
"loss": 1.0046,
"step": 2600
},
{
"epoch": 0.06,
"learning_rate": 9.577948717948719e-06,
"loss": 0.9904,
"step": 2650
},
{
"epoch": 0.06,
"learning_rate": 9.565128205128206e-06,
"loss": 1.1984,
"step": 2700
},
{
"epoch": 0.06,
"learning_rate": 9.552307692307693e-06,
"loss": 1.0691,
"step": 2750
},
{
"epoch": 0.06,
"learning_rate": 9.53948717948718e-06,
"loss": 1.0626,
"step": 2800
},
{
"epoch": 0.06,
"learning_rate": 9.526666666666668e-06,
"loss": 1.1149,
"step": 2850
},
{
"epoch": 0.06,
"learning_rate": 9.513846153846155e-06,
"loss": 0.9861,
"step": 2900
},
{
"epoch": 0.06,
"learning_rate": 9.501025641025642e-06,
"loss": 1.0764,
"step": 2950
},
{
"epoch": 0.07,
"learning_rate": 9.488205128205129e-06,
"loss": 1.0113,
"step": 3000
},
{
"epoch": 0.07,
"learning_rate": 9.475384615384617e-06,
"loss": 1.0731,
"step": 3050
},
{
"epoch": 0.07,
"learning_rate": 9.462564102564104e-06,
"loss": 1.031,
"step": 3100
},
{
"epoch": 0.07,
"learning_rate": 9.44974358974359e-06,
"loss": 1.0187,
"step": 3150
},
{
"epoch": 0.07,
"learning_rate": 9.436923076923078e-06,
"loss": 1.0408,
"step": 3200
},
{
"epoch": 0.07,
"learning_rate": 9.424102564102564e-06,
"loss": 1.1287,
"step": 3250
},
{
"epoch": 0.07,
"learning_rate": 9.411282051282053e-06,
"loss": 1.0135,
"step": 3300
},
{
"epoch": 0.07,
"learning_rate": 9.39846153846154e-06,
"loss": 1.0801,
"step": 3350
},
{
"epoch": 0.07,
"learning_rate": 9.385641025641027e-06,
"loss": 0.9575,
"step": 3400
},
{
"epoch": 0.07,
"learning_rate": 9.372820512820513e-06,
"loss": 1.0608,
"step": 3450
},
{
"epoch": 0.08,
"learning_rate": 9.360000000000002e-06,
"loss": 0.9936,
"step": 3500
},
{
"epoch": 0.08,
"learning_rate": 9.347179487179487e-06,
"loss": 1.0566,
"step": 3550
},
{
"epoch": 0.08,
"learning_rate": 9.334358974358974e-06,
"loss": 1.0688,
"step": 3600
},
{
"epoch": 0.08,
"learning_rate": 9.321538461538462e-06,
"loss": 1.0538,
"step": 3650
},
{
"epoch": 0.08,
"learning_rate": 9.30871794871795e-06,
"loss": 1.0748,
"step": 3700
},
{
"epoch": 0.08,
"learning_rate": 9.295897435897436e-06,
"loss": 1.0053,
"step": 3750
},
{
"epoch": 0.08,
"learning_rate": 9.283076923076923e-06,
"loss": 0.9508,
"step": 3800
},
{
"epoch": 0.08,
"learning_rate": 9.270256410256411e-06,
"loss": 1.0795,
"step": 3850
},
{
"epoch": 0.08,
"learning_rate": 9.257435897435898e-06,
"loss": 0.9591,
"step": 3900
},
{
"epoch": 0.09,
"learning_rate": 9.244615384615385e-06,
"loss": 0.9743,
"step": 3950
},
{
"epoch": 0.09,
"learning_rate": 9.231794871794872e-06,
"loss": 1.0612,
"step": 4000
},
{
"epoch": 0.09,
"eval_loss": 0.4351472556591034,
"eval_runtime": 2537.7667,
"eval_samples_per_second": 4.169,
"eval_steps_per_second": 0.13,
"eval_wer": 83.14118314118313,
"step": 4000
},
{
"epoch": 0.09,
"learning_rate": 9.21897435897436e-06,
"loss": 1.0269,
"step": 4050
},
{
"epoch": 0.09,
"learning_rate": 9.206153846153847e-06,
"loss": 1.0935,
"step": 4100
},
{
"epoch": 0.09,
"learning_rate": 9.193333333333334e-06,
"loss": 0.9632,
"step": 4150
},
{
"epoch": 0.09,
"learning_rate": 9.18051282051282e-06,
"loss": 1.0797,
"step": 4200
},
{
"epoch": 0.09,
"learning_rate": 9.16769230769231e-06,
"loss": 1.0288,
"step": 4250
},
{
"epoch": 0.09,
"learning_rate": 9.154871794871796e-06,
"loss": 0.9837,
"step": 4300
},
{
"epoch": 0.09,
"learning_rate": 9.142051282051283e-06,
"loss": 0.9999,
"step": 4350
},
{
"epoch": 0.1,
"learning_rate": 9.12923076923077e-06,
"loss": 1.0741,
"step": 4400
},
{
"epoch": 0.1,
"learning_rate": 9.116410256410257e-06,
"loss": 1.0865,
"step": 4450
},
{
"epoch": 0.1,
"learning_rate": 9.103589743589745e-06,
"loss": 1.0139,
"step": 4500
},
{
"epoch": 0.1,
"learning_rate": 9.090769230769232e-06,
"loss": 1.0065,
"step": 4550
},
{
"epoch": 0.1,
"learning_rate": 9.077948717948719e-06,
"loss": 1.0032,
"step": 4600
},
{
"epoch": 0.1,
"learning_rate": 9.065128205128206e-06,
"loss": 0.9768,
"step": 4650
},
{
"epoch": 0.1,
"learning_rate": 9.052307692307694e-06,
"loss": 0.9932,
"step": 4700
},
{
"epoch": 0.1,
"learning_rate": 9.03948717948718e-06,
"loss": 0.9384,
"step": 4750
},
{
"epoch": 0.1,
"learning_rate": 9.026666666666666e-06,
"loss": 1.0154,
"step": 4800
},
{
"epoch": 0.11,
"learning_rate": 9.013846153846155e-06,
"loss": 0.9847,
"step": 4850
},
{
"epoch": 0.11,
"learning_rate": 9.001025641025641e-06,
"loss": 0.9199,
"step": 4900
},
{
"epoch": 0.11,
"learning_rate": 8.988205128205128e-06,
"loss": 1.0063,
"step": 4950
},
{
"epoch": 0.11,
"learning_rate": 8.975384615384615e-06,
"loss": 1.0245,
"step": 5000
},
{
"epoch": 0.11,
"learning_rate": 8.962564102564104e-06,
"loss": 0.9681,
"step": 5050
},
{
"epoch": 0.11,
"learning_rate": 8.94974358974359e-06,
"loss": 0.9625,
"step": 5100
},
{
"epoch": 0.11,
"learning_rate": 8.936923076923077e-06,
"loss": 0.9865,
"step": 5150
},
{
"epoch": 0.11,
"learning_rate": 8.924102564102564e-06,
"loss": 0.9794,
"step": 5200
},
{
"epoch": 0.11,
"learning_rate": 8.911282051282053e-06,
"loss": 0.9455,
"step": 5250
},
{
"epoch": 0.11,
"learning_rate": 8.89846153846154e-06,
"loss": 0.96,
"step": 5300
},
{
"epoch": 0.12,
"learning_rate": 8.885641025641026e-06,
"loss": 0.9918,
"step": 5350
},
{
"epoch": 0.12,
"learning_rate": 8.872820512820513e-06,
"loss": 0.9797,
"step": 5400
},
{
"epoch": 0.12,
"learning_rate": 8.860000000000002e-06,
"loss": 1.0075,
"step": 5450
},
{
"epoch": 0.12,
"learning_rate": 8.847179487179488e-06,
"loss": 0.9661,
"step": 5500
},
{
"epoch": 0.12,
"learning_rate": 8.834358974358975e-06,
"loss": 0.9275,
"step": 5550
},
{
"epoch": 0.12,
"learning_rate": 8.821538461538462e-06,
"loss": 0.9913,
"step": 5600
},
{
"epoch": 0.12,
"learning_rate": 8.80871794871795e-06,
"loss": 0.9891,
"step": 5650
},
{
"epoch": 0.12,
"learning_rate": 8.795897435897437e-06,
"loss": 0.9671,
"step": 5700
},
{
"epoch": 0.12,
"learning_rate": 8.783076923076924e-06,
"loss": 0.925,
"step": 5750
},
{
"epoch": 0.13,
"learning_rate": 8.770256410256411e-06,
"loss": 0.9449,
"step": 5800
},
{
"epoch": 0.13,
"learning_rate": 8.757435897435898e-06,
"loss": 1.0119,
"step": 5850
},
{
"epoch": 0.13,
"learning_rate": 8.744615384615386e-06,
"loss": 1.0217,
"step": 5900
},
{
"epoch": 0.13,
"learning_rate": 8.731794871794873e-06,
"loss": 0.9794,
"step": 5950
},
{
"epoch": 0.13,
"learning_rate": 8.718974358974358e-06,
"loss": 1.0236,
"step": 6000
},
{
"epoch": 0.13,
"learning_rate": 8.706153846153847e-06,
"loss": 1.0065,
"step": 6050
},
{
"epoch": 0.13,
"learning_rate": 8.693333333333334e-06,
"loss": 0.9238,
"step": 6100
},
{
"epoch": 0.13,
"learning_rate": 8.68051282051282e-06,
"loss": 0.9403,
"step": 6150
},
{
"epoch": 0.13,
"learning_rate": 8.667692307692307e-06,
"loss": 0.9365,
"step": 6200
},
{
"epoch": 0.14,
"learning_rate": 8.654871794871796e-06,
"loss": 1.0259,
"step": 6250
},
{
"epoch": 0.14,
"learning_rate": 8.642051282051283e-06,
"loss": 0.9234,
"step": 6300
},
{
"epoch": 0.14,
"learning_rate": 8.62923076923077e-06,
"loss": 0.9249,
"step": 6350
},
{
"epoch": 0.14,
"learning_rate": 8.616666666666668e-06,
"loss": 0.9409,
"step": 6400
},
{
"epoch": 0.14,
"learning_rate": 8.603846153846155e-06,
"loss": 0.941,
"step": 6450
},
{
"epoch": 0.14,
"learning_rate": 8.591025641025642e-06,
"loss": 0.9172,
"step": 6500
},
{
"epoch": 0.14,
"learning_rate": 8.578205128205129e-06,
"loss": 0.9804,
"step": 6550
},
{
"epoch": 0.14,
"learning_rate": 8.565384615384617e-06,
"loss": 0.9599,
"step": 6600
},
{
"epoch": 0.14,
"learning_rate": 8.552564102564104e-06,
"loss": 0.9646,
"step": 6650
},
{
"epoch": 0.15,
"learning_rate": 8.539743589743591e-06,
"loss": 0.9661,
"step": 6700
},
{
"epoch": 0.15,
"learning_rate": 8.526923076923078e-06,
"loss": 0.8645,
"step": 6750
},
{
"epoch": 0.15,
"learning_rate": 8.514102564102565e-06,
"loss": 0.8842,
"step": 6800
},
{
"epoch": 0.15,
"learning_rate": 8.501282051282051e-06,
"loss": 0.9561,
"step": 6850
},
{
"epoch": 0.15,
"learning_rate": 8.488461538461538e-06,
"loss": 0.968,
"step": 6900
},
{
"epoch": 0.15,
"learning_rate": 8.475641025641027e-06,
"loss": 0.9069,
"step": 6950
},
{
"epoch": 0.15,
"learning_rate": 8.462820512820514e-06,
"loss": 0.9145,
"step": 7000
},
{
"epoch": 0.15,
"learning_rate": 8.45e-06,
"loss": 1.0245,
"step": 7050
},
{
"epoch": 0.15,
"learning_rate": 8.437179487179487e-06,
"loss": 0.9759,
"step": 7100
},
{
"epoch": 0.15,
"learning_rate": 8.424358974358974e-06,
"loss": 1.0075,
"step": 7150
},
{
"epoch": 0.16,
"learning_rate": 8.411538461538463e-06,
"loss": 0.9605,
"step": 7200
},
{
"epoch": 0.16,
"learning_rate": 8.39871794871795e-06,
"loss": 0.9634,
"step": 7250
},
{
"epoch": 0.16,
"learning_rate": 8.385897435897436e-06,
"loss": 0.8981,
"step": 7300
},
{
"epoch": 0.16,
"learning_rate": 8.373076923076923e-06,
"loss": 1.0294,
"step": 7350
},
{
"epoch": 0.16,
"learning_rate": 8.360256410256412e-06,
"loss": 0.9765,
"step": 7400
},
{
"epoch": 0.16,
"learning_rate": 8.347435897435898e-06,
"loss": 0.8643,
"step": 7450
},
{
"epoch": 0.16,
"learning_rate": 8.334615384615385e-06,
"loss": 1.0503,
"step": 7500
},
{
"epoch": 0.16,
"learning_rate": 8.321794871794872e-06,
"loss": 0.9202,
"step": 7550
},
{
"epoch": 0.16,
"learning_rate": 8.30897435897436e-06,
"loss": 0.9152,
"step": 7600
},
{
"epoch": 0.17,
"learning_rate": 8.296153846153847e-06,
"loss": 0.9796,
"step": 7650
},
{
"epoch": 0.17,
"learning_rate": 8.283333333333334e-06,
"loss": 0.9664,
"step": 7700
},
{
"epoch": 0.17,
"learning_rate": 8.270512820512821e-06,
"loss": 0.9215,
"step": 7750
},
{
"epoch": 0.17,
"learning_rate": 8.25769230769231e-06,
"loss": 0.9392,
"step": 7800
},
{
"epoch": 0.17,
"learning_rate": 8.244871794871796e-06,
"loss": 0.9879,
"step": 7850
},
{
"epoch": 0.17,
"learning_rate": 8.232051282051283e-06,
"loss": 0.9373,
"step": 7900
},
{
"epoch": 0.17,
"learning_rate": 8.21923076923077e-06,
"loss": 0.8937,
"step": 7950
},
{
"epoch": 0.17,
"learning_rate": 8.206410256410257e-06,
"loss": 0.8558,
"step": 8000
},
{
"epoch": 0.17,
"eval_loss": 0.37861934304237366,
"eval_runtime": 2347.8802,
"eval_samples_per_second": 4.507,
"eval_steps_per_second": 0.141,
"eval_wer": 78.34057834057833,
"step": 8000
},
{
"epoch": 0.17,
"learning_rate": 8.193589743589744e-06,
"loss": 0.8994,
"step": 8050
},
{
"epoch": 0.18,
"learning_rate": 8.18076923076923e-06,
"loss": 0.9032,
"step": 8100
},
{
"epoch": 0.18,
"learning_rate": 8.167948717948719e-06,
"loss": 0.9623,
"step": 8150
},
{
"epoch": 0.18,
"learning_rate": 8.155128205128206e-06,
"loss": 0.8825,
"step": 8200
},
{
"epoch": 0.18,
"learning_rate": 8.142564102564103e-06,
"loss": 0.9967,
"step": 8250
},
{
"epoch": 0.18,
"learning_rate": 8.12974358974359e-06,
"loss": 0.8167,
"step": 8300
},
{
"epoch": 0.18,
"learning_rate": 8.116923076923078e-06,
"loss": 0.8482,
"step": 8350
},
{
"epoch": 0.18,
"learning_rate": 8.104102564102565e-06,
"loss": 0.9776,
"step": 8400
},
{
"epoch": 0.18,
"learning_rate": 8.091282051282052e-06,
"loss": 0.8644,
"step": 8450
},
{
"epoch": 0.18,
"learning_rate": 8.078461538461539e-06,
"loss": 0.8732,
"step": 8500
},
{
"epoch": 0.19,
"learning_rate": 8.065641025641027e-06,
"loss": 0.9447,
"step": 8550
},
{
"epoch": 0.19,
"learning_rate": 8.052820512820514e-06,
"loss": 0.8957,
"step": 8600
},
{
"epoch": 0.19,
"learning_rate": 8.040000000000001e-06,
"loss": 0.9365,
"step": 8650
},
{
"epoch": 0.19,
"learning_rate": 8.027179487179488e-06,
"loss": 0.8746,
"step": 8700
},
{
"epoch": 0.19,
"learning_rate": 8.014358974358975e-06,
"loss": 0.8635,
"step": 8750
},
{
"epoch": 0.19,
"learning_rate": 8.001538461538461e-06,
"loss": 0.8931,
"step": 8800
},
{
"epoch": 0.19,
"learning_rate": 7.988717948717948e-06,
"loss": 0.9487,
"step": 8850
},
{
"epoch": 0.19,
"learning_rate": 7.975897435897437e-06,
"loss": 0.9137,
"step": 8900
},
{
"epoch": 0.19,
"learning_rate": 7.963076923076924e-06,
"loss": 0.8445,
"step": 8950
},
{
"epoch": 0.2,
"learning_rate": 7.95025641025641e-06,
"loss": 0.9021,
"step": 9000
},
{
"epoch": 0.2,
"learning_rate": 7.937435897435897e-06,
"loss": 0.9535,
"step": 9050
},
{
"epoch": 0.2,
"learning_rate": 7.924615384615386e-06,
"loss": 0.8456,
"step": 9100
},
{
"epoch": 0.2,
"learning_rate": 7.911794871794873e-06,
"loss": 0.9153,
"step": 9150
},
{
"epoch": 0.2,
"learning_rate": 7.89897435897436e-06,
"loss": 0.8893,
"step": 9200
},
{
"epoch": 0.2,
"learning_rate": 7.886153846153846e-06,
"loss": 0.8867,
"step": 9250
},
{
"epoch": 0.2,
"learning_rate": 7.873333333333335e-06,
"loss": 0.8725,
"step": 9300
},
{
"epoch": 0.2,
"learning_rate": 7.860512820512822e-06,
"loss": 0.8142,
"step": 9350
},
{
"epoch": 0.2,
"learning_rate": 7.847692307692308e-06,
"loss": 0.9261,
"step": 9400
},
{
"epoch": 0.2,
"learning_rate": 7.834871794871795e-06,
"loss": 0.9693,
"step": 9450
},
{
"epoch": 0.21,
"learning_rate": 7.822051282051282e-06,
"loss": 0.8627,
"step": 9500
},
{
"epoch": 0.21,
"learning_rate": 7.80923076923077e-06,
"loss": 0.85,
"step": 9550
},
{
"epoch": 0.21,
"learning_rate": 7.796410256410257e-06,
"loss": 0.8674,
"step": 9600
},
{
"epoch": 0.21,
"learning_rate": 7.783589743589744e-06,
"loss": 0.9627,
"step": 9650
},
{
"epoch": 0.21,
"learning_rate": 7.770769230769231e-06,
"loss": 0.906,
"step": 9700
},
{
"epoch": 0.21,
"learning_rate": 7.75794871794872e-06,
"loss": 0.8261,
"step": 9750
},
{
"epoch": 0.21,
"learning_rate": 7.745128205128206e-06,
"loss": 0.8949,
"step": 9800
},
{
"epoch": 0.21,
"learning_rate": 7.732307692307693e-06,
"loss": 0.9519,
"step": 9850
},
{
"epoch": 0.21,
"learning_rate": 7.71948717948718e-06,
"loss": 0.8861,
"step": 9900
},
{
"epoch": 0.22,
"learning_rate": 7.706666666666669e-06,
"loss": 0.9476,
"step": 9950
},
{
"epoch": 0.22,
"learning_rate": 7.693846153846154e-06,
"loss": 0.9045,
"step": 10000
},
{
"epoch": 0.22,
"learning_rate": 7.68102564102564e-06,
"loss": 0.955,
"step": 10050
},
{
"epoch": 0.22,
"learning_rate": 7.668205128205129e-06,
"loss": 0.9103,
"step": 10100
},
{
"epoch": 0.22,
"learning_rate": 7.655384615384616e-06,
"loss": 0.8718,
"step": 10150
},
{
"epoch": 0.22,
"learning_rate": 7.642564102564103e-06,
"loss": 0.8664,
"step": 10200
},
{
"epoch": 0.22,
"learning_rate": 7.62974358974359e-06,
"loss": 0.8745,
"step": 10250
},
{
"epoch": 0.22,
"learning_rate": 7.616923076923077e-06,
"loss": 0.9317,
"step": 10300
},
{
"epoch": 0.22,
"learning_rate": 7.604102564102565e-06,
"loss": 0.8618,
"step": 10350
},
{
"epoch": 0.23,
"learning_rate": 7.591282051282052e-06,
"loss": 0.8996,
"step": 10400
},
{
"epoch": 0.23,
"learning_rate": 7.578461538461539e-06,
"loss": 0.8384,
"step": 10450
},
{
"epoch": 0.23,
"learning_rate": 7.565641025641026e-06,
"loss": 0.9845,
"step": 10500
},
{
"epoch": 0.23,
"learning_rate": 7.552820512820514e-06,
"loss": 0.8287,
"step": 10550
},
{
"epoch": 0.23,
"learning_rate": 7.540000000000001e-06,
"loss": 0.9573,
"step": 10600
},
{
"epoch": 0.23,
"learning_rate": 7.5271794871794875e-06,
"loss": 0.8777,
"step": 10650
},
{
"epoch": 0.23,
"learning_rate": 7.514358974358975e-06,
"loss": 0.9686,
"step": 10700
},
{
"epoch": 0.23,
"learning_rate": 7.501538461538462e-06,
"loss": 0.8655,
"step": 10750
},
{
"epoch": 0.23,
"learning_rate": 7.48871794871795e-06,
"loss": 0.8344,
"step": 10800
},
{
"epoch": 0.24,
"learning_rate": 7.4758974358974365e-06,
"loss": 0.9327,
"step": 10850
},
{
"epoch": 0.24,
"learning_rate": 7.463076923076924e-06,
"loss": 0.9102,
"step": 10900
},
{
"epoch": 0.24,
"learning_rate": 7.450256410256411e-06,
"loss": 0.8639,
"step": 10950
},
{
"epoch": 0.24,
"learning_rate": 7.437435897435899e-06,
"loss": 0.7969,
"step": 11000
},
{
"epoch": 0.24,
"learning_rate": 7.4246153846153855e-06,
"loss": 0.9236,
"step": 11050
},
{
"epoch": 0.24,
"learning_rate": 7.411794871794873e-06,
"loss": 0.8887,
"step": 11100
},
{
"epoch": 0.24,
"learning_rate": 7.39897435897436e-06,
"loss": 0.9512,
"step": 11150
},
{
"epoch": 0.24,
"learning_rate": 7.386153846153846e-06,
"loss": 0.8883,
"step": 11200
},
{
"epoch": 0.24,
"learning_rate": 7.373333333333334e-06,
"loss": 0.9263,
"step": 11250
},
{
"epoch": 0.24,
"learning_rate": 7.3605128205128204e-06,
"loss": 0.8522,
"step": 11300
},
{
"epoch": 0.25,
"learning_rate": 7.347692307692308e-06,
"loss": 0.8411,
"step": 11350
},
{
"epoch": 0.25,
"learning_rate": 7.334871794871795e-06,
"loss": 0.9144,
"step": 11400
},
{
"epoch": 0.25,
"learning_rate": 7.322051282051283e-06,
"loss": 0.8312,
"step": 11450
},
{
"epoch": 0.25,
"learning_rate": 7.309230769230769e-06,
"loss": 0.8642,
"step": 11500
},
{
"epoch": 0.25,
"learning_rate": 7.296410256410257e-06,
"loss": 0.8949,
"step": 11550
},
{
"epoch": 0.25,
"learning_rate": 7.283589743589744e-06,
"loss": 0.9084,
"step": 11600
},
{
"epoch": 0.25,
"learning_rate": 7.270769230769232e-06,
"loss": 0.8532,
"step": 11650
},
{
"epoch": 0.25,
"learning_rate": 7.257948717948718e-06,
"loss": 0.9145,
"step": 11700
},
{
"epoch": 0.25,
"learning_rate": 7.245128205128206e-06,
"loss": 0.9374,
"step": 11750
},
{
"epoch": 0.26,
"learning_rate": 7.232307692307693e-06,
"loss": 0.9016,
"step": 11800
},
{
"epoch": 0.26,
"learning_rate": 7.21948717948718e-06,
"loss": 0.8444,
"step": 11850
},
{
"epoch": 0.26,
"learning_rate": 7.206666666666667e-06,
"loss": 0.8414,
"step": 11900
},
{
"epoch": 0.26,
"learning_rate": 7.193846153846154e-06,
"loss": 0.9172,
"step": 11950
},
{
"epoch": 0.26,
"learning_rate": 7.181025641025642e-06,
"loss": 0.9109,
"step": 12000
},
{
"epoch": 0.26,
"eval_loss": 0.343860000371933,
"eval_runtime": 2361.4858,
"eval_samples_per_second": 4.481,
"eval_steps_per_second": 0.14,
"eval_wer": 75.74182574182574,
"step": 12000
},
{
"epoch": 0.26,
"learning_rate": 7.168205128205129e-06,
"loss": 0.937,
"step": 12050
},
{
"epoch": 0.26,
"learning_rate": 7.155384615384616e-06,
"loss": 0.8721,
"step": 12100
},
{
"epoch": 0.26,
"learning_rate": 7.142564102564103e-06,
"loss": 0.9569,
"step": 12150
},
{
"epoch": 0.26,
"learning_rate": 7.129743589743591e-06,
"loss": 0.9084,
"step": 12200
},
{
"epoch": 0.27,
"learning_rate": 7.116923076923078e-06,
"loss": 0.8028,
"step": 12250
},
{
"epoch": 0.27,
"learning_rate": 7.104102564102565e-06,
"loss": 0.875,
"step": 12300
},
{
"epoch": 0.27,
"learning_rate": 7.091282051282052e-06,
"loss": 0.9257,
"step": 12350
},
{
"epoch": 0.27,
"learning_rate": 7.078461538461538e-06,
"loss": 0.8943,
"step": 12400
},
{
"epoch": 0.27,
"learning_rate": 7.065641025641026e-06,
"loss": 0.8458,
"step": 12450
},
{
"epoch": 0.27,
"learning_rate": 7.052820512820513e-06,
"loss": 0.856,
"step": 12500
},
{
"epoch": 0.27,
"learning_rate": 7.04e-06,
"loss": 0.8905,
"step": 12550
},
{
"epoch": 0.27,
"learning_rate": 7.027179487179487e-06,
"loss": 0.8732,
"step": 12600
},
{
"epoch": 0.27,
"learning_rate": 7.014358974358975e-06,
"loss": 0.8868,
"step": 12650
},
{
"epoch": 0.28,
"learning_rate": 7.001538461538462e-06,
"loss": 0.857,
"step": 12700
},
{
"epoch": 0.28,
"learning_rate": 6.988717948717949e-06,
"loss": 0.8119,
"step": 12750
},
{
"epoch": 0.28,
"learning_rate": 6.975897435897436e-06,
"loss": 0.8115,
"step": 12800
},
{
"epoch": 0.28,
"learning_rate": 6.963076923076924e-06,
"loss": 0.8636,
"step": 12850
},
{
"epoch": 0.28,
"learning_rate": 6.950256410256411e-06,
"loss": 0.8649,
"step": 12900
},
{
"epoch": 0.28,
"learning_rate": 6.937435897435898e-06,
"loss": 0.8017,
"step": 12950
},
{
"epoch": 0.28,
"learning_rate": 6.924615384615385e-06,
"loss": 0.8575,
"step": 13000
},
{
"epoch": 0.28,
"learning_rate": 6.911794871794872e-06,
"loss": 0.837,
"step": 13050
},
{
"epoch": 0.28,
"learning_rate": 6.89897435897436e-06,
"loss": 0.8036,
"step": 13100
},
{
"epoch": 0.29,
"learning_rate": 6.8861538461538465e-06,
"loss": 0.8588,
"step": 13150
},
{
"epoch": 0.29,
"learning_rate": 6.873333333333334e-06,
"loss": 0.8328,
"step": 13200
},
{
"epoch": 0.29,
"learning_rate": 6.860512820512821e-06,
"loss": 0.8611,
"step": 13250
},
{
"epoch": 0.29,
"learning_rate": 6.847692307692309e-06,
"loss": 0.862,
"step": 13300
},
{
"epoch": 0.29,
"learning_rate": 6.8348717948717955e-06,
"loss": 0.8616,
"step": 13350
},
{
"epoch": 0.29,
"learning_rate": 6.822051282051283e-06,
"loss": 0.8776,
"step": 13400
},
{
"epoch": 0.29,
"learning_rate": 6.80923076923077e-06,
"loss": 0.8725,
"step": 13450
},
{
"epoch": 0.29,
"learning_rate": 6.796410256410258e-06,
"loss": 0.8838,
"step": 13500
},
{
"epoch": 0.29,
"learning_rate": 6.7835897435897445e-06,
"loss": 0.8285,
"step": 13550
},
{
"epoch": 0.29,
"learning_rate": 6.770769230769232e-06,
"loss": 0.859,
"step": 13600
},
{
"epoch": 0.3,
"learning_rate": 6.757948717948718e-06,
"loss": 0.8535,
"step": 13650
},
{
"epoch": 0.3,
"learning_rate": 6.745128205128205e-06,
"loss": 0.7801,
"step": 13700
},
{
"epoch": 0.3,
"learning_rate": 6.732307692307693e-06,
"loss": 0.8726,
"step": 13750
},
{
"epoch": 0.3,
"learning_rate": 6.7194871794871794e-06,
"loss": 0.92,
"step": 13800
},
{
"epoch": 0.3,
"learning_rate": 6.706666666666667e-06,
"loss": 0.927,
"step": 13850
},
{
"epoch": 0.3,
"learning_rate": 6.693846153846154e-06,
"loss": 0.9115,
"step": 13900
},
{
"epoch": 0.3,
"learning_rate": 6.681025641025642e-06,
"loss": 0.8339,
"step": 13950
},
{
"epoch": 0.3,
"learning_rate": 6.6682051282051284e-06,
"loss": 0.8136,
"step": 14000
},
{
"epoch": 0.3,
"learning_rate": 6.655384615384616e-06,
"loss": 0.852,
"step": 14050
},
{
"epoch": 0.31,
"learning_rate": 6.642564102564103e-06,
"loss": 0.8495,
"step": 14100
},
{
"epoch": 0.31,
"learning_rate": 6.629743589743591e-06,
"loss": 0.9006,
"step": 14150
},
{
"epoch": 0.31,
"learning_rate": 6.616923076923077e-06,
"loss": 0.8732,
"step": 14200
},
{
"epoch": 0.31,
"learning_rate": 6.604102564102565e-06,
"loss": 0.8505,
"step": 14250
},
{
"epoch": 0.31,
"learning_rate": 6.591282051282052e-06,
"loss": 0.9086,
"step": 14300
},
{
"epoch": 0.31,
"learning_rate": 6.578461538461539e-06,
"loss": 0.7929,
"step": 14350
},
{
"epoch": 0.31,
"learning_rate": 6.565641025641026e-06,
"loss": 0.836,
"step": 14400
},
{
"epoch": 0.31,
"learning_rate": 6.552820512820513e-06,
"loss": 0.8503,
"step": 14450
},
{
"epoch": 0.31,
"learning_rate": 6.540000000000001e-06,
"loss": 0.8556,
"step": 14500
},
{
"epoch": 0.32,
"learning_rate": 6.527179487179488e-06,
"loss": 0.8645,
"step": 14550
},
{
"epoch": 0.32,
"learning_rate": 6.514615384615385e-06,
"loss": 0.9161,
"step": 14600
},
{
"epoch": 0.32,
"learning_rate": 6.501794871794872e-06,
"loss": 0.8358,
"step": 14650
},
{
"epoch": 0.32,
"learning_rate": 6.488974358974359e-06,
"loss": 0.8968,
"step": 14700
},
{
"epoch": 0.32,
"learning_rate": 6.476153846153846e-06,
"loss": 0.8117,
"step": 14750
},
{
"epoch": 0.32,
"learning_rate": 6.463333333333334e-06,
"loss": 0.8847,
"step": 14800
},
{
"epoch": 0.32,
"learning_rate": 6.450512820512821e-06,
"loss": 0.9181,
"step": 14850
},
{
"epoch": 0.32,
"learning_rate": 6.437692307692308e-06,
"loss": 0.8921,
"step": 14900
},
{
"epoch": 0.32,
"learning_rate": 6.424871794871795e-06,
"loss": 0.9063,
"step": 14950
},
{
"epoch": 0.33,
"learning_rate": 6.412051282051283e-06,
"loss": 0.9255,
"step": 15000
},
{
"epoch": 0.33,
"learning_rate": 6.39923076923077e-06,
"loss": 0.867,
"step": 15050
},
{
"epoch": 0.33,
"learning_rate": 6.386410256410257e-06,
"loss": 0.8736,
"step": 15100
},
{
"epoch": 0.33,
"learning_rate": 6.373589743589744e-06,
"loss": 0.8517,
"step": 15150
},
{
"epoch": 0.33,
"learning_rate": 6.360769230769232e-06,
"loss": 0.8799,
"step": 15200
},
{
"epoch": 0.33,
"learning_rate": 6.347948717948719e-06,
"loss": 0.7834,
"step": 15250
},
{
"epoch": 0.33,
"learning_rate": 6.335128205128206e-06,
"loss": 0.857,
"step": 15300
},
{
"epoch": 0.33,
"learning_rate": 6.322307692307693e-06,
"loss": 0.8723,
"step": 15350
},
{
"epoch": 0.33,
"learning_rate": 6.30948717948718e-06,
"loss": 0.8364,
"step": 15400
},
{
"epoch": 0.33,
"learning_rate": 6.296666666666668e-06,
"loss": 0.7583,
"step": 15450
},
{
"epoch": 0.34,
"learning_rate": 6.2838461538461545e-06,
"loss": 0.8553,
"step": 15500
},
{
"epoch": 0.34,
"learning_rate": 6.271025641025642e-06,
"loss": 0.8032,
"step": 15550
},
{
"epoch": 0.34,
"learning_rate": 6.258205128205129e-06,
"loss": 0.8224,
"step": 15600
},
{
"epoch": 0.34,
"learning_rate": 6.245384615384616e-06,
"loss": 0.8567,
"step": 15650
},
{
"epoch": 0.34,
"learning_rate": 6.232564102564103e-06,
"loss": 0.8267,
"step": 15700
},
{
"epoch": 0.34,
"learning_rate": 6.2197435897435894e-06,
"loss": 0.8053,
"step": 15750
},
{
"epoch": 0.34,
"learning_rate": 6.206923076923077e-06,
"loss": 0.7789,
"step": 15800
},
{
"epoch": 0.34,
"learning_rate": 6.194102564102564e-06,
"loss": 0.8372,
"step": 15850
},
{
"epoch": 0.34,
"learning_rate": 6.181282051282052e-06,
"loss": 0.8842,
"step": 15900
},
{
"epoch": 0.35,
"learning_rate": 6.1684615384615384e-06,
"loss": 0.7784,
"step": 15950
},
{
"epoch": 0.35,
"learning_rate": 6.155641025641026e-06,
"loss": 0.8203,
"step": 16000
},
{
"epoch": 0.35,
"eval_loss": 0.32156890630722046,
"eval_runtime": 2309.1659,
"eval_samples_per_second": 4.582,
"eval_steps_per_second": 0.143,
"eval_wer": 72.77452277452278,
"step": 16000
},
{
"epoch": 0.35,
"learning_rate": 6.142820512820513e-06,
"loss": 0.8743,
"step": 16050
},
{
"epoch": 0.35,
"learning_rate": 6.130000000000001e-06,
"loss": 0.8755,
"step": 16100
},
{
"epoch": 0.35,
"learning_rate": 6.1171794871794874e-06,
"loss": 0.9192,
"step": 16150
},
{
"epoch": 0.35,
"learning_rate": 6.104358974358975e-06,
"loss": 0.8563,
"step": 16200
},
{
"epoch": 0.35,
"learning_rate": 6.091538461538462e-06,
"loss": 0.865,
"step": 16250
},
{
"epoch": 0.35,
"learning_rate": 6.07897435897436e-06,
"loss": 0.8556,
"step": 16300
},
{
"epoch": 0.35,
"learning_rate": 6.0661538461538476e-06,
"loss": 0.8485,
"step": 16350
},
{
"epoch": 0.36,
"learning_rate": 6.0533333333333335e-06,
"loss": 0.8257,
"step": 16400
},
{
"epoch": 0.36,
"learning_rate": 6.04051282051282e-06,
"loss": 0.7927,
"step": 16450
},
{
"epoch": 0.36,
"learning_rate": 6.027692307692308e-06,
"loss": 0.7649,
"step": 16500
},
{
"epoch": 0.36,
"learning_rate": 6.014871794871795e-06,
"loss": 0.8562,
"step": 16550
},
{
"epoch": 0.36,
"learning_rate": 6.0020512820512825e-06,
"loss": 0.9156,
"step": 16600
},
{
"epoch": 0.36,
"learning_rate": 5.989230769230769e-06,
"loss": 0.9004,
"step": 16650
},
{
"epoch": 0.36,
"learning_rate": 5.976410256410257e-06,
"loss": 0.8761,
"step": 16700
},
{
"epoch": 0.36,
"learning_rate": 5.963589743589744e-06,
"loss": 0.7352,
"step": 16750
},
{
"epoch": 0.36,
"learning_rate": 5.950769230769231e-06,
"loss": 0.8805,
"step": 16800
},
{
"epoch": 0.37,
"learning_rate": 5.937948717948718e-06,
"loss": 0.8591,
"step": 16850
},
{
"epoch": 0.37,
"learning_rate": 5.925128205128205e-06,
"loss": 0.7584,
"step": 16900
},
{
"epoch": 0.37,
"learning_rate": 5.912307692307693e-06,
"loss": 0.8739,
"step": 16950
},
{
"epoch": 0.37,
"learning_rate": 5.89948717948718e-06,
"loss": 0.8465,
"step": 17000
},
{
"epoch": 0.37,
"learning_rate": 5.886666666666667e-06,
"loss": 0.8733,
"step": 17050
},
{
"epoch": 0.37,
"learning_rate": 5.873846153846154e-06,
"loss": 0.8386,
"step": 17100
},
{
"epoch": 0.37,
"learning_rate": 5.861025641025642e-06,
"loss": 0.8337,
"step": 17150
},
{
"epoch": 0.37,
"learning_rate": 5.848205128205129e-06,
"loss": 0.8046,
"step": 17200
},
{
"epoch": 0.37,
"learning_rate": 5.835384615384616e-06,
"loss": 0.819,
"step": 17250
},
{
"epoch": 0.38,
"learning_rate": 5.822564102564103e-06,
"loss": 0.8665,
"step": 17300
},
{
"epoch": 0.38,
"learning_rate": 5.809743589743591e-06,
"loss": 0.7507,
"step": 17350
},
{
"epoch": 0.38,
"learning_rate": 5.796923076923078e-06,
"loss": 0.8599,
"step": 17400
},
{
"epoch": 0.38,
"learning_rate": 5.784102564102565e-06,
"loss": 0.7877,
"step": 17450
},
{
"epoch": 0.38,
"learning_rate": 5.771282051282052e-06,
"loss": 0.8069,
"step": 17500
},
{
"epoch": 0.38,
"learning_rate": 5.75846153846154e-06,
"loss": 0.8001,
"step": 17550
},
{
"epoch": 0.38,
"learning_rate": 5.745641025641027e-06,
"loss": 0.7938,
"step": 17600
},
{
"epoch": 0.38,
"learning_rate": 5.732820512820513e-06,
"loss": 0.7951,
"step": 17650
},
{
"epoch": 0.38,
"learning_rate": 5.72e-06,
"loss": 0.8148,
"step": 17700
},
{
"epoch": 0.38,
"learning_rate": 5.707179487179487e-06,
"loss": 0.8015,
"step": 17750
},
{
"epoch": 0.39,
"learning_rate": 5.694358974358975e-06,
"loss": 0.845,
"step": 17800
},
{
"epoch": 0.39,
"learning_rate": 5.681538461538462e-06,
"loss": 0.8216,
"step": 17850
},
{
"epoch": 0.39,
"learning_rate": 5.668717948717949e-06,
"loss": 0.7611,
"step": 17900
},
{
"epoch": 0.39,
"learning_rate": 5.655897435897436e-06,
"loss": 0.7851,
"step": 17950
},
{
"epoch": 0.39,
"learning_rate": 5.643076923076923e-06,
"loss": 0.8352,
"step": 18000
},
{
"epoch": 0.39,
"learning_rate": 5.630256410256411e-06,
"loss": 0.8161,
"step": 18050
},
{
"epoch": 0.39,
"learning_rate": 5.6174358974358974e-06,
"loss": 0.8156,
"step": 18100
},
{
"epoch": 0.39,
"learning_rate": 5.604615384615385e-06,
"loss": 0.8151,
"step": 18150
},
{
"epoch": 0.39,
"learning_rate": 5.591794871794872e-06,
"loss": 0.8425,
"step": 18200
},
{
"epoch": 0.4,
"learning_rate": 5.57897435897436e-06,
"loss": 0.771,
"step": 18250
},
{
"epoch": 0.4,
"learning_rate": 5.566153846153846e-06,
"loss": 0.7472,
"step": 18300
},
{
"epoch": 0.4,
"learning_rate": 5.553333333333334e-06,
"loss": 0.8373,
"step": 18350
},
{
"epoch": 0.4,
"learning_rate": 5.540512820512821e-06,
"loss": 0.8685,
"step": 18400
},
{
"epoch": 0.4,
"learning_rate": 5.527692307692309e-06,
"loss": 0.8753,
"step": 18450
},
{
"epoch": 0.4,
"learning_rate": 5.514871794871795e-06,
"loss": 0.8096,
"step": 18500
},
{
"epoch": 0.4,
"learning_rate": 5.502051282051283e-06,
"loss": 0.8726,
"step": 18550
},
{
"epoch": 0.4,
"learning_rate": 5.48923076923077e-06,
"loss": 0.883,
"step": 18600
},
{
"epoch": 0.4,
"learning_rate": 5.476410256410258e-06,
"loss": 0.812,
"step": 18650
},
{
"epoch": 0.41,
"learning_rate": 5.463589743589744e-06,
"loss": 0.7934,
"step": 18700
},
{
"epoch": 0.41,
"learning_rate": 5.450769230769232e-06,
"loss": 0.9021,
"step": 18750
},
{
"epoch": 0.41,
"learning_rate": 5.437948717948719e-06,
"loss": 0.7765,
"step": 18800
},
{
"epoch": 0.41,
"learning_rate": 5.425128205128205e-06,
"loss": 0.8453,
"step": 18850
},
{
"epoch": 0.41,
"learning_rate": 5.4123076923076925e-06,
"loss": 0.8043,
"step": 18900
},
{
"epoch": 0.41,
"learning_rate": 5.399487179487179e-06,
"loss": 0.7747,
"step": 18950
},
{
"epoch": 0.41,
"learning_rate": 5.386666666666667e-06,
"loss": 0.814,
"step": 19000
},
{
"epoch": 0.41,
"learning_rate": 5.373846153846154e-06,
"loss": 0.8306,
"step": 19050
},
{
"epoch": 0.41,
"learning_rate": 5.3610256410256415e-06,
"loss": 0.8242,
"step": 19100
},
{
"epoch": 0.42,
"learning_rate": 5.348205128205128e-06,
"loss": 0.7803,
"step": 19150
},
{
"epoch": 0.42,
"learning_rate": 5.335384615384615e-06,
"loss": 0.8586,
"step": 19200
},
{
"epoch": 0.42,
"learning_rate": 5.322564102564103e-06,
"loss": 0.78,
"step": 19250
},
{
"epoch": 0.42,
"learning_rate": 5.30974358974359e-06,
"loss": 0.8054,
"step": 19300
},
{
"epoch": 0.42,
"learning_rate": 5.296923076923077e-06,
"loss": 0.8024,
"step": 19350
},
{
"epoch": 0.42,
"learning_rate": 5.284102564102564e-06,
"loss": 0.8438,
"step": 19400
},
{
"epoch": 0.42,
"learning_rate": 5.271282051282052e-06,
"loss": 0.7888,
"step": 19450
},
{
"epoch": 0.42,
"learning_rate": 5.258461538461539e-06,
"loss": 0.8126,
"step": 19500
},
{
"epoch": 0.42,
"learning_rate": 5.245641025641026e-06,
"loss": 0.8023,
"step": 19550
},
{
"epoch": 0.42,
"learning_rate": 5.232820512820513e-06,
"loss": 0.7935,
"step": 19600
},
{
"epoch": 0.43,
"learning_rate": 5.220000000000001e-06,
"loss": 0.8027,
"step": 19650
},
{
"epoch": 0.43,
"learning_rate": 5.207179487179488e-06,
"loss": 0.8049,
"step": 19700
},
{
"epoch": 0.43,
"learning_rate": 5.194358974358975e-06,
"loss": 0.7715,
"step": 19750
},
{
"epoch": 0.43,
"learning_rate": 5.181538461538462e-06,
"loss": 0.8414,
"step": 19800
},
{
"epoch": 0.43,
"learning_rate": 5.16871794871795e-06,
"loss": 0.849,
"step": 19850
},
{
"epoch": 0.43,
"learning_rate": 5.155897435897437e-06,
"loss": 0.7973,
"step": 19900
},
{
"epoch": 0.43,
"learning_rate": 5.143076923076924e-06,
"loss": 0.8342,
"step": 19950
},
{
"epoch": 0.43,
"learning_rate": 5.130256410256411e-06,
"loss": 0.7383,
"step": 20000
},
{
"epoch": 0.43,
"eval_loss": 0.3015395998954773,
"eval_runtime": 2355.1549,
"eval_samples_per_second": 4.493,
"eval_steps_per_second": 0.141,
"eval_wer": 70.79002079002079,
"step": 20000
},
{
"epoch": 0.43,
"learning_rate": 5.117435897435897e-06,
"loss": 0.8312,
"step": 20050
},
{
"epoch": 0.44,
"learning_rate": 5.104615384615385e-06,
"loss": 0.7332,
"step": 20100
},
{
"epoch": 0.44,
"learning_rate": 5.091794871794872e-06,
"loss": 0.8523,
"step": 20150
},
{
"epoch": 0.44,
"learning_rate": 5.078974358974359e-06,
"loss": 0.8004,
"step": 20200
},
{
"epoch": 0.44,
"learning_rate": 5.066153846153846e-06,
"loss": 0.9089,
"step": 20250
},
{
"epoch": 0.44,
"learning_rate": 5.053333333333334e-06,
"loss": 0.7833,
"step": 20300
},
{
"epoch": 0.44,
"learning_rate": 5.040769230769231e-06,
"loss": 0.8074,
"step": 20350
},
{
"epoch": 0.44,
"learning_rate": 5.027948717948719e-06,
"loss": 0.8449,
"step": 20400
},
{
"epoch": 0.44,
"learning_rate": 5.015128205128205e-06,
"loss": 0.7655,
"step": 20450
},
{
"epoch": 0.44,
"learning_rate": 5.002307692307693e-06,
"loss": 0.8507,
"step": 20500
},
{
"epoch": 0.45,
"learning_rate": 4.98948717948718e-06,
"loss": 0.803,
"step": 20550
},
{
"epoch": 0.45,
"learning_rate": 4.976666666666667e-06,
"loss": 0.7476,
"step": 20600
},
{
"epoch": 0.45,
"learning_rate": 4.963846153846154e-06,
"loss": 0.7929,
"step": 20650
},
{
"epoch": 0.45,
"learning_rate": 4.951025641025641e-06,
"loss": 0.8162,
"step": 20700
},
{
"epoch": 0.45,
"learning_rate": 4.938461538461538e-06,
"loss": 0.8593,
"step": 20750
},
{
"epoch": 0.45,
"learning_rate": 4.925641025641026e-06,
"loss": 0.8301,
"step": 20800
},
{
"epoch": 0.45,
"learning_rate": 4.912820512820513e-06,
"loss": 0.8038,
"step": 20850
},
{
"epoch": 0.45,
"learning_rate": 4.9000000000000005e-06,
"loss": 0.7919,
"step": 20900
},
{
"epoch": 0.45,
"learning_rate": 4.887179487179487e-06,
"loss": 0.8354,
"step": 20950
},
{
"epoch": 0.46,
"learning_rate": 4.874358974358975e-06,
"loss": 0.8079,
"step": 21000
},
{
"epoch": 0.46,
"learning_rate": 4.861538461538462e-06,
"loss": 0.7674,
"step": 21050
},
{
"epoch": 0.46,
"learning_rate": 4.8487179487179495e-06,
"loss": 0.8267,
"step": 21100
},
{
"epoch": 0.46,
"learning_rate": 4.835897435897436e-06,
"loss": 0.8431,
"step": 21150
},
{
"epoch": 0.46,
"learning_rate": 4.823076923076924e-06,
"loss": 0.8325,
"step": 21200
},
{
"epoch": 0.46,
"learning_rate": 4.810256410256411e-06,
"loss": 0.8341,
"step": 21250
},
{
"epoch": 0.46,
"learning_rate": 4.7974358974358985e-06,
"loss": 0.7696,
"step": 21300
},
{
"epoch": 0.46,
"learning_rate": 4.7846153846153845e-06,
"loss": 0.824,
"step": 21350
},
{
"epoch": 0.46,
"learning_rate": 4.771794871794872e-06,
"loss": 0.7799,
"step": 21400
},
{
"epoch": 0.46,
"learning_rate": 4.758974358974359e-06,
"loss": 0.8678,
"step": 21450
},
{
"epoch": 0.47,
"learning_rate": 4.746153846153847e-06,
"loss": 0.8052,
"step": 21500
},
{
"epoch": 0.47,
"learning_rate": 4.7333333333333335e-06,
"loss": 0.7904,
"step": 21550
},
{
"epoch": 0.47,
"learning_rate": 4.720512820512821e-06,
"loss": 0.8087,
"step": 21600
},
{
"epoch": 0.47,
"learning_rate": 4.707692307692308e-06,
"loss": 0.8294,
"step": 21650
},
{
"epoch": 0.47,
"learning_rate": 4.694871794871796e-06,
"loss": 0.8158,
"step": 21700
},
{
"epoch": 0.47,
"learning_rate": 4.6820512820512825e-06,
"loss": 0.8856,
"step": 21750
},
{
"epoch": 0.47,
"learning_rate": 4.66923076923077e-06,
"loss": 0.8251,
"step": 21800
},
{
"epoch": 0.47,
"learning_rate": 4.656410256410257e-06,
"loss": 0.7168,
"step": 21850
},
{
"epoch": 0.47,
"learning_rate": 4.643589743589745e-06,
"loss": 0.839,
"step": 21900
},
{
"epoch": 0.48,
"learning_rate": 4.630769230769231e-06,
"loss": 0.8547,
"step": 21950
},
{
"epoch": 0.48,
"learning_rate": 4.617948717948718e-06,
"loss": 0.7659,
"step": 22000
},
{
"epoch": 0.48,
"learning_rate": 4.605128205128205e-06,
"loss": 0.7956,
"step": 22050
},
{
"epoch": 0.48,
"learning_rate": 4.592307692307693e-06,
"loss": 0.7989,
"step": 22100
},
{
"epoch": 0.48,
"learning_rate": 4.57948717948718e-06,
"loss": 0.7819,
"step": 22150
},
{
"epoch": 0.48,
"learning_rate": 4.566666666666667e-06,
"loss": 0.7591,
"step": 22200
},
{
"epoch": 0.48,
"learning_rate": 4.553846153846154e-06,
"loss": 0.7859,
"step": 22250
},
{
"epoch": 0.48,
"learning_rate": 4.541025641025642e-06,
"loss": 0.8602,
"step": 22300
},
{
"epoch": 0.48,
"learning_rate": 4.528205128205129e-06,
"loss": 0.8627,
"step": 22350
},
{
"epoch": 0.49,
"learning_rate": 4.515384615384616e-06,
"loss": 0.8695,
"step": 22400
},
{
"epoch": 0.49,
"learning_rate": 4.502564102564103e-06,
"loss": 0.8606,
"step": 22450
},
{
"epoch": 0.49,
"learning_rate": 4.489743589743591e-06,
"loss": 0.7762,
"step": 22500
},
{
"epoch": 0.49,
"learning_rate": 4.476923076923077e-06,
"loss": 0.811,
"step": 22550
},
{
"epoch": 0.49,
"learning_rate": 4.464102564102564e-06,
"loss": 0.7663,
"step": 22600
},
{
"epoch": 0.49,
"learning_rate": 4.451282051282051e-06,
"loss": 0.8819,
"step": 22650
},
{
"epoch": 0.49,
"learning_rate": 4.438461538461539e-06,
"loss": 0.8139,
"step": 22700
},
{
"epoch": 0.49,
"learning_rate": 4.425641025641026e-06,
"loss": 0.7623,
"step": 22750
},
{
"epoch": 0.49,
"learning_rate": 4.412820512820513e-06,
"loss": 0.7149,
"step": 22800
},
{
"epoch": 0.5,
"learning_rate": 4.4e-06,
"loss": 0.7642,
"step": 22850
},
{
"epoch": 0.5,
"learning_rate": 4.387179487179488e-06,
"loss": 0.7423,
"step": 22900
},
{
"epoch": 0.5,
"learning_rate": 4.374358974358975e-06,
"loss": 0.7505,
"step": 22950
},
{
"epoch": 0.5,
"learning_rate": 4.361538461538462e-06,
"loss": 0.8102,
"step": 23000
},
{
"epoch": 0.5,
"learning_rate": 4.348717948717949e-06,
"loss": 0.718,
"step": 23050
},
{
"epoch": 0.5,
"learning_rate": 4.335897435897437e-06,
"loss": 0.8357,
"step": 23100
},
{
"epoch": 0.5,
"learning_rate": 4.323076923076923e-06,
"loss": 0.7778,
"step": 23150
},
{
"epoch": 0.5,
"learning_rate": 4.3102564102564105e-06,
"loss": 0.7692,
"step": 23200
},
{
"epoch": 0.5,
"learning_rate": 4.297435897435897e-06,
"loss": 0.7716,
"step": 23250
},
{
"epoch": 0.51,
"learning_rate": 4.284615384615385e-06,
"loss": 0.8006,
"step": 23300
},
{
"epoch": 0.51,
"learning_rate": 4.271794871794872e-06,
"loss": 0.7957,
"step": 23350
},
{
"epoch": 0.51,
"learning_rate": 4.2589743589743595e-06,
"loss": 0.7936,
"step": 23400
},
{
"epoch": 0.51,
"learning_rate": 4.246153846153846e-06,
"loss": 0.7875,
"step": 23450
},
{
"epoch": 0.51,
"learning_rate": 4.233333333333334e-06,
"loss": 0.738,
"step": 23500
},
{
"epoch": 0.51,
"learning_rate": 4.220512820512821e-06,
"loss": 0.8422,
"step": 23550
},
{
"epoch": 0.51,
"learning_rate": 4.2076923076923085e-06,
"loss": 0.7859,
"step": 23600
},
{
"epoch": 0.51,
"learning_rate": 4.194871794871795e-06,
"loss": 0.735,
"step": 23650
},
{
"epoch": 0.51,
"learning_rate": 4.182051282051283e-06,
"loss": 0.8055,
"step": 23700
},
{
"epoch": 0.51,
"learning_rate": 4.169230769230769e-06,
"loss": 0.8354,
"step": 23750
},
{
"epoch": 0.52,
"learning_rate": 4.156410256410257e-06,
"loss": 0.8115,
"step": 23800
},
{
"epoch": 0.52,
"learning_rate": 4.1435897435897435e-06,
"loss": 0.7839,
"step": 23850
},
{
"epoch": 0.52,
"learning_rate": 4.130769230769231e-06,
"loss": 0.7855,
"step": 23900
},
{
"epoch": 0.52,
"learning_rate": 4.117948717948718e-06,
"loss": 0.8639,
"step": 23950
},
{
"epoch": 0.52,
"learning_rate": 4.105128205128206e-06,
"loss": 0.7451,
"step": 24000
},
{
"epoch": 0.52,
"eval_loss": 0.2875209450721741,
"eval_runtime": 2388.4505,
"eval_samples_per_second": 4.43,
"eval_steps_per_second": 0.139,
"eval_wer": 68.86221886221887,
"step": 24000
},
{
"epoch": 0.52,
"learning_rate": 4.0923076923076925e-06,
"loss": 0.8286,
"step": 24050
},
{
"epoch": 0.52,
"learning_rate": 4.07948717948718e-06,
"loss": 0.8096,
"step": 24100
},
{
"epoch": 0.52,
"learning_rate": 4.066666666666667e-06,
"loss": 0.807,
"step": 24150
},
{
"epoch": 0.52,
"learning_rate": 4.053846153846155e-06,
"loss": 0.7891,
"step": 24200
},
{
"epoch": 0.53,
"learning_rate": 4.0410256410256415e-06,
"loss": 0.7599,
"step": 24250
},
{
"epoch": 0.53,
"learning_rate": 4.028205128205129e-06,
"loss": 0.8145,
"step": 24300
},
{
"epoch": 0.53,
"learning_rate": 4.015384615384615e-06,
"loss": 0.7863,
"step": 24350
},
{
"epoch": 0.53,
"learning_rate": 4.002564102564103e-06,
"loss": 0.8316,
"step": 24400
},
{
"epoch": 0.53,
"learning_rate": 3.98974358974359e-06,
"loss": 0.7719,
"step": 24450
},
{
"epoch": 0.53,
"learning_rate": 3.977179487179488e-06,
"loss": 0.883,
"step": 24500
},
{
"epoch": 0.53,
"learning_rate": 3.964358974358974e-06,
"loss": 0.7388,
"step": 24550
},
{
"epoch": 0.53,
"learning_rate": 3.951538461538461e-06,
"loss": 0.7917,
"step": 24600
},
{
"epoch": 0.53,
"learning_rate": 3.938717948717949e-06,
"loss": 0.8494,
"step": 24650
},
{
"epoch": 0.54,
"learning_rate": 3.925897435897436e-06,
"loss": 0.7985,
"step": 24700
},
{
"epoch": 0.54,
"learning_rate": 3.913076923076923e-06,
"loss": 0.788,
"step": 24750
},
{
"epoch": 0.54,
"learning_rate": 3.90025641025641e-06,
"loss": 0.7984,
"step": 24800
},
{
"epoch": 0.54,
"learning_rate": 3.887435897435898e-06,
"loss": 0.7863,
"step": 24850
},
{
"epoch": 0.54,
"learning_rate": 3.874615384615385e-06,
"loss": 0.8338,
"step": 24900
},
{
"epoch": 0.54,
"learning_rate": 3.861794871794872e-06,
"loss": 0.7254,
"step": 24950
},
{
"epoch": 0.54,
"learning_rate": 3.848974358974359e-06,
"loss": 0.8152,
"step": 25000
},
{
"epoch": 0.54,
"learning_rate": 3.836153846153847e-06,
"loss": 0.821,
"step": 25050
},
{
"epoch": 0.54,
"learning_rate": 3.823333333333334e-06,
"loss": 0.8696,
"step": 25100
},
{
"epoch": 0.55,
"learning_rate": 3.8105128205128205e-06,
"loss": 0.8408,
"step": 25150
},
{
"epoch": 0.55,
"learning_rate": 3.7976923076923078e-06,
"loss": 0.8282,
"step": 25200
},
{
"epoch": 0.55,
"learning_rate": 3.784871794871795e-06,
"loss": 0.8513,
"step": 25250
},
{
"epoch": 0.55,
"learning_rate": 3.7720512820512823e-06,
"loss": 0.7233,
"step": 25300
},
{
"epoch": 0.55,
"learning_rate": 3.7592307692307695e-06,
"loss": 0.8516,
"step": 25350
},
{
"epoch": 0.55,
"learning_rate": 3.7464102564102568e-06,
"loss": 0.802,
"step": 25400
},
{
"epoch": 0.55,
"learning_rate": 3.733589743589744e-06,
"loss": 0.7276,
"step": 25450
},
{
"epoch": 0.55,
"learning_rate": 3.7207692307692313e-06,
"loss": 0.8185,
"step": 25500
},
{
"epoch": 0.55,
"learning_rate": 3.7079487179487185e-06,
"loss": 0.7061,
"step": 25550
},
{
"epoch": 0.55,
"learning_rate": 3.6951282051282058e-06,
"loss": 0.8132,
"step": 25600
},
{
"epoch": 0.56,
"learning_rate": 3.6823076923076926e-06,
"loss": 0.7634,
"step": 25650
},
{
"epoch": 0.56,
"learning_rate": 3.66948717948718e-06,
"loss": 0.7745,
"step": 25700
},
{
"epoch": 0.56,
"learning_rate": 3.6566666666666667e-06,
"loss": 0.7392,
"step": 25750
},
{
"epoch": 0.56,
"learning_rate": 3.643846153846154e-06,
"loss": 0.752,
"step": 25800
},
{
"epoch": 0.56,
"learning_rate": 3.631025641025641e-06,
"loss": 0.7355,
"step": 25850
},
{
"epoch": 0.56,
"learning_rate": 3.6182051282051284e-06,
"loss": 0.7894,
"step": 25900
},
{
"epoch": 0.56,
"learning_rate": 3.6053846153846157e-06,
"loss": 0.8476,
"step": 25950
},
{
"epoch": 0.56,
"learning_rate": 3.592564102564103e-06,
"loss": 0.789,
"step": 26000
},
{
"epoch": 0.56,
"learning_rate": 3.57974358974359e-06,
"loss": 0.7271,
"step": 26050
},
{
"epoch": 0.57,
"learning_rate": 3.5669230769230774e-06,
"loss": 0.8256,
"step": 26100
},
{
"epoch": 0.57,
"learning_rate": 3.5541025641025647e-06,
"loss": 0.6709,
"step": 26150
},
{
"epoch": 0.57,
"learning_rate": 3.541282051282052e-06,
"loss": 0.7646,
"step": 26200
},
{
"epoch": 0.57,
"learning_rate": 3.528461538461539e-06,
"loss": 0.7727,
"step": 26250
},
{
"epoch": 0.57,
"learning_rate": 3.515641025641026e-06,
"loss": 0.8103,
"step": 26300
},
{
"epoch": 0.57,
"learning_rate": 3.502820512820513e-06,
"loss": 0.8124,
"step": 26350
},
{
"epoch": 0.57,
"learning_rate": 3.49e-06,
"loss": 0.7628,
"step": 26400
},
{
"epoch": 0.57,
"learning_rate": 3.4771794871794873e-06,
"loss": 0.698,
"step": 26450
},
{
"epoch": 0.57,
"learning_rate": 3.4643589743589745e-06,
"loss": 0.7626,
"step": 26500
},
{
"epoch": 0.58,
"learning_rate": 3.4515384615384618e-06,
"loss": 0.7807,
"step": 26550
},
{
"epoch": 0.58,
"learning_rate": 3.438717948717949e-06,
"loss": 0.7767,
"step": 26600
},
{
"epoch": 0.58,
"learning_rate": 3.4258974358974363e-06,
"loss": 0.7487,
"step": 26650
},
{
"epoch": 0.58,
"learning_rate": 3.4130769230769235e-06,
"loss": 0.8079,
"step": 26700
},
{
"epoch": 0.58,
"learning_rate": 3.4002564102564108e-06,
"loss": 0.7907,
"step": 26750
},
{
"epoch": 0.58,
"learning_rate": 3.387435897435898e-06,
"loss": 0.7452,
"step": 26800
},
{
"epoch": 0.58,
"learning_rate": 3.3746153846153853e-06,
"loss": 0.7217,
"step": 26850
},
{
"epoch": 0.58,
"learning_rate": 3.361794871794872e-06,
"loss": 0.817,
"step": 26900
},
{
"epoch": 0.58,
"learning_rate": 3.3489743589743593e-06,
"loss": 0.8182,
"step": 26950
},
{
"epoch": 0.59,
"learning_rate": 3.336153846153846e-06,
"loss": 0.7641,
"step": 27000
},
{
"epoch": 0.59,
"learning_rate": 3.3233333333333334e-06,
"loss": 0.7667,
"step": 27050
},
{
"epoch": 0.59,
"learning_rate": 3.3105128205128207e-06,
"loss": 0.8408,
"step": 27100
},
{
"epoch": 0.59,
"learning_rate": 3.297692307692308e-06,
"loss": 0.7768,
"step": 27150
},
{
"epoch": 0.59,
"learning_rate": 3.284871794871795e-06,
"loss": 0.7837,
"step": 27200
},
{
"epoch": 0.59,
"learning_rate": 3.2720512820512824e-06,
"loss": 0.7631,
"step": 27250
},
{
"epoch": 0.59,
"learning_rate": 3.2592307692307697e-06,
"loss": 0.7669,
"step": 27300
},
{
"epoch": 0.59,
"learning_rate": 3.246410256410257e-06,
"loss": 0.7885,
"step": 27350
},
{
"epoch": 0.59,
"learning_rate": 3.233589743589744e-06,
"loss": 0.7419,
"step": 27400
},
{
"epoch": 0.6,
"learning_rate": 3.2207692307692314e-06,
"loss": 0.7794,
"step": 27450
},
{
"epoch": 0.6,
"learning_rate": 3.2079487179487182e-06,
"loss": 0.834,
"step": 27500
},
{
"epoch": 0.6,
"learning_rate": 3.1951282051282055e-06,
"loss": 0.6929,
"step": 27550
},
{
"epoch": 0.6,
"learning_rate": 3.182564102564103e-06,
"loss": 0.7557,
"step": 27600
},
{
"epoch": 0.6,
"learning_rate": 3.1697435897435903e-06,
"loss": 0.7569,
"step": 27650
},
{
"epoch": 0.6,
"learning_rate": 3.1569230769230775e-06,
"loss": 0.7765,
"step": 27700
},
{
"epoch": 0.6,
"learning_rate": 3.144102564102564e-06,
"loss": 0.7774,
"step": 27750
},
{
"epoch": 0.6,
"learning_rate": 3.131282051282051e-06,
"loss": 0.7784,
"step": 27800
},
{
"epoch": 0.6,
"learning_rate": 3.1184615384615384e-06,
"loss": 0.7641,
"step": 27850
},
{
"epoch": 0.6,
"learning_rate": 3.1056410256410257e-06,
"loss": 0.7589,
"step": 27900
},
{
"epoch": 0.61,
"learning_rate": 3.092820512820513e-06,
"loss": 0.7941,
"step": 27950
},
{
"epoch": 0.61,
"learning_rate": 3.08e-06,
"loss": 0.7755,
"step": 28000
},
{
"epoch": 0.61,
"eval_loss": 0.2776980996131897,
"eval_runtime": 2379.4894,
"eval_samples_per_second": 4.447,
"eval_steps_per_second": 0.139,
"eval_wer": 67.61481761481761,
"step": 28000
},
{
"epoch": 0.61,
"learning_rate": 3.0671794871794874e-06,
"loss": 0.7351,
"step": 28050
},
{
"epoch": 0.61,
"learning_rate": 3.0543589743589747e-06,
"loss": 0.7859,
"step": 28100
},
{
"epoch": 0.61,
"learning_rate": 3.041538461538462e-06,
"loss": 0.7596,
"step": 28150
},
{
"epoch": 0.61,
"learning_rate": 3.028717948717949e-06,
"loss": 0.7664,
"step": 28200
},
{
"epoch": 0.61,
"learning_rate": 3.0158974358974364e-06,
"loss": 0.818,
"step": 28250
},
{
"epoch": 0.61,
"learning_rate": 3.0030769230769236e-06,
"loss": 0.7387,
"step": 28300
},
{
"epoch": 0.61,
"learning_rate": 2.99025641025641e-06,
"loss": 0.746,
"step": 28350
},
{
"epoch": 0.62,
"learning_rate": 2.9774358974358973e-06,
"loss": 0.8034,
"step": 28400
},
{
"epoch": 0.62,
"learning_rate": 2.9646153846153845e-06,
"loss": 0.7298,
"step": 28450
},
{
"epoch": 0.62,
"learning_rate": 2.951794871794872e-06,
"loss": 0.7703,
"step": 28500
},
{
"epoch": 0.62,
"learning_rate": 2.938974358974359e-06,
"loss": 0.7201,
"step": 28550
},
{
"epoch": 0.62,
"learning_rate": 2.9261538461538463e-06,
"loss": 0.718,
"step": 28600
},
{
"epoch": 0.62,
"learning_rate": 2.9133333333333335e-06,
"loss": 0.8134,
"step": 28650
},
{
"epoch": 0.62,
"learning_rate": 2.9005128205128208e-06,
"loss": 0.8361,
"step": 28700
},
{
"epoch": 0.62,
"learning_rate": 2.887692307692308e-06,
"loss": 0.7924,
"step": 28750
},
{
"epoch": 0.62,
"learning_rate": 2.8748717948717953e-06,
"loss": 0.7938,
"step": 28800
},
{
"epoch": 0.63,
"learning_rate": 2.8620512820512825e-06,
"loss": 0.7555,
"step": 28850
},
{
"epoch": 0.63,
"learning_rate": 2.8492307692307698e-06,
"loss": 0.7738,
"step": 28900
},
{
"epoch": 0.63,
"learning_rate": 2.836410256410257e-06,
"loss": 0.7696,
"step": 28950
},
{
"epoch": 0.63,
"learning_rate": 2.8235897435897434e-06,
"loss": 0.7833,
"step": 29000
},
{
"epoch": 0.63,
"learning_rate": 2.8107692307692307e-06,
"loss": 0.7477,
"step": 29050
},
{
"epoch": 0.63,
"learning_rate": 2.797948717948718e-06,
"loss": 0.7358,
"step": 29100
},
{
"epoch": 0.63,
"learning_rate": 2.785128205128205e-06,
"loss": 0.8575,
"step": 29150
},
{
"epoch": 0.63,
"learning_rate": 2.7723076923076924e-06,
"loss": 0.7473,
"step": 29200
},
{
"epoch": 0.63,
"learning_rate": 2.7594871794871797e-06,
"loss": 0.7472,
"step": 29250
},
{
"epoch": 0.64,
"learning_rate": 2.746666666666667e-06,
"loss": 0.7032,
"step": 29300
},
{
"epoch": 0.64,
"learning_rate": 2.733846153846154e-06,
"loss": 0.8022,
"step": 29350
},
{
"epoch": 0.64,
"learning_rate": 2.7210256410256414e-06,
"loss": 0.719,
"step": 29400
},
{
"epoch": 0.64,
"learning_rate": 2.7082051282051287e-06,
"loss": 0.7356,
"step": 29450
},
{
"epoch": 0.64,
"learning_rate": 2.695384615384616e-06,
"loss": 0.764,
"step": 29500
},
{
"epoch": 0.64,
"learning_rate": 2.682564102564103e-06,
"loss": 0.7941,
"step": 29550
},
{
"epoch": 0.64,
"learning_rate": 2.6697435897435896e-06,
"loss": 0.7537,
"step": 29600
},
{
"epoch": 0.64,
"learning_rate": 2.656923076923077e-06,
"loss": 0.7105,
"step": 29650
},
{
"epoch": 0.64,
"learning_rate": 2.644102564102564e-06,
"loss": 0.6976,
"step": 29700
},
{
"epoch": 0.64,
"learning_rate": 2.6312820512820513e-06,
"loss": 0.758,
"step": 29750
},
{
"epoch": 0.65,
"learning_rate": 2.6184615384615385e-06,
"loss": 0.8502,
"step": 29800
},
{
"epoch": 0.65,
"learning_rate": 2.605897435897436e-06,
"loss": 0.7521,
"step": 29850
},
{
"epoch": 0.65,
"learning_rate": 2.5930769230769233e-06,
"loss": 0.7455,
"step": 29900
},
{
"epoch": 0.65,
"learning_rate": 2.5802564102564106e-06,
"loss": 0.7838,
"step": 29950
},
{
"epoch": 0.65,
"learning_rate": 2.5674358974358974e-06,
"loss": 0.7652,
"step": 30000
},
{
"epoch": 0.65,
"learning_rate": 2.5546153846153847e-06,
"loss": 0.726,
"step": 30050
},
{
"epoch": 0.65,
"learning_rate": 2.541794871794872e-06,
"loss": 0.7213,
"step": 30100
},
{
"epoch": 0.65,
"learning_rate": 2.528974358974359e-06,
"loss": 0.7379,
"step": 30150
},
{
"epoch": 0.65,
"learning_rate": 2.5161538461538464e-06,
"loss": 0.7387,
"step": 30200
},
{
"epoch": 0.66,
"learning_rate": 2.5033333333333336e-06,
"loss": 0.8344,
"step": 30250
},
{
"epoch": 0.66,
"learning_rate": 2.4905128205128205e-06,
"loss": 0.7844,
"step": 30300
},
{
"epoch": 0.66,
"learning_rate": 2.4776923076923077e-06,
"loss": 0.7456,
"step": 30350
},
{
"epoch": 0.66,
"learning_rate": 2.464871794871795e-06,
"loss": 0.8072,
"step": 30400
},
{
"epoch": 0.66,
"learning_rate": 2.4520512820512822e-06,
"loss": 0.7475,
"step": 30450
},
{
"epoch": 0.66,
"learning_rate": 2.4392307692307695e-06,
"loss": 0.7797,
"step": 30500
},
{
"epoch": 0.66,
"learning_rate": 2.4264102564102567e-06,
"loss": 0.7714,
"step": 30550
},
{
"epoch": 0.66,
"learning_rate": 2.4135897435897435e-06,
"loss": 0.7098,
"step": 30600
},
{
"epoch": 0.66,
"learning_rate": 2.4007692307692308e-06,
"loss": 0.7899,
"step": 30650
},
{
"epoch": 0.67,
"learning_rate": 2.387948717948718e-06,
"loss": 0.7921,
"step": 30700
},
{
"epoch": 0.67,
"learning_rate": 2.3751282051282053e-06,
"loss": 0.7596,
"step": 30750
},
{
"epoch": 0.67,
"learning_rate": 2.3623076923076925e-06,
"loss": 0.792,
"step": 30800
},
{
"epoch": 0.67,
"learning_rate": 2.3494871794871798e-06,
"loss": 0.7529,
"step": 30850
},
{
"epoch": 0.67,
"learning_rate": 2.3366666666666666e-06,
"loss": 0.8179,
"step": 30900
},
{
"epoch": 0.67,
"learning_rate": 2.323846153846154e-06,
"loss": 0.6807,
"step": 30950
},
{
"epoch": 0.67,
"learning_rate": 2.311025641025641e-06,
"loss": 0.7816,
"step": 31000
},
{
"epoch": 0.67,
"learning_rate": 2.2982051282051283e-06,
"loss": 0.6662,
"step": 31050
},
{
"epoch": 0.67,
"learning_rate": 2.2853846153846156e-06,
"loss": 0.7548,
"step": 31100
},
{
"epoch": 0.68,
"learning_rate": 2.272564102564103e-06,
"loss": 0.7931,
"step": 31150
},
{
"epoch": 0.68,
"learning_rate": 2.2597435897435897e-06,
"loss": 0.8231,
"step": 31200
},
{
"epoch": 0.68,
"learning_rate": 2.246923076923077e-06,
"loss": 0.8059,
"step": 31250
},
{
"epoch": 0.68,
"learning_rate": 2.234102564102564e-06,
"loss": 0.8001,
"step": 31300
},
{
"epoch": 0.68,
"learning_rate": 2.2212820512820514e-06,
"loss": 0.7726,
"step": 31350
},
{
"epoch": 0.68,
"learning_rate": 2.2084615384615387e-06,
"loss": 0.7544,
"step": 31400
},
{
"epoch": 0.68,
"learning_rate": 2.195641025641026e-06,
"loss": 0.7802,
"step": 31450
},
{
"epoch": 0.68,
"learning_rate": 2.1828205128205127e-06,
"loss": 0.7977,
"step": 31500
},
{
"epoch": 0.68,
"learning_rate": 2.17e-06,
"loss": 0.8011,
"step": 31550
},
{
"epoch": 0.68,
"learning_rate": 2.1571794871794872e-06,
"loss": 0.7044,
"step": 31600
},
{
"epoch": 0.69,
"learning_rate": 2.1443589743589745e-06,
"loss": 0.776,
"step": 31650
},
{
"epoch": 0.69,
"learning_rate": 2.1315384615384617e-06,
"loss": 0.7611,
"step": 31700
},
{
"epoch": 0.69,
"learning_rate": 2.118717948717949e-06,
"loss": 0.7122,
"step": 31750
},
{
"epoch": 0.69,
"learning_rate": 2.1058974358974362e-06,
"loss": 0.7584,
"step": 31800
},
{
"epoch": 0.69,
"learning_rate": 2.093076923076923e-06,
"loss": 0.7443,
"step": 31850
},
{
"epoch": 0.69,
"learning_rate": 2.0802564102564103e-06,
"loss": 0.6693,
"step": 31900
},
{
"epoch": 0.69,
"learning_rate": 2.0674358974358975e-06,
"loss": 0.7922,
"step": 31950
},
{
"epoch": 0.69,
"learning_rate": 2.0546153846153848e-06,
"loss": 0.7403,
"step": 32000
},
{
"epoch": 0.69,
"eval_loss": 0.2685754895210266,
"eval_runtime": 2376.0859,
"eval_samples_per_second": 4.453,
"eval_steps_per_second": 0.139,
"eval_wer": 66.47136647136647,
"step": 32000
},
{
"epoch": 0.69,
"learning_rate": 2.0420512820512823e-06,
"loss": 0.6922,
"step": 32050
},
{
"epoch": 0.7,
"learning_rate": 2.0292307692307696e-06,
"loss": 0.7866,
"step": 32100
},
{
"epoch": 0.7,
"learning_rate": 2.016410256410257e-06,
"loss": 0.7605,
"step": 32150
},
{
"epoch": 0.7,
"learning_rate": 2.0035897435897436e-06,
"loss": 0.789,
"step": 32200
},
{
"epoch": 0.7,
"learning_rate": 1.990769230769231e-06,
"loss": 0.8101,
"step": 32250
},
{
"epoch": 0.7,
"learning_rate": 1.977948717948718e-06,
"loss": 0.7387,
"step": 32300
},
{
"epoch": 0.7,
"learning_rate": 1.9651282051282054e-06,
"loss": 0.7588,
"step": 32350
},
{
"epoch": 0.7,
"learning_rate": 1.9523076923076926e-06,
"loss": 0.8323,
"step": 32400
},
{
"epoch": 0.7,
"learning_rate": 1.93948717948718e-06,
"loss": 0.7556,
"step": 32450
},
{
"epoch": 0.7,
"learning_rate": 1.926666666666667e-06,
"loss": 0.6982,
"step": 32500
},
{
"epoch": 0.71,
"learning_rate": 1.913846153846154e-06,
"loss": 0.7028,
"step": 32550
},
{
"epoch": 0.71,
"learning_rate": 1.9010256410256412e-06,
"loss": 0.7567,
"step": 32600
},
{
"epoch": 0.71,
"learning_rate": 1.8882051282051285e-06,
"loss": 0.7187,
"step": 32650
},
{
"epoch": 0.71,
"learning_rate": 1.8753846153846155e-06,
"loss": 0.7655,
"step": 32700
},
{
"epoch": 0.71,
"learning_rate": 1.8625641025641027e-06,
"loss": 0.711,
"step": 32750
},
{
"epoch": 0.71,
"learning_rate": 1.84974358974359e-06,
"loss": 0.7573,
"step": 32800
},
{
"epoch": 0.71,
"learning_rate": 1.836923076923077e-06,
"loss": 0.7474,
"step": 32850
},
{
"epoch": 0.71,
"learning_rate": 1.8241025641025643e-06,
"loss": 0.7687,
"step": 32900
},
{
"epoch": 0.71,
"learning_rate": 1.8112820512820515e-06,
"loss": 0.7708,
"step": 32950
},
{
"epoch": 0.72,
"learning_rate": 1.7984615384615386e-06,
"loss": 0.7674,
"step": 33000
},
{
"epoch": 0.72,
"learning_rate": 1.7856410256410258e-06,
"loss": 0.7896,
"step": 33050
},
{
"epoch": 0.72,
"learning_rate": 1.772820512820513e-06,
"loss": 0.6707,
"step": 33100
},
{
"epoch": 0.72,
"learning_rate": 1.76e-06,
"loss": 0.7633,
"step": 33150
},
{
"epoch": 0.72,
"learning_rate": 1.7471794871794873e-06,
"loss": 0.7261,
"step": 33200
},
{
"epoch": 0.72,
"learning_rate": 1.7343589743589746e-06,
"loss": 0.7848,
"step": 33250
},
{
"epoch": 0.72,
"learning_rate": 1.7215384615384616e-06,
"loss": 0.7003,
"step": 33300
},
{
"epoch": 0.72,
"learning_rate": 1.7087179487179489e-06,
"loss": 0.7727,
"step": 33350
},
{
"epoch": 0.72,
"learning_rate": 1.6958974358974361e-06,
"loss": 0.739,
"step": 33400
},
{
"epoch": 0.73,
"learning_rate": 1.6830769230769232e-06,
"loss": 0.7728,
"step": 33450
},
{
"epoch": 0.73,
"learning_rate": 1.6702564102564104e-06,
"loss": 0.7418,
"step": 33500
},
{
"epoch": 0.73,
"learning_rate": 1.6574358974358976e-06,
"loss": 0.721,
"step": 33550
},
{
"epoch": 0.73,
"learning_rate": 1.6446153846153847e-06,
"loss": 0.8415,
"step": 33600
},
{
"epoch": 0.73,
"learning_rate": 1.631794871794872e-06,
"loss": 0.7834,
"step": 33650
},
{
"epoch": 0.73,
"learning_rate": 1.6189743589743592e-06,
"loss": 0.7671,
"step": 33700
},
{
"epoch": 0.73,
"learning_rate": 1.6061538461538462e-06,
"loss": 0.7303,
"step": 33750
},
{
"epoch": 0.73,
"learning_rate": 1.5933333333333335e-06,
"loss": 0.7665,
"step": 33800
},
{
"epoch": 0.73,
"learning_rate": 1.5805128205128207e-06,
"loss": 0.713,
"step": 33850
},
{
"epoch": 0.73,
"learning_rate": 1.5676923076923078e-06,
"loss": 0.7565,
"step": 33900
},
{
"epoch": 0.74,
"learning_rate": 1.554871794871795e-06,
"loss": 0.7617,
"step": 33950
},
{
"epoch": 0.74,
"learning_rate": 1.5420512820512822e-06,
"loss": 0.7506,
"step": 34000
},
{
"epoch": 0.74,
"learning_rate": 1.5292307692307693e-06,
"loss": 0.794,
"step": 34050
},
{
"epoch": 0.74,
"learning_rate": 1.5166666666666668e-06,
"loss": 0.7271,
"step": 34100
},
{
"epoch": 0.74,
"learning_rate": 1.503846153846154e-06,
"loss": 0.7134,
"step": 34150
},
{
"epoch": 0.74,
"learning_rate": 1.4910256410256411e-06,
"loss": 0.7287,
"step": 34200
},
{
"epoch": 0.74,
"learning_rate": 1.4782051282051281e-06,
"loss": 0.7653,
"step": 34250
},
{
"epoch": 0.74,
"learning_rate": 1.4653846153846154e-06,
"loss": 0.766,
"step": 34300
},
{
"epoch": 0.74,
"learning_rate": 1.4525641025641026e-06,
"loss": 0.7636,
"step": 34350
},
{
"epoch": 0.75,
"learning_rate": 1.4397435897435899e-06,
"loss": 0.7039,
"step": 34400
},
{
"epoch": 0.75,
"learning_rate": 1.4269230769230771e-06,
"loss": 0.769,
"step": 34450
},
{
"epoch": 0.75,
"learning_rate": 1.4141025641025644e-06,
"loss": 0.7586,
"step": 34500
},
{
"epoch": 0.75,
"learning_rate": 1.4012820512820512e-06,
"loss": 0.7566,
"step": 34550
},
{
"epoch": 0.75,
"learning_rate": 1.3884615384615385e-06,
"loss": 0.7221,
"step": 34600
},
{
"epoch": 0.75,
"learning_rate": 1.3756410256410257e-06,
"loss": 0.7783,
"step": 34650
},
{
"epoch": 0.75,
"learning_rate": 1.362820512820513e-06,
"loss": 0.7056,
"step": 34700
},
{
"epoch": 0.75,
"learning_rate": 1.3500000000000002e-06,
"loss": 0.7334,
"step": 34750
},
{
"epoch": 0.75,
"learning_rate": 1.3371794871794875e-06,
"loss": 0.717,
"step": 34800
},
{
"epoch": 0.76,
"learning_rate": 1.3243589743589743e-06,
"loss": 0.7286,
"step": 34850
},
{
"epoch": 0.76,
"learning_rate": 1.3115384615384615e-06,
"loss": 0.7139,
"step": 34900
},
{
"epoch": 0.76,
"learning_rate": 1.2987179487179488e-06,
"loss": 0.6625,
"step": 34950
},
{
"epoch": 0.76,
"learning_rate": 1.285897435897436e-06,
"loss": 0.7178,
"step": 35000
},
{
"epoch": 0.76,
"learning_rate": 1.2730769230769233e-06,
"loss": 0.7451,
"step": 35050
},
{
"epoch": 0.76,
"learning_rate": 1.2602564102564105e-06,
"loss": 0.779,
"step": 35100
},
{
"epoch": 0.76,
"learning_rate": 1.2474358974358976e-06,
"loss": 0.7849,
"step": 35150
},
{
"epoch": 0.76,
"learning_rate": 1.2346153846153846e-06,
"loss": 0.7037,
"step": 35200
},
{
"epoch": 0.76,
"learning_rate": 1.2217948717948718e-06,
"loss": 0.7218,
"step": 35250
},
{
"epoch": 0.77,
"learning_rate": 1.208974358974359e-06,
"loss": 0.7581,
"step": 35300
},
{
"epoch": 0.77,
"learning_rate": 1.1961538461538461e-06,
"loss": 0.7879,
"step": 35350
},
{
"epoch": 0.77,
"learning_rate": 1.1833333333333334e-06,
"loss": 0.7174,
"step": 35400
},
{
"epoch": 0.77,
"learning_rate": 1.1705128205128206e-06,
"loss": 0.7972,
"step": 35450
},
{
"epoch": 0.77,
"learning_rate": 1.1576923076923077e-06,
"loss": 0.8004,
"step": 35500
},
{
"epoch": 0.77,
"learning_rate": 1.144871794871795e-06,
"loss": 0.7127,
"step": 35550
},
{
"epoch": 0.77,
"learning_rate": 1.1320512820512821e-06,
"loss": 0.7797,
"step": 35600
},
{
"epoch": 0.77,
"learning_rate": 1.1192307692307692e-06,
"loss": 0.7893,
"step": 35650
},
{
"epoch": 0.77,
"learning_rate": 1.1064102564102564e-06,
"loss": 0.7495,
"step": 35700
},
{
"epoch": 0.77,
"learning_rate": 1.0935897435897437e-06,
"loss": 0.7285,
"step": 35750
},
{
"epoch": 0.78,
"learning_rate": 1.0807692307692307e-06,
"loss": 0.7662,
"step": 35800
},
{
"epoch": 0.78,
"learning_rate": 1.067948717948718e-06,
"loss": 0.8184,
"step": 35850
},
{
"epoch": 0.78,
"learning_rate": 1.0551282051282052e-06,
"loss": 0.7452,
"step": 35900
},
{
"epoch": 0.78,
"learning_rate": 1.0423076923076922e-06,
"loss": 0.7478,
"step": 35950
},
{
"epoch": 0.78,
"learning_rate": 1.0294871794871795e-06,
"loss": 0.7447,
"step": 36000
},
{
"epoch": 0.78,
"eval_loss": 0.26302000880241394,
"eval_runtime": 2362.0071,
"eval_samples_per_second": 4.48,
"eval_steps_per_second": 0.14,
"eval_wer": 65.44131544131544,
"step": 36000
},
{
"epoch": 0.78,
"learning_rate": 1.0166666666666667e-06,
"loss": 0.7675,
"step": 36050
},
{
"epoch": 0.78,
"learning_rate": 1.0038461538461538e-06,
"loss": 0.8359,
"step": 36100
},
{
"epoch": 0.78,
"learning_rate": 9.91025641025641e-07,
"loss": 0.7122,
"step": 36150
},
{
"epoch": 0.78,
"learning_rate": 9.782051282051283e-07,
"loss": 0.7186,
"step": 36200
},
{
"epoch": 0.79,
"learning_rate": 9.653846153846155e-07,
"loss": 0.7674,
"step": 36250
},
{
"epoch": 0.79,
"learning_rate": 9.525641025641027e-07,
"loss": 0.7558,
"step": 36300
},
{
"epoch": 0.79,
"learning_rate": 9.397435897435898e-07,
"loss": 0.8178,
"step": 36350
},
{
"epoch": 0.79,
"learning_rate": 9.269230769230771e-07,
"loss": 0.7274,
"step": 36400
},
{
"epoch": 0.79,
"learning_rate": 9.141025641025642e-07,
"loss": 0.7326,
"step": 36450
},
{
"epoch": 0.79,
"learning_rate": 9.012820512820513e-07,
"loss": 0.702,
"step": 36500
},
{
"epoch": 0.79,
"learning_rate": 8.884615384615386e-07,
"loss": 0.7311,
"step": 36550
},
{
"epoch": 0.79,
"learning_rate": 8.756410256410257e-07,
"loss": 0.783,
"step": 36600
},
{
"epoch": 0.79,
"learning_rate": 8.628205128205129e-07,
"loss": 0.7231,
"step": 36650
},
{
"epoch": 0.8,
"learning_rate": 8.500000000000001e-07,
"loss": 0.8113,
"step": 36700
},
{
"epoch": 0.8,
"learning_rate": 8.371794871794873e-07,
"loss": 0.7135,
"step": 36750
},
{
"epoch": 0.8,
"learning_rate": 8.243589743589744e-07,
"loss": 0.7334,
"step": 36800
},
{
"epoch": 0.8,
"learning_rate": 8.115384615384617e-07,
"loss": 0.782,
"step": 36850
},
{
"epoch": 0.8,
"learning_rate": 7.987179487179488e-07,
"loss": 0.7224,
"step": 36900
},
{
"epoch": 0.8,
"learning_rate": 7.858974358974359e-07,
"loss": 0.7627,
"step": 36950
},
{
"epoch": 0.8,
"learning_rate": 7.730769230769232e-07,
"loss": 0.6767,
"step": 37000
},
{
"epoch": 0.8,
"learning_rate": 7.602564102564103e-07,
"loss": 0.806,
"step": 37050
},
{
"epoch": 0.8,
"learning_rate": 7.474358974358975e-07,
"loss": 0.7469,
"step": 37100
},
{
"epoch": 0.81,
"learning_rate": 7.346153846153847e-07,
"loss": 0.7501,
"step": 37150
},
{
"epoch": 0.81,
"learning_rate": 7.217948717948719e-07,
"loss": 0.6524,
"step": 37200
},
{
"epoch": 0.81,
"learning_rate": 7.08974358974359e-07,
"loss": 0.7306,
"step": 37250
},
{
"epoch": 0.81,
"learning_rate": 6.961538461538462e-07,
"loss": 0.7573,
"step": 37300
},
{
"epoch": 0.81,
"learning_rate": 6.833333333333334e-07,
"loss": 0.7066,
"step": 37350
},
{
"epoch": 0.81,
"learning_rate": 6.705128205128205e-07,
"loss": 0.6994,
"step": 37400
},
{
"epoch": 0.81,
"learning_rate": 6.576923076923078e-07,
"loss": 0.7276,
"step": 37450
},
{
"epoch": 0.81,
"learning_rate": 6.448717948717949e-07,
"loss": 0.6802,
"step": 37500
},
{
"epoch": 0.81,
"learning_rate": 6.320512820512821e-07,
"loss": 0.646,
"step": 37550
},
{
"epoch": 0.82,
"learning_rate": 6.192307692307693e-07,
"loss": 0.7677,
"step": 37600
},
{
"epoch": 0.82,
"learning_rate": 6.064102564102565e-07,
"loss": 0.7558,
"step": 37650
},
{
"epoch": 0.82,
"learning_rate": 5.935897435897436e-07,
"loss": 0.6874,
"step": 37700
},
{
"epoch": 0.82,
"learning_rate": 5.807692307692308e-07,
"loss": 0.724,
"step": 37750
},
{
"epoch": 0.82,
"learning_rate": 5.67948717948718e-07,
"loss": 0.6969,
"step": 37800
},
{
"epoch": 0.82,
"learning_rate": 5.551282051282051e-07,
"loss": 0.711,
"step": 37850
},
{
"epoch": 0.82,
"learning_rate": 5.423076923076924e-07,
"loss": 0.746,
"step": 37900
},
{
"epoch": 0.82,
"learning_rate": 5.294871794871795e-07,
"loss": 0.7783,
"step": 37950
},
{
"epoch": 0.82,
"learning_rate": 5.166666666666667e-07,
"loss": 0.7197,
"step": 38000
},
{
"epoch": 0.82,
"learning_rate": 5.038461538461539e-07,
"loss": 0.7594,
"step": 38050
},
{
"epoch": 0.83,
"learning_rate": 4.91025641025641e-07,
"loss": 0.7868,
"step": 38100
},
{
"epoch": 0.83,
"learning_rate": 4.782051282051282e-07,
"loss": 0.7874,
"step": 38150
},
{
"epoch": 0.83,
"learning_rate": 4.653846153846154e-07,
"loss": 0.7854,
"step": 38200
},
{
"epoch": 0.83,
"learning_rate": 4.5256410256410264e-07,
"loss": 0.7108,
"step": 38250
},
{
"epoch": 0.83,
"learning_rate": 4.4e-07,
"loss": 0.7612,
"step": 38300
},
{
"epoch": 0.83,
"learning_rate": 4.271794871794872e-07,
"loss": 0.7923,
"step": 38350
},
{
"epoch": 0.83,
"learning_rate": 4.143589743589744e-07,
"loss": 0.756,
"step": 38400
},
{
"epoch": 0.83,
"learning_rate": 4.0153846153846155e-07,
"loss": 0.7409,
"step": 38450
},
{
"epoch": 0.83,
"learning_rate": 3.8871794871794875e-07,
"loss": 0.7754,
"step": 38500
},
{
"epoch": 0.84,
"learning_rate": 3.7589743589743594e-07,
"loss": 0.7874,
"step": 38550
},
{
"epoch": 0.84,
"learning_rate": 3.630769230769231e-07,
"loss": 0.717,
"step": 38600
},
{
"epoch": 0.84,
"learning_rate": 3.502564102564103e-07,
"loss": 0.7111,
"step": 38650
},
{
"epoch": 0.84,
"learning_rate": 3.374358974358975e-07,
"loss": 0.7798,
"step": 38700
},
{
"epoch": 0.84,
"learning_rate": 3.246153846153846e-07,
"loss": 0.771,
"step": 38750
},
{
"epoch": 0.84,
"learning_rate": 3.117948717948718e-07,
"loss": 0.6986,
"step": 38800
},
{
"epoch": 0.84,
"learning_rate": 2.98974358974359e-07,
"loss": 0.7233,
"step": 38850
},
{
"epoch": 0.84,
"learning_rate": 2.861538461538462e-07,
"loss": 0.7898,
"step": 38900
},
{
"epoch": 0.84,
"learning_rate": 2.7333333333333335e-07,
"loss": 0.6647,
"step": 38950
},
{
"epoch": 0.85,
"learning_rate": 2.6051282051282054e-07,
"loss": 0.7585,
"step": 39000
},
{
"epoch": 0.85,
"learning_rate": 2.4769230769230774e-07,
"loss": 0.727,
"step": 39050
},
{
"epoch": 0.85,
"learning_rate": 2.348717948717949e-07,
"loss": 0.7875,
"step": 39100
},
{
"epoch": 0.85,
"learning_rate": 2.2205128205128205e-07,
"loss": 0.6976,
"step": 39150
},
{
"epoch": 0.85,
"learning_rate": 2.0923076923076924e-07,
"loss": 0.7744,
"step": 39200
},
{
"epoch": 0.85,
"learning_rate": 1.9641025641025644e-07,
"loss": 0.7199,
"step": 39250
},
{
"epoch": 0.85,
"learning_rate": 1.8358974358974358e-07,
"loss": 0.7114,
"step": 39300
},
{
"epoch": 0.85,
"learning_rate": 1.7076923076923077e-07,
"loss": 0.7218,
"step": 39350
},
{
"epoch": 0.85,
"learning_rate": 1.5794871794871797e-07,
"loss": 0.7373,
"step": 39400
},
{
"epoch": 0.86,
"learning_rate": 1.4512820512820514e-07,
"loss": 0.7764,
"step": 39450
},
{
"epoch": 0.86,
"learning_rate": 1.323076923076923e-07,
"loss": 0.7593,
"step": 39500
},
{
"epoch": 0.86,
"learning_rate": 1.194871794871795e-07,
"loss": 0.7653,
"step": 39550
},
{
"epoch": 0.86,
"learning_rate": 1.0666666666666667e-07,
"loss": 0.8478,
"step": 39600
},
{
"epoch": 0.86,
"learning_rate": 9.384615384615386e-08,
"loss": 0.7755,
"step": 39650
},
{
"epoch": 0.86,
"learning_rate": 8.102564102564103e-08,
"loss": 0.7625,
"step": 39700
},
{
"epoch": 0.86,
"learning_rate": 6.820512820512821e-08,
"loss": 0.7187,
"step": 39750
},
{
"epoch": 0.86,
"learning_rate": 5.538461538461538e-08,
"loss": 0.7036,
"step": 39800
},
{
"epoch": 0.86,
"learning_rate": 4.2564102564102564e-08,
"loss": 0.7623,
"step": 39850
},
{
"epoch": 0.86,
"learning_rate": 2.9743589743589746e-08,
"loss": 0.7811,
"step": 39900
},
{
"epoch": 0.87,
"learning_rate": 1.6923076923076925e-08,
"loss": 0.7454,
"step": 39950
},
{
"epoch": 0.87,
"learning_rate": 4.102564102564102e-09,
"loss": 0.7396,
"step": 40000
},
{
"epoch": 0.87,
"eval_loss": 0.2601395547389984,
"eval_runtime": 2518.4395,
"eval_samples_per_second": 4.201,
"eval_steps_per_second": 0.131,
"eval_wer": 64.97826497826497,
"step": 40000
}
],
"max_steps": 40000,
"num_train_epochs": 1,
"total_flos": 4.15103975424e+19,
"trial_name": null,
"trial_params": null
}