whisper-tiny-mn-9 / trainer_state.json
bayartsogt's picture
End of training
d28f0f6
{
"best_metric": 45.51015949311776,
"best_model_checkpoint": "whisper-tiny-mn-9/checkpoint-20000",
"epoch": 13.86001386001386,
"global_step": 20000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.02,
"learning_rate": 4.4e-07,
"loss": 5.6802,
"step": 25
},
{
"epoch": 0.03,
"learning_rate": 9.400000000000001e-07,
"loss": 5.154,
"step": 50
},
{
"epoch": 0.05,
"learning_rate": 1.44e-06,
"loss": 4.3382,
"step": 75
},
{
"epoch": 0.07,
"learning_rate": 1.94e-06,
"loss": 3.6026,
"step": 100
},
{
"epoch": 0.09,
"learning_rate": 2.4400000000000004e-06,
"loss": 3.0061,
"step": 125
},
{
"epoch": 0.1,
"learning_rate": 2.9400000000000002e-06,
"loss": 2.5594,
"step": 150
},
{
"epoch": 0.12,
"learning_rate": 3.44e-06,
"loss": 2.2357,
"step": 175
},
{
"epoch": 0.14,
"learning_rate": 3.94e-06,
"loss": 1.9801,
"step": 200
},
{
"epoch": 0.16,
"learning_rate": 4.440000000000001e-06,
"loss": 1.7697,
"step": 225
},
{
"epoch": 0.17,
"learning_rate": 4.94e-06,
"loss": 1.6114,
"step": 250
},
{
"epoch": 0.19,
"learning_rate": 5.4400000000000004e-06,
"loss": 1.4906,
"step": 275
},
{
"epoch": 0.21,
"learning_rate": 5.94e-06,
"loss": 1.3715,
"step": 300
},
{
"epoch": 0.23,
"learning_rate": 6.440000000000001e-06,
"loss": 1.2579,
"step": 325
},
{
"epoch": 0.24,
"learning_rate": 6.9400000000000005e-06,
"loss": 1.1916,
"step": 350
},
{
"epoch": 0.26,
"learning_rate": 7.440000000000001e-06,
"loss": 1.0915,
"step": 375
},
{
"epoch": 0.28,
"learning_rate": 7.94e-06,
"loss": 1.0262,
"step": 400
},
{
"epoch": 0.29,
"learning_rate": 8.44e-06,
"loss": 0.9772,
"step": 425
},
{
"epoch": 0.31,
"learning_rate": 8.94e-06,
"loss": 0.948,
"step": 450
},
{
"epoch": 0.33,
"learning_rate": 9.440000000000001e-06,
"loss": 0.9136,
"step": 475
},
{
"epoch": 0.35,
"learning_rate": 9.940000000000001e-06,
"loss": 0.8684,
"step": 500
},
{
"epoch": 0.36,
"learning_rate": 9.98871794871795e-06,
"loss": 0.8394,
"step": 525
},
{
"epoch": 0.38,
"learning_rate": 9.975897435897436e-06,
"loss": 0.8173,
"step": 550
},
{
"epoch": 0.4,
"learning_rate": 9.963076923076925e-06,
"loss": 0.7998,
"step": 575
},
{
"epoch": 0.42,
"learning_rate": 9.950256410256412e-06,
"loss": 0.7589,
"step": 600
},
{
"epoch": 0.43,
"learning_rate": 9.937435897435898e-06,
"loss": 0.7577,
"step": 625
},
{
"epoch": 0.45,
"learning_rate": 9.924615384615385e-06,
"loss": 0.7371,
"step": 650
},
{
"epoch": 0.47,
"learning_rate": 9.911794871794874e-06,
"loss": 0.7167,
"step": 675
},
{
"epoch": 0.49,
"learning_rate": 9.89897435897436e-06,
"loss": 0.699,
"step": 700
},
{
"epoch": 0.5,
"learning_rate": 9.886153846153846e-06,
"loss": 0.6883,
"step": 725
},
{
"epoch": 0.52,
"learning_rate": 9.873333333333334e-06,
"loss": 0.6787,
"step": 750
},
{
"epoch": 0.54,
"learning_rate": 9.860512820512821e-06,
"loss": 0.6682,
"step": 775
},
{
"epoch": 0.55,
"learning_rate": 9.847692307692308e-06,
"loss": 0.6525,
"step": 800
},
{
"epoch": 0.57,
"learning_rate": 9.834871794871795e-06,
"loss": 0.6428,
"step": 825
},
{
"epoch": 0.59,
"learning_rate": 9.822051282051283e-06,
"loss": 0.6311,
"step": 850
},
{
"epoch": 0.61,
"learning_rate": 9.80923076923077e-06,
"loss": 0.6268,
"step": 875
},
{
"epoch": 0.62,
"learning_rate": 9.796410256410257e-06,
"loss": 0.6258,
"step": 900
},
{
"epoch": 0.64,
"learning_rate": 9.783589743589744e-06,
"loss": 0.6037,
"step": 925
},
{
"epoch": 0.66,
"learning_rate": 9.770769230769232e-06,
"loss": 0.6141,
"step": 950
},
{
"epoch": 0.68,
"learning_rate": 9.757948717948719e-06,
"loss": 0.5919,
"step": 975
},
{
"epoch": 0.69,
"learning_rate": 9.745128205128206e-06,
"loss": 0.587,
"step": 1000
},
{
"epoch": 0.69,
"eval_cer": 29.67639230484148,
"eval_loss": 0.6937438249588013,
"eval_runtime": 166.5539,
"eval_samples_per_second": 11.324,
"eval_steps_per_second": 0.18,
"eval_wer": 75.63360279659166,
"step": 1000
},
{
"epoch": 0.71,
"learning_rate": 9.732307692307693e-06,
"loss": 0.5903,
"step": 1025
},
{
"epoch": 0.73,
"learning_rate": 9.71948717948718e-06,
"loss": 0.5744,
"step": 1050
},
{
"epoch": 0.74,
"learning_rate": 9.706666666666668e-06,
"loss": 0.5705,
"step": 1075
},
{
"epoch": 0.76,
"learning_rate": 9.693846153846155e-06,
"loss": 0.5772,
"step": 1100
},
{
"epoch": 0.78,
"learning_rate": 9.681025641025642e-06,
"loss": 0.558,
"step": 1125
},
{
"epoch": 0.8,
"learning_rate": 9.668205128205129e-06,
"loss": 0.5568,
"step": 1150
},
{
"epoch": 0.81,
"learning_rate": 9.655384615384617e-06,
"loss": 0.5573,
"step": 1175
},
{
"epoch": 0.83,
"learning_rate": 9.642564102564104e-06,
"loss": 0.549,
"step": 1200
},
{
"epoch": 0.85,
"learning_rate": 9.62974358974359e-06,
"loss": 0.5582,
"step": 1225
},
{
"epoch": 0.87,
"learning_rate": 9.616923076923077e-06,
"loss": 0.5485,
"step": 1250
},
{
"epoch": 0.88,
"learning_rate": 9.604102564102566e-06,
"loss": 0.529,
"step": 1275
},
{
"epoch": 0.9,
"learning_rate": 9.591282051282053e-06,
"loss": 0.5238,
"step": 1300
},
{
"epoch": 0.92,
"learning_rate": 9.578461538461538e-06,
"loss": 0.541,
"step": 1325
},
{
"epoch": 0.94,
"learning_rate": 9.565641025641026e-06,
"loss": 0.5281,
"step": 1350
},
{
"epoch": 0.95,
"learning_rate": 9.552820512820513e-06,
"loss": 0.5165,
"step": 1375
},
{
"epoch": 0.97,
"learning_rate": 9.54e-06,
"loss": 0.5146,
"step": 1400
},
{
"epoch": 0.99,
"learning_rate": 9.527179487179487e-06,
"loss": 0.5197,
"step": 1425
},
{
"epoch": 1.0,
"learning_rate": 9.514358974358975e-06,
"loss": 0.504,
"step": 1450
},
{
"epoch": 1.02,
"learning_rate": 9.501538461538462e-06,
"loss": 0.486,
"step": 1475
},
{
"epoch": 1.04,
"learning_rate": 9.488717948717949e-06,
"loss": 0.4967,
"step": 1500
},
{
"epoch": 1.06,
"learning_rate": 9.475897435897436e-06,
"loss": 0.4858,
"step": 1525
},
{
"epoch": 1.07,
"learning_rate": 9.463076923076924e-06,
"loss": 0.4866,
"step": 1550
},
{
"epoch": 1.09,
"learning_rate": 9.450256410256411e-06,
"loss": 0.4791,
"step": 1575
},
{
"epoch": 1.11,
"learning_rate": 9.437435897435898e-06,
"loss": 0.4746,
"step": 1600
},
{
"epoch": 1.13,
"learning_rate": 9.424615384615385e-06,
"loss": 0.4695,
"step": 1625
},
{
"epoch": 1.14,
"learning_rate": 9.411794871794872e-06,
"loss": 0.4619,
"step": 1650
},
{
"epoch": 1.16,
"learning_rate": 9.39897435897436e-06,
"loss": 0.4786,
"step": 1675
},
{
"epoch": 1.18,
"learning_rate": 9.386153846153847e-06,
"loss": 0.469,
"step": 1700
},
{
"epoch": 1.2,
"learning_rate": 9.373333333333334e-06,
"loss": 0.4671,
"step": 1725
},
{
"epoch": 1.21,
"learning_rate": 9.36051282051282e-06,
"loss": 0.4573,
"step": 1750
},
{
"epoch": 1.23,
"learning_rate": 9.34769230769231e-06,
"loss": 0.4634,
"step": 1775
},
{
"epoch": 1.25,
"learning_rate": 9.334871794871796e-06,
"loss": 0.4656,
"step": 1800
},
{
"epoch": 1.26,
"learning_rate": 9.322051282051283e-06,
"loss": 0.4572,
"step": 1825
},
{
"epoch": 1.28,
"learning_rate": 9.30923076923077e-06,
"loss": 0.4623,
"step": 1850
},
{
"epoch": 1.3,
"learning_rate": 9.296410256410258e-06,
"loss": 0.4574,
"step": 1875
},
{
"epoch": 1.32,
"learning_rate": 9.283589743589745e-06,
"loss": 0.4537,
"step": 1900
},
{
"epoch": 1.33,
"learning_rate": 9.270769230769232e-06,
"loss": 0.4544,
"step": 1925
},
{
"epoch": 1.35,
"learning_rate": 9.257948717948719e-06,
"loss": 0.4482,
"step": 1950
},
{
"epoch": 1.37,
"learning_rate": 9.245128205128206e-06,
"loss": 0.441,
"step": 1975
},
{
"epoch": 1.39,
"learning_rate": 9.232307692307692e-06,
"loss": 0.4536,
"step": 2000
},
{
"epoch": 1.39,
"eval_cer": 24.8323843536269,
"eval_loss": 0.553851306438446,
"eval_runtime": 180.9289,
"eval_samples_per_second": 10.424,
"eval_steps_per_second": 0.166,
"eval_wer": 64.818658509941,
"step": 2000
},
{
"epoch": 1.4,
"learning_rate": 9.21948717948718e-06,
"loss": 0.4498,
"step": 2025
},
{
"epoch": 1.42,
"learning_rate": 9.206666666666668e-06,
"loss": 0.4298,
"step": 2050
},
{
"epoch": 1.44,
"learning_rate": 9.193846153846155e-06,
"loss": 0.4314,
"step": 2075
},
{
"epoch": 1.46,
"learning_rate": 9.181025641025641e-06,
"loss": 0.4362,
"step": 2100
},
{
"epoch": 1.47,
"learning_rate": 9.168205128205128e-06,
"loss": 0.4431,
"step": 2125
},
{
"epoch": 1.49,
"learning_rate": 9.155384615384617e-06,
"loss": 0.4272,
"step": 2150
},
{
"epoch": 1.51,
"learning_rate": 9.142564102564104e-06,
"loss": 0.4334,
"step": 2175
},
{
"epoch": 1.52,
"learning_rate": 9.12974358974359e-06,
"loss": 0.4318,
"step": 2200
},
{
"epoch": 1.54,
"learning_rate": 9.116923076923077e-06,
"loss": 0.4221,
"step": 2225
},
{
"epoch": 1.56,
"learning_rate": 9.104102564102566e-06,
"loss": 0.4271,
"step": 2250
},
{
"epoch": 1.58,
"learning_rate": 9.091282051282053e-06,
"loss": 0.4208,
"step": 2275
},
{
"epoch": 1.59,
"learning_rate": 9.07846153846154e-06,
"loss": 0.4272,
"step": 2300
},
{
"epoch": 1.61,
"learning_rate": 9.065641025641026e-06,
"loss": 0.4188,
"step": 2325
},
{
"epoch": 1.63,
"learning_rate": 9.052820512820513e-06,
"loss": 0.4217,
"step": 2350
},
{
"epoch": 1.65,
"learning_rate": 9.040000000000002e-06,
"loss": 0.4231,
"step": 2375
},
{
"epoch": 1.66,
"learning_rate": 9.027179487179488e-06,
"loss": 0.415,
"step": 2400
},
{
"epoch": 1.68,
"learning_rate": 9.014358974358975e-06,
"loss": 0.4112,
"step": 2425
},
{
"epoch": 1.7,
"learning_rate": 9.001538461538462e-06,
"loss": 0.4164,
"step": 2450
},
{
"epoch": 1.72,
"learning_rate": 8.98871794871795e-06,
"loss": 0.4163,
"step": 2475
},
{
"epoch": 1.73,
"learning_rate": 8.975897435897437e-06,
"loss": 0.4109,
"step": 2500
},
{
"epoch": 1.75,
"learning_rate": 8.963076923076924e-06,
"loss": 0.4035,
"step": 2525
},
{
"epoch": 1.77,
"learning_rate": 8.950256410256411e-06,
"loss": 0.4082,
"step": 2550
},
{
"epoch": 1.78,
"learning_rate": 8.937435897435898e-06,
"loss": 0.4099,
"step": 2575
},
{
"epoch": 1.8,
"learning_rate": 8.924615384615385e-06,
"loss": 0.4137,
"step": 2600
},
{
"epoch": 1.82,
"learning_rate": 8.911794871794871e-06,
"loss": 0.409,
"step": 2625
},
{
"epoch": 1.84,
"learning_rate": 8.89897435897436e-06,
"loss": 0.4055,
"step": 2650
},
{
"epoch": 1.85,
"learning_rate": 8.886153846153847e-06,
"loss": 0.4052,
"step": 2675
},
{
"epoch": 1.87,
"learning_rate": 8.873333333333334e-06,
"loss": 0.4104,
"step": 2700
},
{
"epoch": 1.89,
"learning_rate": 8.86051282051282e-06,
"loss": 0.4025,
"step": 2725
},
{
"epoch": 1.91,
"learning_rate": 8.847692307692309e-06,
"loss": 0.4053,
"step": 2750
},
{
"epoch": 1.92,
"learning_rate": 8.834871794871796e-06,
"loss": 0.3937,
"step": 2775
},
{
"epoch": 1.94,
"learning_rate": 8.822051282051283e-06,
"loss": 0.4009,
"step": 2800
},
{
"epoch": 1.96,
"learning_rate": 8.80923076923077e-06,
"loss": 0.402,
"step": 2825
},
{
"epoch": 1.98,
"learning_rate": 8.796410256410258e-06,
"loss": 0.4011,
"step": 2850
},
{
"epoch": 1.99,
"learning_rate": 8.783589743589745e-06,
"loss": 0.4024,
"step": 2875
},
{
"epoch": 2.01,
"learning_rate": 8.770769230769232e-06,
"loss": 0.3799,
"step": 2900
},
{
"epoch": 2.03,
"learning_rate": 8.757948717948718e-06,
"loss": 0.3791,
"step": 2925
},
{
"epoch": 2.04,
"learning_rate": 8.745128205128205e-06,
"loss": 0.3766,
"step": 2950
},
{
"epoch": 2.06,
"learning_rate": 8.732307692307694e-06,
"loss": 0.3736,
"step": 2975
},
{
"epoch": 2.08,
"learning_rate": 8.71948717948718e-06,
"loss": 0.3798,
"step": 3000
},
{
"epoch": 2.08,
"eval_cer": 22.18422559886796,
"eval_loss": 0.49632859230041504,
"eval_runtime": 159.8672,
"eval_samples_per_second": 11.797,
"eval_steps_per_second": 0.188,
"eval_wer": 57.79440681669216,
"step": 3000
},
{
"epoch": 2.1,
"learning_rate": 8.706666666666667e-06,
"loss": 0.3678,
"step": 3025
},
{
"epoch": 2.11,
"learning_rate": 8.693846153846154e-06,
"loss": 0.3698,
"step": 3050
},
{
"epoch": 2.13,
"learning_rate": 8.681025641025643e-06,
"loss": 0.386,
"step": 3075
},
{
"epoch": 2.15,
"learning_rate": 8.66820512820513e-06,
"loss": 0.3633,
"step": 3100
},
{
"epoch": 2.17,
"learning_rate": 8.655384615384616e-06,
"loss": 0.36,
"step": 3125
},
{
"epoch": 2.18,
"learning_rate": 8.642564102564103e-06,
"loss": 0.3637,
"step": 3150
},
{
"epoch": 2.2,
"learning_rate": 8.62974358974359e-06,
"loss": 0.3643,
"step": 3175
},
{
"epoch": 2.22,
"learning_rate": 8.616923076923077e-06,
"loss": 0.372,
"step": 3200
},
{
"epoch": 2.23,
"learning_rate": 8.604102564102564e-06,
"loss": 0.3688,
"step": 3225
},
{
"epoch": 2.25,
"learning_rate": 8.591282051282052e-06,
"loss": 0.3692,
"step": 3250
},
{
"epoch": 2.27,
"learning_rate": 8.578461538461539e-06,
"loss": 0.3741,
"step": 3275
},
{
"epoch": 2.29,
"learning_rate": 8.565641025641026e-06,
"loss": 0.3755,
"step": 3300
},
{
"epoch": 2.3,
"learning_rate": 8.552820512820513e-06,
"loss": 0.3667,
"step": 3325
},
{
"epoch": 2.32,
"learning_rate": 8.540000000000001e-06,
"loss": 0.372,
"step": 3350
},
{
"epoch": 2.34,
"learning_rate": 8.527179487179488e-06,
"loss": 0.3723,
"step": 3375
},
{
"epoch": 2.36,
"learning_rate": 8.514358974358975e-06,
"loss": 0.3581,
"step": 3400
},
{
"epoch": 2.37,
"learning_rate": 8.501538461538462e-06,
"loss": 0.3676,
"step": 3425
},
{
"epoch": 2.39,
"learning_rate": 8.48871794871795e-06,
"loss": 0.3671,
"step": 3450
},
{
"epoch": 2.41,
"learning_rate": 8.475897435897437e-06,
"loss": 0.3622,
"step": 3475
},
{
"epoch": 2.43,
"learning_rate": 8.463076923076924e-06,
"loss": 0.3596,
"step": 3500
},
{
"epoch": 2.44,
"learning_rate": 8.45025641025641e-06,
"loss": 0.3637,
"step": 3525
},
{
"epoch": 2.46,
"learning_rate": 8.437435897435898e-06,
"loss": 0.3656,
"step": 3550
},
{
"epoch": 2.48,
"learning_rate": 8.424615384615386e-06,
"loss": 0.3637,
"step": 3575
},
{
"epoch": 2.49,
"learning_rate": 8.411794871794873e-06,
"loss": 0.3612,
"step": 3600
},
{
"epoch": 2.51,
"learning_rate": 8.39897435897436e-06,
"loss": 0.3568,
"step": 3625
},
{
"epoch": 2.53,
"learning_rate": 8.386153846153847e-06,
"loss": 0.3624,
"step": 3650
},
{
"epoch": 2.55,
"learning_rate": 8.373333333333335e-06,
"loss": 0.3558,
"step": 3675
},
{
"epoch": 2.56,
"learning_rate": 8.360512820512822e-06,
"loss": 0.3594,
"step": 3700
},
{
"epoch": 2.58,
"learning_rate": 8.347692307692309e-06,
"loss": 0.3547,
"step": 3725
},
{
"epoch": 2.6,
"learning_rate": 8.334871794871796e-06,
"loss": 0.3545,
"step": 3750
},
{
"epoch": 2.62,
"learning_rate": 8.322051282051282e-06,
"loss": 0.3484,
"step": 3775
},
{
"epoch": 2.63,
"learning_rate": 8.30923076923077e-06,
"loss": 0.3506,
"step": 3800
},
{
"epoch": 2.65,
"learning_rate": 8.296410256410256e-06,
"loss": 0.3614,
"step": 3825
},
{
"epoch": 2.67,
"learning_rate": 8.283589743589745e-06,
"loss": 0.3486,
"step": 3850
},
{
"epoch": 2.69,
"learning_rate": 8.270769230769231e-06,
"loss": 0.3542,
"step": 3875
},
{
"epoch": 2.7,
"learning_rate": 8.257948717948718e-06,
"loss": 0.3549,
"step": 3900
},
{
"epoch": 2.72,
"learning_rate": 8.245128205128205e-06,
"loss": 0.3505,
"step": 3925
},
{
"epoch": 2.74,
"learning_rate": 8.232307692307694e-06,
"loss": 0.3427,
"step": 3950
},
{
"epoch": 2.75,
"learning_rate": 8.21948717948718e-06,
"loss": 0.3506,
"step": 3975
},
{
"epoch": 2.77,
"learning_rate": 8.206666666666667e-06,
"loss": 0.3423,
"step": 4000
},
{
"epoch": 2.77,
"eval_cer": 20.97048616960345,
"eval_loss": 0.46611809730529785,
"eval_runtime": 150.5434,
"eval_samples_per_second": 12.528,
"eval_steps_per_second": 0.199,
"eval_wer": 54.37513655232685,
"step": 4000
},
{
"epoch": 2.79,
"learning_rate": 8.193846153846154e-06,
"loss": 0.3449,
"step": 4025
},
{
"epoch": 2.81,
"learning_rate": 8.181025641025642e-06,
"loss": 0.3498,
"step": 4050
},
{
"epoch": 2.82,
"learning_rate": 8.16820512820513e-06,
"loss": 0.3403,
"step": 4075
},
{
"epoch": 2.84,
"learning_rate": 8.155384615384616e-06,
"loss": 0.3489,
"step": 4100
},
{
"epoch": 2.86,
"learning_rate": 8.142564102564103e-06,
"loss": 0.3561,
"step": 4125
},
{
"epoch": 2.88,
"learning_rate": 8.12974358974359e-06,
"loss": 0.3476,
"step": 4150
},
{
"epoch": 2.89,
"learning_rate": 8.116923076923078e-06,
"loss": 0.3399,
"step": 4175
},
{
"epoch": 2.91,
"learning_rate": 8.104102564102565e-06,
"loss": 0.3555,
"step": 4200
},
{
"epoch": 2.93,
"learning_rate": 8.091282051282052e-06,
"loss": 0.3354,
"step": 4225
},
{
"epoch": 2.95,
"learning_rate": 8.078461538461539e-06,
"loss": 0.3411,
"step": 4250
},
{
"epoch": 2.96,
"learning_rate": 8.065641025641027e-06,
"loss": 0.3486,
"step": 4275
},
{
"epoch": 2.98,
"learning_rate": 8.052820512820514e-06,
"loss": 0.3468,
"step": 4300
},
{
"epoch": 3.0,
"learning_rate": 8.040000000000001e-06,
"loss": 0.3414,
"step": 4325
},
{
"epoch": 3.01,
"learning_rate": 8.027179487179488e-06,
"loss": 0.3374,
"step": 4350
},
{
"epoch": 3.03,
"learning_rate": 8.014358974358975e-06,
"loss": 0.3301,
"step": 4375
},
{
"epoch": 3.05,
"learning_rate": 8.001538461538461e-06,
"loss": 0.3253,
"step": 4400
},
{
"epoch": 3.07,
"learning_rate": 7.988717948717948e-06,
"loss": 0.321,
"step": 4425
},
{
"epoch": 3.08,
"learning_rate": 7.975897435897437e-06,
"loss": 0.3226,
"step": 4450
},
{
"epoch": 3.1,
"learning_rate": 7.963076923076924e-06,
"loss": 0.3274,
"step": 4475
},
{
"epoch": 3.12,
"learning_rate": 7.95025641025641e-06,
"loss": 0.315,
"step": 4500
},
{
"epoch": 3.14,
"learning_rate": 7.937435897435897e-06,
"loss": 0.322,
"step": 4525
},
{
"epoch": 3.15,
"learning_rate": 7.924615384615386e-06,
"loss": 0.327,
"step": 4550
},
{
"epoch": 3.17,
"learning_rate": 7.911794871794873e-06,
"loss": 0.3262,
"step": 4575
},
{
"epoch": 3.19,
"learning_rate": 7.89897435897436e-06,
"loss": 0.3273,
"step": 4600
},
{
"epoch": 3.21,
"learning_rate": 7.886153846153846e-06,
"loss": 0.3336,
"step": 4625
},
{
"epoch": 3.22,
"learning_rate": 7.873333333333335e-06,
"loss": 0.3263,
"step": 4650
},
{
"epoch": 3.24,
"learning_rate": 7.860512820512822e-06,
"loss": 0.3227,
"step": 4675
},
{
"epoch": 3.26,
"learning_rate": 7.847692307692308e-06,
"loss": 0.3123,
"step": 4700
},
{
"epoch": 3.27,
"learning_rate": 7.834871794871795e-06,
"loss": 0.3231,
"step": 4725
},
{
"epoch": 3.29,
"learning_rate": 7.822051282051282e-06,
"loss": 0.3241,
"step": 4750
},
{
"epoch": 3.31,
"learning_rate": 7.80923076923077e-06,
"loss": 0.3365,
"step": 4775
},
{
"epoch": 3.33,
"learning_rate": 7.796410256410257e-06,
"loss": 0.3153,
"step": 4800
},
{
"epoch": 3.34,
"learning_rate": 7.783589743589744e-06,
"loss": 0.33,
"step": 4825
},
{
"epoch": 3.36,
"learning_rate": 7.770769230769231e-06,
"loss": 0.321,
"step": 4850
},
{
"epoch": 3.38,
"learning_rate": 7.75794871794872e-06,
"loss": 0.3202,
"step": 4875
},
{
"epoch": 3.4,
"learning_rate": 7.745128205128206e-06,
"loss": 0.3245,
"step": 4900
},
{
"epoch": 3.41,
"learning_rate": 7.732307692307693e-06,
"loss": 0.3217,
"step": 4925
},
{
"epoch": 3.43,
"learning_rate": 7.71948717948718e-06,
"loss": 0.3225,
"step": 4950
},
{
"epoch": 3.45,
"learning_rate": 7.706666666666669e-06,
"loss": 0.3212,
"step": 4975
},
{
"epoch": 3.47,
"learning_rate": 7.693846153846154e-06,
"loss": 0.3122,
"step": 5000
},
{
"epoch": 3.47,
"eval_cer": 20.340453488763856,
"eval_loss": 0.4448564648628235,
"eval_runtime": 151.8479,
"eval_samples_per_second": 12.42,
"eval_steps_per_second": 0.198,
"eval_wer": 52.59449421018134,
"step": 5000
},
{
"epoch": 3.48,
"learning_rate": 7.68102564102564e-06,
"loss": 0.3173,
"step": 5025
},
{
"epoch": 3.5,
"learning_rate": 7.668205128205129e-06,
"loss": 0.3252,
"step": 5050
},
{
"epoch": 3.52,
"learning_rate": 7.655384615384616e-06,
"loss": 0.3174,
"step": 5075
},
{
"epoch": 3.53,
"learning_rate": 7.642564102564103e-06,
"loss": 0.3111,
"step": 5100
},
{
"epoch": 3.55,
"learning_rate": 7.62974358974359e-06,
"loss": 0.3074,
"step": 5125
},
{
"epoch": 3.57,
"learning_rate": 7.616923076923077e-06,
"loss": 0.3127,
"step": 5150
},
{
"epoch": 3.59,
"learning_rate": 7.604102564102565e-06,
"loss": 0.3129,
"step": 5175
},
{
"epoch": 3.6,
"learning_rate": 7.591282051282052e-06,
"loss": 0.3136,
"step": 5200
},
{
"epoch": 3.62,
"learning_rate": 7.578461538461539e-06,
"loss": 0.3143,
"step": 5225
},
{
"epoch": 3.64,
"learning_rate": 7.565641025641026e-06,
"loss": 0.3106,
"step": 5250
},
{
"epoch": 3.66,
"learning_rate": 7.552820512820514e-06,
"loss": 0.3162,
"step": 5275
},
{
"epoch": 3.67,
"learning_rate": 7.540000000000001e-06,
"loss": 0.3163,
"step": 5300
},
{
"epoch": 3.69,
"learning_rate": 7.5271794871794875e-06,
"loss": 0.3138,
"step": 5325
},
{
"epoch": 3.71,
"learning_rate": 7.514358974358975e-06,
"loss": 0.3131,
"step": 5350
},
{
"epoch": 3.72,
"learning_rate": 7.501538461538462e-06,
"loss": 0.3164,
"step": 5375
},
{
"epoch": 3.74,
"learning_rate": 7.48871794871795e-06,
"loss": 0.3119,
"step": 5400
},
{
"epoch": 3.76,
"learning_rate": 7.4758974358974365e-06,
"loss": 0.3087,
"step": 5425
},
{
"epoch": 3.78,
"learning_rate": 7.463076923076924e-06,
"loss": 0.3089,
"step": 5450
},
{
"epoch": 3.79,
"learning_rate": 7.450256410256411e-06,
"loss": 0.3066,
"step": 5475
},
{
"epoch": 3.81,
"learning_rate": 7.437435897435899e-06,
"loss": 0.3115,
"step": 5500
},
{
"epoch": 3.83,
"learning_rate": 7.4246153846153855e-06,
"loss": 0.3133,
"step": 5525
},
{
"epoch": 3.85,
"learning_rate": 7.411794871794873e-06,
"loss": 0.31,
"step": 5550
},
{
"epoch": 3.86,
"learning_rate": 7.39897435897436e-06,
"loss": 0.3123,
"step": 5575
},
{
"epoch": 3.88,
"learning_rate": 7.386153846153846e-06,
"loss": 0.3149,
"step": 5600
},
{
"epoch": 3.9,
"learning_rate": 7.373333333333334e-06,
"loss": 0.314,
"step": 5625
},
{
"epoch": 3.92,
"learning_rate": 7.3605128205128204e-06,
"loss": 0.3138,
"step": 5650
},
{
"epoch": 3.93,
"learning_rate": 7.347692307692308e-06,
"loss": 0.3207,
"step": 5675
},
{
"epoch": 3.95,
"learning_rate": 7.334871794871795e-06,
"loss": 0.3207,
"step": 5700
},
{
"epoch": 3.97,
"learning_rate": 7.322051282051283e-06,
"loss": 0.3134,
"step": 5725
},
{
"epoch": 3.98,
"learning_rate": 7.309230769230769e-06,
"loss": 0.3095,
"step": 5750
},
{
"epoch": 4.0,
"learning_rate": 7.296410256410257e-06,
"loss": 0.304,
"step": 5775
},
{
"epoch": 4.02,
"learning_rate": 7.283589743589744e-06,
"loss": 0.2911,
"step": 5800
},
{
"epoch": 4.04,
"learning_rate": 7.270769230769232e-06,
"loss": 0.2908,
"step": 5825
},
{
"epoch": 4.05,
"learning_rate": 7.257948717948718e-06,
"loss": 0.291,
"step": 5850
},
{
"epoch": 4.07,
"learning_rate": 7.245128205128206e-06,
"loss": 0.2951,
"step": 5875
},
{
"epoch": 4.09,
"learning_rate": 7.232307692307693e-06,
"loss": 0.2929,
"step": 5900
},
{
"epoch": 4.11,
"learning_rate": 7.21948717948718e-06,
"loss": 0.2987,
"step": 5925
},
{
"epoch": 4.12,
"learning_rate": 7.206666666666667e-06,
"loss": 0.3001,
"step": 5950
},
{
"epoch": 4.14,
"learning_rate": 7.193846153846154e-06,
"loss": 0.2914,
"step": 5975
},
{
"epoch": 4.16,
"learning_rate": 7.181025641025642e-06,
"loss": 0.3002,
"step": 6000
},
{
"epoch": 4.16,
"eval_cer": 19.349920824770056,
"eval_loss": 0.42852291464805603,
"eval_runtime": 150.6853,
"eval_samples_per_second": 12.516,
"eval_steps_per_second": 0.199,
"eval_wer": 50.507974655888134,
"step": 6000
},
{
"epoch": 4.18,
"learning_rate": 7.168205128205129e-06,
"loss": 0.2952,
"step": 6025
},
{
"epoch": 4.19,
"learning_rate": 7.155384615384616e-06,
"loss": 0.296,
"step": 6050
},
{
"epoch": 4.21,
"learning_rate": 7.142564102564103e-06,
"loss": 0.283,
"step": 6075
},
{
"epoch": 4.23,
"learning_rate": 7.129743589743591e-06,
"loss": 0.2912,
"step": 6100
},
{
"epoch": 4.24,
"learning_rate": 7.116923076923078e-06,
"loss": 0.2941,
"step": 6125
},
{
"epoch": 4.26,
"learning_rate": 7.104102564102565e-06,
"loss": 0.2931,
"step": 6150
},
{
"epoch": 4.28,
"learning_rate": 7.091282051282052e-06,
"loss": 0.2904,
"step": 6175
},
{
"epoch": 4.3,
"learning_rate": 7.078461538461538e-06,
"loss": 0.2949,
"step": 6200
},
{
"epoch": 4.31,
"learning_rate": 7.065641025641026e-06,
"loss": 0.3002,
"step": 6225
},
{
"epoch": 4.33,
"learning_rate": 7.052820512820513e-06,
"loss": 0.291,
"step": 6250
},
{
"epoch": 4.35,
"learning_rate": 7.04e-06,
"loss": 0.2851,
"step": 6275
},
{
"epoch": 4.37,
"learning_rate": 7.027179487179487e-06,
"loss": 0.2827,
"step": 6300
},
{
"epoch": 4.38,
"learning_rate": 7.014358974358975e-06,
"loss": 0.2966,
"step": 6325
},
{
"epoch": 4.4,
"learning_rate": 7.001538461538462e-06,
"loss": 0.2902,
"step": 6350
},
{
"epoch": 4.42,
"learning_rate": 6.988717948717949e-06,
"loss": 0.2981,
"step": 6375
},
{
"epoch": 4.44,
"learning_rate": 6.975897435897436e-06,
"loss": 0.2989,
"step": 6400
},
{
"epoch": 4.45,
"learning_rate": 6.963076923076924e-06,
"loss": 0.2868,
"step": 6425
},
{
"epoch": 4.47,
"learning_rate": 6.950256410256411e-06,
"loss": 0.288,
"step": 6450
},
{
"epoch": 4.49,
"learning_rate": 6.937435897435898e-06,
"loss": 0.2941,
"step": 6475
},
{
"epoch": 4.5,
"learning_rate": 6.924615384615385e-06,
"loss": 0.2922,
"step": 6500
},
{
"epoch": 4.52,
"learning_rate": 6.911794871794872e-06,
"loss": 0.2867,
"step": 6525
},
{
"epoch": 4.54,
"learning_rate": 6.89897435897436e-06,
"loss": 0.2993,
"step": 6550
},
{
"epoch": 4.56,
"learning_rate": 6.8861538461538465e-06,
"loss": 0.2889,
"step": 6575
},
{
"epoch": 4.57,
"learning_rate": 6.873333333333334e-06,
"loss": 0.2941,
"step": 6600
},
{
"epoch": 4.59,
"learning_rate": 6.860512820512821e-06,
"loss": 0.2939,
"step": 6625
},
{
"epoch": 4.61,
"learning_rate": 6.847692307692309e-06,
"loss": 0.2979,
"step": 6650
},
{
"epoch": 4.63,
"learning_rate": 6.8348717948717955e-06,
"loss": 0.2894,
"step": 6675
},
{
"epoch": 4.64,
"learning_rate": 6.822051282051283e-06,
"loss": 0.2878,
"step": 6700
},
{
"epoch": 4.66,
"learning_rate": 6.80923076923077e-06,
"loss": 0.2887,
"step": 6725
},
{
"epoch": 4.68,
"learning_rate": 6.796410256410258e-06,
"loss": 0.2859,
"step": 6750
},
{
"epoch": 4.7,
"learning_rate": 6.7835897435897445e-06,
"loss": 0.2929,
"step": 6775
},
{
"epoch": 4.71,
"learning_rate": 6.770769230769232e-06,
"loss": 0.2888,
"step": 6800
},
{
"epoch": 4.73,
"learning_rate": 6.757948717948718e-06,
"loss": 0.2969,
"step": 6825
},
{
"epoch": 4.75,
"learning_rate": 6.745128205128205e-06,
"loss": 0.289,
"step": 6850
},
{
"epoch": 4.76,
"learning_rate": 6.732307692307693e-06,
"loss": 0.2876,
"step": 6875
},
{
"epoch": 4.78,
"learning_rate": 6.7194871794871794e-06,
"loss": 0.2868,
"step": 6900
},
{
"epoch": 4.8,
"learning_rate": 6.706666666666667e-06,
"loss": 0.2839,
"step": 6925
},
{
"epoch": 4.82,
"learning_rate": 6.693846153846154e-06,
"loss": 0.2807,
"step": 6950
},
{
"epoch": 4.83,
"learning_rate": 6.681025641025642e-06,
"loss": 0.286,
"step": 6975
},
{
"epoch": 4.85,
"learning_rate": 6.6682051282051284e-06,
"loss": 0.2842,
"step": 7000
},
{
"epoch": 4.85,
"eval_cer": 19.02816616690812,
"eval_loss": 0.41709569096565247,
"eval_runtime": 150.2276,
"eval_samples_per_second": 12.554,
"eval_steps_per_second": 0.2,
"eval_wer": 49.393707668778674,
"step": 7000
},
{
"epoch": 4.87,
"learning_rate": 6.655384615384616e-06,
"loss": 0.2869,
"step": 7025
},
{
"epoch": 4.89,
"learning_rate": 6.642564102564103e-06,
"loss": 0.2916,
"step": 7050
},
{
"epoch": 4.9,
"learning_rate": 6.629743589743591e-06,
"loss": 0.2826,
"step": 7075
},
{
"epoch": 4.92,
"learning_rate": 6.616923076923077e-06,
"loss": 0.298,
"step": 7100
},
{
"epoch": 4.94,
"learning_rate": 6.604102564102565e-06,
"loss": 0.2878,
"step": 7125
},
{
"epoch": 4.95,
"learning_rate": 6.591282051282052e-06,
"loss": 0.2898,
"step": 7150
},
{
"epoch": 4.97,
"learning_rate": 6.578461538461539e-06,
"loss": 0.29,
"step": 7175
},
{
"epoch": 4.99,
"learning_rate": 6.565641025641026e-06,
"loss": 0.2902,
"step": 7200
},
{
"epoch": 5.01,
"learning_rate": 6.552820512820513e-06,
"loss": 0.2766,
"step": 7225
},
{
"epoch": 5.02,
"learning_rate": 6.540000000000001e-06,
"loss": 0.2669,
"step": 7250
},
{
"epoch": 5.04,
"learning_rate": 6.527179487179488e-06,
"loss": 0.2708,
"step": 7275
},
{
"epoch": 5.06,
"learning_rate": 6.514358974358975e-06,
"loss": 0.2743,
"step": 7300
},
{
"epoch": 5.08,
"learning_rate": 6.501538461538462e-06,
"loss": 0.2736,
"step": 7325
},
{
"epoch": 5.09,
"learning_rate": 6.48871794871795e-06,
"loss": 0.271,
"step": 7350
},
{
"epoch": 5.11,
"learning_rate": 6.475897435897437e-06,
"loss": 0.2633,
"step": 7375
},
{
"epoch": 5.13,
"learning_rate": 6.463076923076924e-06,
"loss": 0.271,
"step": 7400
},
{
"epoch": 5.15,
"learning_rate": 6.45025641025641e-06,
"loss": 0.2744,
"step": 7425
},
{
"epoch": 5.16,
"learning_rate": 6.437435897435897e-06,
"loss": 0.2713,
"step": 7450
},
{
"epoch": 5.18,
"learning_rate": 6.424615384615385e-06,
"loss": 0.2758,
"step": 7475
},
{
"epoch": 5.2,
"learning_rate": 6.411794871794872e-06,
"loss": 0.2766,
"step": 7500
},
{
"epoch": 5.21,
"learning_rate": 6.398974358974359e-06,
"loss": 0.2741,
"step": 7525
},
{
"epoch": 5.23,
"learning_rate": 6.386153846153846e-06,
"loss": 0.2735,
"step": 7550
},
{
"epoch": 5.25,
"learning_rate": 6.373333333333334e-06,
"loss": 0.2666,
"step": 7575
},
{
"epoch": 5.27,
"learning_rate": 6.360512820512821e-06,
"loss": 0.276,
"step": 7600
},
{
"epoch": 5.28,
"learning_rate": 6.347692307692308e-06,
"loss": 0.2742,
"step": 7625
},
{
"epoch": 5.3,
"learning_rate": 6.334871794871795e-06,
"loss": 0.2684,
"step": 7650
},
{
"epoch": 5.32,
"learning_rate": 6.322051282051283e-06,
"loss": 0.2833,
"step": 7675
},
{
"epoch": 5.34,
"learning_rate": 6.30923076923077e-06,
"loss": 0.2681,
"step": 7700
},
{
"epoch": 5.35,
"learning_rate": 6.296410256410257e-06,
"loss": 0.2719,
"step": 7725
},
{
"epoch": 5.37,
"learning_rate": 6.283589743589744e-06,
"loss": 0.2617,
"step": 7750
},
{
"epoch": 5.39,
"learning_rate": 6.270769230769231e-06,
"loss": 0.272,
"step": 7775
},
{
"epoch": 5.41,
"learning_rate": 6.257948717948719e-06,
"loss": 0.2744,
"step": 7800
},
{
"epoch": 5.42,
"learning_rate": 6.2451282051282055e-06,
"loss": 0.2734,
"step": 7825
},
{
"epoch": 5.44,
"learning_rate": 6.232307692307693e-06,
"loss": 0.2767,
"step": 7850
},
{
"epoch": 5.46,
"learning_rate": 6.21948717948718e-06,
"loss": 0.2781,
"step": 7875
},
{
"epoch": 5.47,
"learning_rate": 6.206666666666668e-06,
"loss": 0.2743,
"step": 7900
},
{
"epoch": 5.49,
"learning_rate": 6.1938461538461545e-06,
"loss": 0.2651,
"step": 7925
},
{
"epoch": 5.51,
"learning_rate": 6.181025641025642e-06,
"loss": 0.2684,
"step": 7950
},
{
"epoch": 5.53,
"learning_rate": 6.168205128205129e-06,
"loss": 0.2656,
"step": 7975
},
{
"epoch": 5.54,
"learning_rate": 6.155384615384617e-06,
"loss": 0.2655,
"step": 8000
},
{
"epoch": 5.54,
"eval_cer": 18.604494457733903,
"eval_loss": 0.40993332862854004,
"eval_runtime": 151.2755,
"eval_samples_per_second": 12.467,
"eval_steps_per_second": 0.198,
"eval_wer": 48.67271138300197,
"step": 8000
},
{
"epoch": 5.56,
"learning_rate": 6.142564102564103e-06,
"loss": 0.2794,
"step": 8025
},
{
"epoch": 5.58,
"learning_rate": 6.1297435897435895e-06,
"loss": 0.271,
"step": 8050
},
{
"epoch": 5.6,
"learning_rate": 6.1174358974358986e-06,
"loss": 0.276,
"step": 8075
},
{
"epoch": 5.61,
"learning_rate": 6.104615384615385e-06,
"loss": 0.2712,
"step": 8100
},
{
"epoch": 5.63,
"learning_rate": 6.091794871794873e-06,
"loss": 0.2731,
"step": 8125
},
{
"epoch": 5.65,
"learning_rate": 6.07897435897436e-06,
"loss": 0.2726,
"step": 8150
},
{
"epoch": 5.67,
"learning_rate": 6.0661538461538476e-06,
"loss": 0.2723,
"step": 8175
},
{
"epoch": 5.68,
"learning_rate": 6.0533333333333335e-06,
"loss": 0.2694,
"step": 8200
},
{
"epoch": 5.7,
"learning_rate": 6.04051282051282e-06,
"loss": 0.2756,
"step": 8225
},
{
"epoch": 5.72,
"learning_rate": 6.027692307692308e-06,
"loss": 0.2666,
"step": 8250
},
{
"epoch": 5.73,
"learning_rate": 6.014871794871795e-06,
"loss": 0.2757,
"step": 8275
},
{
"epoch": 5.75,
"learning_rate": 6.0020512820512825e-06,
"loss": 0.2717,
"step": 8300
},
{
"epoch": 5.77,
"learning_rate": 5.989230769230769e-06,
"loss": 0.2808,
"step": 8325
},
{
"epoch": 5.79,
"learning_rate": 5.976410256410257e-06,
"loss": 0.2699,
"step": 8350
},
{
"epoch": 5.8,
"learning_rate": 5.963589743589744e-06,
"loss": 0.2711,
"step": 8375
},
{
"epoch": 5.82,
"learning_rate": 5.950769230769231e-06,
"loss": 0.2649,
"step": 8400
},
{
"epoch": 5.84,
"learning_rate": 5.937948717948718e-06,
"loss": 0.2647,
"step": 8425
},
{
"epoch": 5.86,
"learning_rate": 5.925128205128205e-06,
"loss": 0.2696,
"step": 8450
},
{
"epoch": 5.87,
"learning_rate": 5.912307692307693e-06,
"loss": 0.2662,
"step": 8475
},
{
"epoch": 5.89,
"learning_rate": 5.89948717948718e-06,
"loss": 0.2714,
"step": 8500
},
{
"epoch": 5.91,
"learning_rate": 5.886666666666667e-06,
"loss": 0.2693,
"step": 8525
},
{
"epoch": 5.93,
"learning_rate": 5.873846153846154e-06,
"loss": 0.2694,
"step": 8550
},
{
"epoch": 5.94,
"learning_rate": 5.861025641025642e-06,
"loss": 0.2661,
"step": 8575
},
{
"epoch": 5.96,
"learning_rate": 5.848205128205129e-06,
"loss": 0.2779,
"step": 8600
},
{
"epoch": 5.98,
"learning_rate": 5.835384615384616e-06,
"loss": 0.2744,
"step": 8625
},
{
"epoch": 5.99,
"learning_rate": 5.822564102564103e-06,
"loss": 0.2628,
"step": 8650
},
{
"epoch": 6.01,
"learning_rate": 5.809743589743591e-06,
"loss": 0.2587,
"step": 8675
},
{
"epoch": 6.03,
"learning_rate": 5.796923076923078e-06,
"loss": 0.2622,
"step": 8700
},
{
"epoch": 6.05,
"learning_rate": 5.784102564102565e-06,
"loss": 0.2532,
"step": 8725
},
{
"epoch": 6.06,
"learning_rate": 5.771282051282052e-06,
"loss": 0.2564,
"step": 8750
},
{
"epoch": 6.08,
"learning_rate": 5.75846153846154e-06,
"loss": 0.261,
"step": 8775
},
{
"epoch": 6.1,
"learning_rate": 5.745641025641027e-06,
"loss": 0.2553,
"step": 8800
},
{
"epoch": 6.12,
"learning_rate": 5.732820512820513e-06,
"loss": 0.256,
"step": 8825
},
{
"epoch": 6.13,
"learning_rate": 5.72e-06,
"loss": 0.2517,
"step": 8850
},
{
"epoch": 6.15,
"learning_rate": 5.707179487179487e-06,
"loss": 0.2559,
"step": 8875
},
{
"epoch": 6.17,
"learning_rate": 5.694358974358975e-06,
"loss": 0.2568,
"step": 8900
},
{
"epoch": 6.19,
"learning_rate": 5.681538461538462e-06,
"loss": 0.2557,
"step": 8925
},
{
"epoch": 6.2,
"learning_rate": 5.668717948717949e-06,
"loss": 0.2598,
"step": 8950
},
{
"epoch": 6.22,
"learning_rate": 5.655897435897436e-06,
"loss": 0.2602,
"step": 8975
},
{
"epoch": 6.24,
"learning_rate": 5.643076923076923e-06,
"loss": 0.2555,
"step": 9000
},
{
"epoch": 6.24,
"eval_cer": 18.33917320844985,
"eval_loss": 0.40347620844841003,
"eval_runtime": 151.4937,
"eval_samples_per_second": 12.449,
"eval_steps_per_second": 0.198,
"eval_wer": 48.20843347170636,
"step": 9000
},
{
"epoch": 6.25,
"learning_rate": 5.630256410256411e-06,
"loss": 0.2542,
"step": 9025
},
{
"epoch": 6.27,
"learning_rate": 5.6174358974358974e-06,
"loss": 0.2552,
"step": 9050
},
{
"epoch": 6.29,
"learning_rate": 5.604615384615385e-06,
"loss": 0.2568,
"step": 9075
},
{
"epoch": 6.31,
"learning_rate": 5.591794871794872e-06,
"loss": 0.2594,
"step": 9100
},
{
"epoch": 6.32,
"learning_rate": 5.57897435897436e-06,
"loss": 0.2597,
"step": 9125
},
{
"epoch": 6.34,
"learning_rate": 5.566153846153846e-06,
"loss": 0.2556,
"step": 9150
},
{
"epoch": 6.36,
"learning_rate": 5.553333333333334e-06,
"loss": 0.2526,
"step": 9175
},
{
"epoch": 6.38,
"learning_rate": 5.540512820512821e-06,
"loss": 0.2609,
"step": 9200
},
{
"epoch": 6.39,
"learning_rate": 5.527692307692309e-06,
"loss": 0.2605,
"step": 9225
},
{
"epoch": 6.41,
"learning_rate": 5.514871794871795e-06,
"loss": 0.257,
"step": 9250
},
{
"epoch": 6.43,
"learning_rate": 5.502051282051283e-06,
"loss": 0.2616,
"step": 9275
},
{
"epoch": 6.44,
"learning_rate": 5.48923076923077e-06,
"loss": 0.2561,
"step": 9300
},
{
"epoch": 6.46,
"learning_rate": 5.476410256410258e-06,
"loss": 0.2558,
"step": 9325
},
{
"epoch": 6.48,
"learning_rate": 5.463589743589744e-06,
"loss": 0.2517,
"step": 9350
},
{
"epoch": 6.5,
"learning_rate": 5.450769230769232e-06,
"loss": 0.2546,
"step": 9375
},
{
"epoch": 6.51,
"learning_rate": 5.437948717948719e-06,
"loss": 0.2548,
"step": 9400
},
{
"epoch": 6.53,
"learning_rate": 5.425128205128205e-06,
"loss": 0.2541,
"step": 9425
},
{
"epoch": 6.55,
"learning_rate": 5.4123076923076925e-06,
"loss": 0.2581,
"step": 9450
},
{
"epoch": 6.57,
"learning_rate": 5.399487179487179e-06,
"loss": 0.2578,
"step": 9475
},
{
"epoch": 6.58,
"learning_rate": 5.386666666666667e-06,
"loss": 0.2519,
"step": 9500
},
{
"epoch": 6.6,
"learning_rate": 5.373846153846154e-06,
"loss": 0.2651,
"step": 9525
},
{
"epoch": 6.62,
"learning_rate": 5.3610256410256415e-06,
"loss": 0.2562,
"step": 9550
},
{
"epoch": 6.64,
"learning_rate": 5.348205128205128e-06,
"loss": 0.2552,
"step": 9575
},
{
"epoch": 6.65,
"learning_rate": 5.335384615384615e-06,
"loss": 0.2658,
"step": 9600
},
{
"epoch": 6.67,
"learning_rate": 5.322564102564103e-06,
"loss": 0.2504,
"step": 9625
},
{
"epoch": 6.69,
"learning_rate": 5.30974358974359e-06,
"loss": 0.2531,
"step": 9650
},
{
"epoch": 6.7,
"learning_rate": 5.296923076923077e-06,
"loss": 0.2529,
"step": 9675
},
{
"epoch": 6.72,
"learning_rate": 5.284102564102564e-06,
"loss": 0.2569,
"step": 9700
},
{
"epoch": 6.74,
"learning_rate": 5.271282051282052e-06,
"loss": 0.2634,
"step": 9725
},
{
"epoch": 6.76,
"learning_rate": 5.258461538461539e-06,
"loss": 0.2586,
"step": 9750
},
{
"epoch": 6.77,
"learning_rate": 5.245641025641026e-06,
"loss": 0.2544,
"step": 9775
},
{
"epoch": 6.79,
"learning_rate": 5.232820512820513e-06,
"loss": 0.2585,
"step": 9800
},
{
"epoch": 6.81,
"learning_rate": 5.220000000000001e-06,
"loss": 0.2569,
"step": 9825
},
{
"epoch": 6.83,
"learning_rate": 5.207179487179488e-06,
"loss": 0.2511,
"step": 9850
},
{
"epoch": 6.84,
"learning_rate": 5.194358974358975e-06,
"loss": 0.2517,
"step": 9875
},
{
"epoch": 6.86,
"learning_rate": 5.181538461538462e-06,
"loss": 0.2508,
"step": 9900
},
{
"epoch": 6.88,
"learning_rate": 5.16871794871795e-06,
"loss": 0.2537,
"step": 9925
},
{
"epoch": 6.9,
"learning_rate": 5.155897435897437e-06,
"loss": 0.2525,
"step": 9950
},
{
"epoch": 6.91,
"learning_rate": 5.143076923076924e-06,
"loss": 0.2592,
"step": 9975
},
{
"epoch": 6.93,
"learning_rate": 5.130256410256411e-06,
"loss": 0.2525,
"step": 10000
},
{
"epoch": 6.93,
"eval_cer": 17.83379940028975,
"eval_loss": 0.39897266030311584,
"eval_runtime": 142.0559,
"eval_samples_per_second": 13.276,
"eval_steps_per_second": 0.211,
"eval_wer": 47.32903648678173,
"step": 10000
},
{
"epoch": 6.95,
"learning_rate": 5.117435897435897e-06,
"loss": 0.2527,
"step": 10025
},
{
"epoch": 6.96,
"learning_rate": 5.104615384615385e-06,
"loss": 0.2529,
"step": 10050
},
{
"epoch": 6.98,
"learning_rate": 5.091794871794872e-06,
"loss": 0.2515,
"step": 10075
},
{
"epoch": 7.0,
"learning_rate": 5.078974358974359e-06,
"loss": 0.2612,
"step": 10100
},
{
"epoch": 7.02,
"learning_rate": 5.0666666666666676e-06,
"loss": 0.2435,
"step": 10125
},
{
"epoch": 7.03,
"learning_rate": 5.053846153846154e-06,
"loss": 0.2416,
"step": 10150
},
{
"epoch": 7.05,
"learning_rate": 5.041025641025642e-06,
"loss": 0.2346,
"step": 10175
},
{
"epoch": 7.07,
"learning_rate": 5.028205128205128e-06,
"loss": 0.2408,
"step": 10200
},
{
"epoch": 7.09,
"learning_rate": 5.015384615384616e-06,
"loss": 0.2412,
"step": 10225
},
{
"epoch": 7.1,
"learning_rate": 5.0025641025641025e-06,
"loss": 0.2456,
"step": 10250
},
{
"epoch": 7.12,
"learning_rate": 4.98974358974359e-06,
"loss": 0.2434,
"step": 10275
},
{
"epoch": 7.14,
"learning_rate": 4.976923076923078e-06,
"loss": 0.2446,
"step": 10300
},
{
"epoch": 7.16,
"learning_rate": 4.964102564102565e-06,
"loss": 0.2444,
"step": 10325
},
{
"epoch": 7.17,
"learning_rate": 4.9512820512820515e-06,
"loss": 0.2508,
"step": 10350
},
{
"epoch": 7.19,
"learning_rate": 4.938461538461538e-06,
"loss": 0.242,
"step": 10375
},
{
"epoch": 7.21,
"learning_rate": 4.925641025641026e-06,
"loss": 0.2388,
"step": 10400
},
{
"epoch": 7.22,
"learning_rate": 4.912820512820513e-06,
"loss": 0.2411,
"step": 10425
},
{
"epoch": 7.24,
"learning_rate": 4.9000000000000005e-06,
"loss": 0.2489,
"step": 10450
},
{
"epoch": 7.26,
"learning_rate": 4.887179487179487e-06,
"loss": 0.2474,
"step": 10475
},
{
"epoch": 7.28,
"learning_rate": 4.874358974358975e-06,
"loss": 0.246,
"step": 10500
},
{
"epoch": 7.29,
"learning_rate": 4.861538461538462e-06,
"loss": 0.2382,
"step": 10525
},
{
"epoch": 7.31,
"learning_rate": 4.8487179487179495e-06,
"loss": 0.2473,
"step": 10550
},
{
"epoch": 7.33,
"learning_rate": 4.835897435897436e-06,
"loss": 0.2483,
"step": 10575
},
{
"epoch": 7.35,
"learning_rate": 4.823076923076924e-06,
"loss": 0.2456,
"step": 10600
},
{
"epoch": 7.36,
"learning_rate": 4.810256410256411e-06,
"loss": 0.2509,
"step": 10625
},
{
"epoch": 7.38,
"learning_rate": 4.7974358974358985e-06,
"loss": 0.2449,
"step": 10650
},
{
"epoch": 7.4,
"learning_rate": 4.7846153846153845e-06,
"loss": 0.2377,
"step": 10675
},
{
"epoch": 7.42,
"learning_rate": 4.771794871794872e-06,
"loss": 0.2507,
"step": 10700
},
{
"epoch": 7.43,
"learning_rate": 4.758974358974359e-06,
"loss": 0.2443,
"step": 10725
},
{
"epoch": 7.45,
"learning_rate": 4.746153846153847e-06,
"loss": 0.2441,
"step": 10750
},
{
"epoch": 7.47,
"learning_rate": 4.7333333333333335e-06,
"loss": 0.2493,
"step": 10775
},
{
"epoch": 7.48,
"learning_rate": 4.720512820512821e-06,
"loss": 0.2355,
"step": 10800
},
{
"epoch": 7.5,
"learning_rate": 4.707692307692308e-06,
"loss": 0.2391,
"step": 10825
},
{
"epoch": 7.52,
"learning_rate": 4.694871794871796e-06,
"loss": 0.2375,
"step": 10850
},
{
"epoch": 7.54,
"learning_rate": 4.6820512820512825e-06,
"loss": 0.2453,
"step": 10875
},
{
"epoch": 7.55,
"learning_rate": 4.66923076923077e-06,
"loss": 0.2469,
"step": 10900
},
{
"epoch": 7.57,
"learning_rate": 4.656410256410257e-06,
"loss": 0.2428,
"step": 10925
},
{
"epoch": 7.59,
"learning_rate": 4.643589743589745e-06,
"loss": 0.243,
"step": 10950
},
{
"epoch": 7.61,
"learning_rate": 4.630769230769231e-06,
"loss": 0.2448,
"step": 10975
},
{
"epoch": 7.62,
"learning_rate": 4.617948717948718e-06,
"loss": 0.243,
"step": 11000
},
{
"epoch": 7.62,
"eval_cer": 18.252417371382364,
"eval_loss": 0.39634308218955994,
"eval_runtime": 151.5788,
"eval_samples_per_second": 12.442,
"eval_steps_per_second": 0.198,
"eval_wer": 47.05593183307843,
"step": 11000
},
{
"epoch": 7.64,
"learning_rate": 4.605128205128205e-06,
"loss": 0.2444,
"step": 11025
},
{
"epoch": 7.66,
"learning_rate": 4.592307692307693e-06,
"loss": 0.2537,
"step": 11050
},
{
"epoch": 7.67,
"learning_rate": 4.57948717948718e-06,
"loss": 0.2423,
"step": 11075
},
{
"epoch": 7.69,
"learning_rate": 4.566666666666667e-06,
"loss": 0.2405,
"step": 11100
},
{
"epoch": 7.71,
"learning_rate": 4.553846153846154e-06,
"loss": 0.2438,
"step": 11125
},
{
"epoch": 7.73,
"learning_rate": 4.541025641025642e-06,
"loss": 0.2439,
"step": 11150
},
{
"epoch": 7.74,
"learning_rate": 4.528205128205129e-06,
"loss": 0.2447,
"step": 11175
},
{
"epoch": 7.76,
"learning_rate": 4.515384615384616e-06,
"loss": 0.2412,
"step": 11200
},
{
"epoch": 7.78,
"learning_rate": 4.502564102564103e-06,
"loss": 0.2421,
"step": 11225
},
{
"epoch": 7.8,
"learning_rate": 4.489743589743591e-06,
"loss": 0.2418,
"step": 11250
},
{
"epoch": 7.81,
"learning_rate": 4.476923076923077e-06,
"loss": 0.2444,
"step": 11275
},
{
"epoch": 7.83,
"learning_rate": 4.464102564102564e-06,
"loss": 0.2411,
"step": 11300
},
{
"epoch": 7.85,
"learning_rate": 4.451282051282051e-06,
"loss": 0.251,
"step": 11325
},
{
"epoch": 7.87,
"learning_rate": 4.438461538461539e-06,
"loss": 0.2412,
"step": 11350
},
{
"epoch": 7.88,
"learning_rate": 4.425641025641026e-06,
"loss": 0.2457,
"step": 11375
},
{
"epoch": 7.9,
"learning_rate": 4.412820512820513e-06,
"loss": 0.2419,
"step": 11400
},
{
"epoch": 7.92,
"learning_rate": 4.4e-06,
"loss": 0.2469,
"step": 11425
},
{
"epoch": 7.93,
"learning_rate": 4.387179487179488e-06,
"loss": 0.2432,
"step": 11450
},
{
"epoch": 7.95,
"learning_rate": 4.374358974358975e-06,
"loss": 0.2461,
"step": 11475
},
{
"epoch": 7.97,
"learning_rate": 4.361538461538462e-06,
"loss": 0.2409,
"step": 11500
},
{
"epoch": 7.99,
"learning_rate": 4.348717948717949e-06,
"loss": 0.2443,
"step": 11525
},
{
"epoch": 8.0,
"learning_rate": 4.335897435897437e-06,
"loss": 0.2467,
"step": 11550
},
{
"epoch": 8.02,
"learning_rate": 4.323076923076923e-06,
"loss": 0.2341,
"step": 11575
},
{
"epoch": 8.04,
"learning_rate": 4.3102564102564105e-06,
"loss": 0.2319,
"step": 11600
},
{
"epoch": 8.06,
"learning_rate": 4.297435897435897e-06,
"loss": 0.2308,
"step": 11625
},
{
"epoch": 8.07,
"learning_rate": 4.284615384615385e-06,
"loss": 0.2379,
"step": 11650
},
{
"epoch": 8.09,
"learning_rate": 4.271794871794872e-06,
"loss": 0.2352,
"step": 11675
},
{
"epoch": 8.11,
"learning_rate": 4.2589743589743595e-06,
"loss": 0.2359,
"step": 11700
},
{
"epoch": 8.13,
"learning_rate": 4.246153846153846e-06,
"loss": 0.2386,
"step": 11725
},
{
"epoch": 8.14,
"learning_rate": 4.233333333333334e-06,
"loss": 0.2344,
"step": 11750
},
{
"epoch": 8.16,
"learning_rate": 4.220512820512821e-06,
"loss": 0.2325,
"step": 11775
},
{
"epoch": 8.18,
"learning_rate": 4.2076923076923085e-06,
"loss": 0.2293,
"step": 11800
},
{
"epoch": 8.19,
"learning_rate": 4.194871794871795e-06,
"loss": 0.2316,
"step": 11825
},
{
"epoch": 8.21,
"learning_rate": 4.182051282051283e-06,
"loss": 0.2358,
"step": 11850
},
{
"epoch": 8.23,
"learning_rate": 4.169230769230769e-06,
"loss": 0.2354,
"step": 11875
},
{
"epoch": 8.25,
"learning_rate": 4.156410256410257e-06,
"loss": 0.2327,
"step": 11900
},
{
"epoch": 8.26,
"learning_rate": 4.1435897435897435e-06,
"loss": 0.2349,
"step": 11925
},
{
"epoch": 8.28,
"learning_rate": 4.130769230769231e-06,
"loss": 0.2391,
"step": 11950
},
{
"epoch": 8.3,
"learning_rate": 4.117948717948718e-06,
"loss": 0.2391,
"step": 11975
},
{
"epoch": 8.32,
"learning_rate": 4.105128205128206e-06,
"loss": 0.2358,
"step": 12000
},
{
"epoch": 8.32,
"eval_cer": 17.818638186044943,
"eval_loss": 0.3948447108268738,
"eval_runtime": 151.3726,
"eval_samples_per_second": 12.459,
"eval_steps_per_second": 0.198,
"eval_wer": 46.733668341708544,
"step": 12000
},
{
"epoch": 8.33,
"learning_rate": 4.0923076923076925e-06,
"loss": 0.2293,
"step": 12025
},
{
"epoch": 8.35,
"learning_rate": 4.07948717948718e-06,
"loss": 0.2345,
"step": 12050
},
{
"epoch": 8.37,
"learning_rate": 4.066666666666667e-06,
"loss": 0.2317,
"step": 12075
},
{
"epoch": 8.39,
"learning_rate": 4.053846153846155e-06,
"loss": 0.2325,
"step": 12100
},
{
"epoch": 8.4,
"learning_rate": 4.0410256410256415e-06,
"loss": 0.2346,
"step": 12125
},
{
"epoch": 8.42,
"learning_rate": 4.028205128205129e-06,
"loss": 0.2287,
"step": 12150
},
{
"epoch": 8.44,
"learning_rate": 4.015384615384615e-06,
"loss": 0.2352,
"step": 12175
},
{
"epoch": 8.45,
"learning_rate": 4.002564102564103e-06,
"loss": 0.231,
"step": 12200
},
{
"epoch": 8.47,
"learning_rate": 3.98974358974359e-06,
"loss": 0.2305,
"step": 12225
},
{
"epoch": 8.49,
"learning_rate": 3.976923076923077e-06,
"loss": 0.2392,
"step": 12250
},
{
"epoch": 8.51,
"learning_rate": 3.964102564102564e-06,
"loss": 0.2344,
"step": 12275
},
{
"epoch": 8.52,
"learning_rate": 3.951282051282052e-06,
"loss": 0.2405,
"step": 12300
},
{
"epoch": 8.54,
"learning_rate": 3.938461538461539e-06,
"loss": 0.233,
"step": 12325
},
{
"epoch": 8.56,
"learning_rate": 3.925641025641026e-06,
"loss": 0.2371,
"step": 12350
},
{
"epoch": 8.58,
"learning_rate": 3.913333333333334e-06,
"loss": 0.2319,
"step": 12375
},
{
"epoch": 8.59,
"learning_rate": 3.9005128205128205e-06,
"loss": 0.2351,
"step": 12400
},
{
"epoch": 8.61,
"learning_rate": 3.887692307692308e-06,
"loss": 0.235,
"step": 12425
},
{
"epoch": 8.63,
"learning_rate": 3.874871794871795e-06,
"loss": 0.2396,
"step": 12450
},
{
"epoch": 8.65,
"learning_rate": 3.862051282051283e-06,
"loss": 0.2351,
"step": 12475
},
{
"epoch": 8.66,
"learning_rate": 3.8492307692307695e-06,
"loss": 0.2379,
"step": 12500
},
{
"epoch": 8.68,
"learning_rate": 3.836410256410257e-06,
"loss": 0.2295,
"step": 12525
},
{
"epoch": 8.7,
"learning_rate": 3.823589743589744e-06,
"loss": 0.2333,
"step": 12550
},
{
"epoch": 8.71,
"learning_rate": 3.8107692307692313e-06,
"loss": 0.2312,
"step": 12575
},
{
"epoch": 8.73,
"learning_rate": 3.7979487179487185e-06,
"loss": 0.2348,
"step": 12600
},
{
"epoch": 8.75,
"learning_rate": 3.7851282051282058e-06,
"loss": 0.2336,
"step": 12625
},
{
"epoch": 8.77,
"learning_rate": 3.772307692307693e-06,
"loss": 0.2333,
"step": 12650
},
{
"epoch": 8.78,
"learning_rate": 3.7594871794871794e-06,
"loss": 0.2299,
"step": 12675
},
{
"epoch": 8.8,
"learning_rate": 3.7466666666666667e-06,
"loss": 0.2347,
"step": 12700
},
{
"epoch": 8.82,
"learning_rate": 3.733846153846154e-06,
"loss": 0.2348,
"step": 12725
},
{
"epoch": 8.84,
"learning_rate": 3.721025641025641e-06,
"loss": 0.228,
"step": 12750
},
{
"epoch": 8.85,
"learning_rate": 3.7082051282051284e-06,
"loss": 0.2304,
"step": 12775
},
{
"epoch": 8.87,
"learning_rate": 3.6953846153846156e-06,
"loss": 0.2353,
"step": 12800
},
{
"epoch": 8.89,
"learning_rate": 3.682564102564103e-06,
"loss": 0.2365,
"step": 12825
},
{
"epoch": 8.91,
"learning_rate": 3.66974358974359e-06,
"loss": 0.2296,
"step": 12850
},
{
"epoch": 8.92,
"learning_rate": 3.6569230769230774e-06,
"loss": 0.239,
"step": 12875
},
{
"epoch": 8.94,
"learning_rate": 3.6441025641025646e-06,
"loss": 0.2344,
"step": 12900
},
{
"epoch": 8.96,
"learning_rate": 3.631282051282052e-06,
"loss": 0.2311,
"step": 12925
},
{
"epoch": 8.97,
"learning_rate": 3.618461538461539e-06,
"loss": 0.2327,
"step": 12950
},
{
"epoch": 8.99,
"learning_rate": 3.6056410256410255e-06,
"loss": 0.2312,
"step": 12975
},
{
"epoch": 9.01,
"learning_rate": 3.5928205128205128e-06,
"loss": 0.2288,
"step": 13000
},
{
"epoch": 9.01,
"eval_cer": 17.917186078636167,
"eval_loss": 0.39013856649398804,
"eval_runtime": 159.4832,
"eval_samples_per_second": 11.826,
"eval_steps_per_second": 0.188,
"eval_wer": 46.5479571771903,
"step": 13000
},
{
"epoch": 9.03,
"learning_rate": 3.58e-06,
"loss": 0.222,
"step": 13025
},
{
"epoch": 9.04,
"learning_rate": 3.5671794871794873e-06,
"loss": 0.2322,
"step": 13050
},
{
"epoch": 9.06,
"learning_rate": 3.5543589743589745e-06,
"loss": 0.2276,
"step": 13075
},
{
"epoch": 9.08,
"learning_rate": 3.5415384615384618e-06,
"loss": 0.221,
"step": 13100
},
{
"epoch": 9.1,
"learning_rate": 3.528717948717949e-06,
"loss": 0.2222,
"step": 13125
},
{
"epoch": 9.11,
"learning_rate": 3.5158974358974363e-06,
"loss": 0.2186,
"step": 13150
},
{
"epoch": 9.13,
"learning_rate": 3.5030769230769235e-06,
"loss": 0.2205,
"step": 13175
},
{
"epoch": 9.15,
"learning_rate": 3.4902564102564108e-06,
"loss": 0.2269,
"step": 13200
},
{
"epoch": 9.16,
"learning_rate": 3.477435897435898e-06,
"loss": 0.223,
"step": 13225
},
{
"epoch": 9.18,
"learning_rate": 3.4646153846153853e-06,
"loss": 0.2321,
"step": 13250
},
{
"epoch": 9.2,
"learning_rate": 3.4517948717948717e-06,
"loss": 0.2304,
"step": 13275
},
{
"epoch": 9.22,
"learning_rate": 3.438974358974359e-06,
"loss": 0.2217,
"step": 13300
},
{
"epoch": 9.23,
"learning_rate": 3.426153846153846e-06,
"loss": 0.2216,
"step": 13325
},
{
"epoch": 9.25,
"learning_rate": 3.4133333333333334e-06,
"loss": 0.2274,
"step": 13350
},
{
"epoch": 9.27,
"learning_rate": 3.4005128205128207e-06,
"loss": 0.2267,
"step": 13375
},
{
"epoch": 9.29,
"learning_rate": 3.387692307692308e-06,
"loss": 0.2302,
"step": 13400
},
{
"epoch": 9.3,
"learning_rate": 3.374871794871795e-06,
"loss": 0.2209,
"step": 13425
},
{
"epoch": 9.32,
"learning_rate": 3.3620512820512824e-06,
"loss": 0.2262,
"step": 13450
},
{
"epoch": 9.34,
"learning_rate": 3.3492307692307696e-06,
"loss": 0.2223,
"step": 13475
},
{
"epoch": 9.36,
"learning_rate": 3.336410256410257e-06,
"loss": 0.2289,
"step": 13500
},
{
"epoch": 9.37,
"learning_rate": 3.323589743589744e-06,
"loss": 0.2267,
"step": 13525
},
{
"epoch": 9.39,
"learning_rate": 3.3107692307692314e-06,
"loss": 0.2276,
"step": 13550
},
{
"epoch": 9.41,
"learning_rate": 3.297948717948718e-06,
"loss": 0.2213,
"step": 13575
},
{
"epoch": 9.42,
"learning_rate": 3.285128205128205e-06,
"loss": 0.2319,
"step": 13600
},
{
"epoch": 9.44,
"learning_rate": 3.2723076923076923e-06,
"loss": 0.2286,
"step": 13625
},
{
"epoch": 9.46,
"learning_rate": 3.2594871794871795e-06,
"loss": 0.2252,
"step": 13650
},
{
"epoch": 9.48,
"learning_rate": 3.2466666666666668e-06,
"loss": 0.2256,
"step": 13675
},
{
"epoch": 9.49,
"learning_rate": 3.233846153846154e-06,
"loss": 0.2237,
"step": 13700
},
{
"epoch": 9.51,
"learning_rate": 3.2210256410256413e-06,
"loss": 0.2271,
"step": 13725
},
{
"epoch": 9.53,
"learning_rate": 3.2082051282051285e-06,
"loss": 0.2232,
"step": 13750
},
{
"epoch": 9.55,
"learning_rate": 3.1953846153846158e-06,
"loss": 0.2295,
"step": 13775
},
{
"epoch": 9.56,
"learning_rate": 3.182564102564103e-06,
"loss": 0.2183,
"step": 13800
},
{
"epoch": 9.58,
"learning_rate": 3.1697435897435903e-06,
"loss": 0.2304,
"step": 13825
},
{
"epoch": 9.6,
"learning_rate": 3.1569230769230775e-06,
"loss": 0.2194,
"step": 13850
},
{
"epoch": 9.62,
"learning_rate": 3.144102564102564e-06,
"loss": 0.2192,
"step": 13875
},
{
"epoch": 9.63,
"learning_rate": 3.131282051282051e-06,
"loss": 0.231,
"step": 13900
},
{
"epoch": 9.65,
"learning_rate": 3.1184615384615384e-06,
"loss": 0.2348,
"step": 13925
},
{
"epoch": 9.67,
"learning_rate": 3.1056410256410257e-06,
"loss": 0.2242,
"step": 13950
},
{
"epoch": 9.68,
"learning_rate": 3.092820512820513e-06,
"loss": 0.2294,
"step": 13975
},
{
"epoch": 9.7,
"learning_rate": 3.08e-06,
"loss": 0.2171,
"step": 14000
},
{
"epoch": 9.7,
"eval_cer": 17.626596138944105,
"eval_loss": 0.39104682207107544,
"eval_runtime": 149.7053,
"eval_samples_per_second": 12.598,
"eval_steps_per_second": 0.2,
"eval_wer": 46.02359624207997,
"step": 14000
},
{
"epoch": 9.72,
"learning_rate": 3.0671794871794874e-06,
"loss": 0.2298,
"step": 14025
},
{
"epoch": 9.74,
"learning_rate": 3.0543589743589747e-06,
"loss": 0.2239,
"step": 14050
},
{
"epoch": 9.75,
"learning_rate": 3.041538461538462e-06,
"loss": 0.2251,
"step": 14075
},
{
"epoch": 9.77,
"learning_rate": 3.028717948717949e-06,
"loss": 0.2331,
"step": 14100
},
{
"epoch": 9.79,
"learning_rate": 3.0158974358974364e-06,
"loss": 0.2199,
"step": 14125
},
{
"epoch": 9.81,
"learning_rate": 3.0030769230769236e-06,
"loss": 0.2268,
"step": 14150
},
{
"epoch": 9.82,
"learning_rate": 2.99025641025641e-06,
"loss": 0.2272,
"step": 14175
},
{
"epoch": 9.84,
"learning_rate": 2.9774358974358973e-06,
"loss": 0.2332,
"step": 14200
},
{
"epoch": 9.86,
"learning_rate": 2.9646153846153845e-06,
"loss": 0.2222,
"step": 14225
},
{
"epoch": 9.88,
"learning_rate": 2.951794871794872e-06,
"loss": 0.2254,
"step": 14250
},
{
"epoch": 9.89,
"learning_rate": 2.938974358974359e-06,
"loss": 0.2279,
"step": 14275
},
{
"epoch": 9.91,
"learning_rate": 2.9261538461538463e-06,
"loss": 0.2249,
"step": 14300
},
{
"epoch": 9.93,
"learning_rate": 2.9133333333333335e-06,
"loss": 0.2295,
"step": 14325
},
{
"epoch": 9.94,
"learning_rate": 2.9005128205128208e-06,
"loss": 0.2229,
"step": 14350
},
{
"epoch": 9.96,
"learning_rate": 2.887692307692308e-06,
"loss": 0.2295,
"step": 14375
},
{
"epoch": 9.98,
"learning_rate": 2.8748717948717953e-06,
"loss": 0.2242,
"step": 14400
},
{
"epoch": 10.0,
"learning_rate": 2.8620512820512825e-06,
"loss": 0.2291,
"step": 14425
},
{
"epoch": 10.01,
"learning_rate": 2.8492307692307698e-06,
"loss": 0.2151,
"step": 14450
},
{
"epoch": 10.03,
"learning_rate": 2.836410256410257e-06,
"loss": 0.2147,
"step": 14475
},
{
"epoch": 10.05,
"learning_rate": 2.8235897435897434e-06,
"loss": 0.2167,
"step": 14500
},
{
"epoch": 10.07,
"learning_rate": 2.8107692307692307e-06,
"loss": 0.2182,
"step": 14525
},
{
"epoch": 10.08,
"learning_rate": 2.797948717948718e-06,
"loss": 0.2181,
"step": 14550
},
{
"epoch": 10.1,
"learning_rate": 2.785128205128205e-06,
"loss": 0.2182,
"step": 14575
},
{
"epoch": 10.12,
"learning_rate": 2.7723076923076924e-06,
"loss": 0.2156,
"step": 14600
},
{
"epoch": 10.14,
"learning_rate": 2.7594871794871797e-06,
"loss": 0.2229,
"step": 14625
},
{
"epoch": 10.15,
"learning_rate": 2.746666666666667e-06,
"loss": 0.2183,
"step": 14650
},
{
"epoch": 10.17,
"learning_rate": 2.733846153846154e-06,
"loss": 0.2213,
"step": 14675
},
{
"epoch": 10.19,
"learning_rate": 2.7210256410256414e-06,
"loss": 0.2149,
"step": 14700
},
{
"epoch": 10.2,
"learning_rate": 2.7082051282051287e-06,
"loss": 0.2229,
"step": 14725
},
{
"epoch": 10.22,
"learning_rate": 2.695384615384616e-06,
"loss": 0.2203,
"step": 14750
},
{
"epoch": 10.24,
"learning_rate": 2.682564102564103e-06,
"loss": 0.2146,
"step": 14775
},
{
"epoch": 10.26,
"learning_rate": 2.6697435897435896e-06,
"loss": 0.2191,
"step": 14800
},
{
"epoch": 10.27,
"learning_rate": 2.656923076923077e-06,
"loss": 0.2274,
"step": 14825
},
{
"epoch": 10.29,
"learning_rate": 2.644102564102564e-06,
"loss": 0.2219,
"step": 14850
},
{
"epoch": 10.31,
"learning_rate": 2.6312820512820513e-06,
"loss": 0.223,
"step": 14875
},
{
"epoch": 10.33,
"learning_rate": 2.6184615384615385e-06,
"loss": 0.2166,
"step": 14900
},
{
"epoch": 10.34,
"learning_rate": 2.605641025641026e-06,
"loss": 0.2279,
"step": 14925
},
{
"epoch": 10.36,
"learning_rate": 2.592820512820513e-06,
"loss": 0.2222,
"step": 14950
},
{
"epoch": 10.38,
"learning_rate": 2.5800000000000003e-06,
"loss": 0.2194,
"step": 14975
},
{
"epoch": 10.4,
"learning_rate": 2.5671794871794875e-06,
"loss": 0.2184,
"step": 15000
},
{
"epoch": 10.4,
"eval_cer": 17.82284963444628,
"eval_loss": 0.39042380452156067,
"eval_runtime": 151.2507,
"eval_samples_per_second": 12.469,
"eval_steps_per_second": 0.198,
"eval_wer": 46.438715315708976,
"step": 15000
},
{
"epoch": 10.41,
"learning_rate": 2.5543589743589748e-06,
"loss": 0.2113,
"step": 15025
},
{
"epoch": 10.43,
"learning_rate": 2.541538461538462e-06,
"loss": 0.2196,
"step": 15050
},
{
"epoch": 10.45,
"learning_rate": 2.5287179487179493e-06,
"loss": 0.2189,
"step": 15075
},
{
"epoch": 10.46,
"learning_rate": 2.5158974358974357e-06,
"loss": 0.2185,
"step": 15100
},
{
"epoch": 10.48,
"learning_rate": 2.503076923076923e-06,
"loss": 0.2174,
"step": 15125
},
{
"epoch": 10.5,
"learning_rate": 2.4902564102564106e-06,
"loss": 0.2262,
"step": 15150
},
{
"epoch": 10.52,
"learning_rate": 2.4774358974358974e-06,
"loss": 0.2241,
"step": 15175
},
{
"epoch": 10.53,
"learning_rate": 2.4646153846153847e-06,
"loss": 0.2185,
"step": 15200
},
{
"epoch": 10.55,
"learning_rate": 2.451794871794872e-06,
"loss": 0.2246,
"step": 15225
},
{
"epoch": 10.57,
"learning_rate": 2.438974358974359e-06,
"loss": 0.2172,
"step": 15250
},
{
"epoch": 10.59,
"learning_rate": 2.426666666666667e-06,
"loss": 0.2219,
"step": 15275
},
{
"epoch": 10.6,
"learning_rate": 2.4138461538461543e-06,
"loss": 0.2155,
"step": 15300
},
{
"epoch": 10.62,
"learning_rate": 2.4010256410256415e-06,
"loss": 0.2143,
"step": 15325
},
{
"epoch": 10.64,
"learning_rate": 2.3882051282051283e-06,
"loss": 0.2209,
"step": 15350
},
{
"epoch": 10.65,
"learning_rate": 2.3753846153846156e-06,
"loss": 0.2176,
"step": 15375
},
{
"epoch": 10.67,
"learning_rate": 2.362564102564103e-06,
"loss": 0.2151,
"step": 15400
},
{
"epoch": 10.69,
"learning_rate": 2.34974358974359e-06,
"loss": 0.2188,
"step": 15425
},
{
"epoch": 10.71,
"learning_rate": 2.3369230769230773e-06,
"loss": 0.2236,
"step": 15450
},
{
"epoch": 10.72,
"learning_rate": 2.3241025641025646e-06,
"loss": 0.2176,
"step": 15475
},
{
"epoch": 10.74,
"learning_rate": 2.3112820512820514e-06,
"loss": 0.2146,
"step": 15500
},
{
"epoch": 10.76,
"learning_rate": 2.2984615384615386e-06,
"loss": 0.2198,
"step": 15525
},
{
"epoch": 10.78,
"learning_rate": 2.285641025641026e-06,
"loss": 0.216,
"step": 15550
},
{
"epoch": 10.79,
"learning_rate": 2.272820512820513e-06,
"loss": 0.2225,
"step": 15575
},
{
"epoch": 10.81,
"learning_rate": 2.2600000000000004e-06,
"loss": 0.2194,
"step": 15600
},
{
"epoch": 10.83,
"learning_rate": 2.2471794871794876e-06,
"loss": 0.2164,
"step": 15625
},
{
"epoch": 10.85,
"learning_rate": 2.2343589743589745e-06,
"loss": 0.2202,
"step": 15650
},
{
"epoch": 10.86,
"learning_rate": 2.2215384615384617e-06,
"loss": 0.2251,
"step": 15675
},
{
"epoch": 10.88,
"learning_rate": 2.208717948717949e-06,
"loss": 0.2192,
"step": 15700
},
{
"epoch": 10.9,
"learning_rate": 2.195897435897436e-06,
"loss": 0.2197,
"step": 15725
},
{
"epoch": 10.91,
"learning_rate": 2.1830769230769234e-06,
"loss": 0.2138,
"step": 15750
},
{
"epoch": 10.93,
"learning_rate": 2.1702564102564107e-06,
"loss": 0.2227,
"step": 15775
},
{
"epoch": 10.95,
"learning_rate": 2.1574358974358975e-06,
"loss": 0.2195,
"step": 15800
},
{
"epoch": 10.97,
"learning_rate": 2.1446153846153848e-06,
"loss": 0.2206,
"step": 15825
},
{
"epoch": 10.98,
"learning_rate": 2.131794871794872e-06,
"loss": 0.2108,
"step": 15850
},
{
"epoch": 11.0,
"learning_rate": 2.1189743589743593e-06,
"loss": 0.2204,
"step": 15875
},
{
"epoch": 11.02,
"learning_rate": 2.1061538461538465e-06,
"loss": 0.2156,
"step": 15900
},
{
"epoch": 11.04,
"learning_rate": 2.0933333333333338e-06,
"loss": 0.2086,
"step": 15925
},
{
"epoch": 11.05,
"learning_rate": 2.0805128205128206e-06,
"loss": 0.2094,
"step": 15950
},
{
"epoch": 11.07,
"learning_rate": 2.067692307692308e-06,
"loss": 0.2129,
"step": 15975
},
{
"epoch": 11.09,
"learning_rate": 2.054871794871795e-06,
"loss": 0.2099,
"step": 16000
},
{
"epoch": 11.09,
"eval_cer": 17.43792325056433,
"eval_loss": 0.38932469487190247,
"eval_runtime": 139.9957,
"eval_samples_per_second": 13.472,
"eval_steps_per_second": 0.214,
"eval_wer": 45.97443740441337,
"step": 16000
},
{
"epoch": 11.11,
"learning_rate": 2.0420512820512823e-06,
"loss": 0.2151,
"step": 16025
},
{
"epoch": 11.12,
"learning_rate": 2.0292307692307696e-06,
"loss": 0.2101,
"step": 16050
},
{
"epoch": 11.14,
"learning_rate": 2.016410256410257e-06,
"loss": 0.2172,
"step": 16075
},
{
"epoch": 11.16,
"learning_rate": 2.0035897435897436e-06,
"loss": 0.2127,
"step": 16100
},
{
"epoch": 11.17,
"learning_rate": 1.990769230769231e-06,
"loss": 0.2099,
"step": 16125
},
{
"epoch": 11.19,
"learning_rate": 1.977948717948718e-06,
"loss": 0.2161,
"step": 16150
},
{
"epoch": 11.21,
"learning_rate": 1.9651282051282054e-06,
"loss": 0.2148,
"step": 16175
},
{
"epoch": 11.23,
"learning_rate": 1.9523076923076926e-06,
"loss": 0.2117,
"step": 16200
},
{
"epoch": 11.24,
"learning_rate": 1.93948717948718e-06,
"loss": 0.2176,
"step": 16225
},
{
"epoch": 11.26,
"learning_rate": 1.926666666666667e-06,
"loss": 0.2103,
"step": 16250
},
{
"epoch": 11.28,
"learning_rate": 1.913846153846154e-06,
"loss": 0.2115,
"step": 16275
},
{
"epoch": 11.3,
"learning_rate": 1.9010256410256412e-06,
"loss": 0.2156,
"step": 16300
},
{
"epoch": 11.31,
"learning_rate": 1.8882051282051285e-06,
"loss": 0.2115,
"step": 16325
},
{
"epoch": 11.33,
"learning_rate": 1.8753846153846155e-06,
"loss": 0.2101,
"step": 16350
},
{
"epoch": 11.35,
"learning_rate": 1.8625641025641027e-06,
"loss": 0.2139,
"step": 16375
},
{
"epoch": 11.37,
"learning_rate": 1.84974358974359e-06,
"loss": 0.2147,
"step": 16400
},
{
"epoch": 11.38,
"learning_rate": 1.836923076923077e-06,
"loss": 0.2124,
"step": 16425
},
{
"epoch": 11.4,
"learning_rate": 1.8241025641025643e-06,
"loss": 0.2077,
"step": 16450
},
{
"epoch": 11.42,
"learning_rate": 1.8112820512820515e-06,
"loss": 0.2138,
"step": 16475
},
{
"epoch": 11.43,
"learning_rate": 1.7984615384615386e-06,
"loss": 0.2165,
"step": 16500
},
{
"epoch": 11.45,
"learning_rate": 1.7856410256410258e-06,
"loss": 0.2157,
"step": 16525
},
{
"epoch": 11.47,
"learning_rate": 1.772820512820513e-06,
"loss": 0.2029,
"step": 16550
},
{
"epoch": 11.49,
"learning_rate": 1.76e-06,
"loss": 0.2175,
"step": 16575
},
{
"epoch": 11.5,
"learning_rate": 1.7471794871794873e-06,
"loss": 0.2182,
"step": 16600
},
{
"epoch": 11.52,
"learning_rate": 1.7343589743589746e-06,
"loss": 0.2133,
"step": 16625
},
{
"epoch": 11.54,
"learning_rate": 1.7215384615384616e-06,
"loss": 0.2138,
"step": 16650
},
{
"epoch": 11.56,
"learning_rate": 1.7087179487179489e-06,
"loss": 0.2163,
"step": 16675
},
{
"epoch": 11.57,
"learning_rate": 1.6958974358974361e-06,
"loss": 0.2094,
"step": 16700
},
{
"epoch": 11.59,
"learning_rate": 1.6830769230769232e-06,
"loss": 0.2167,
"step": 16725
},
{
"epoch": 11.61,
"learning_rate": 1.6702564102564104e-06,
"loss": 0.2107,
"step": 16750
},
{
"epoch": 11.63,
"learning_rate": 1.6574358974358976e-06,
"loss": 0.2223,
"step": 16775
},
{
"epoch": 11.64,
"learning_rate": 1.6446153846153847e-06,
"loss": 0.2185,
"step": 16800
},
{
"epoch": 11.66,
"learning_rate": 1.631794871794872e-06,
"loss": 0.2144,
"step": 16825
},
{
"epoch": 11.68,
"learning_rate": 1.6189743589743592e-06,
"loss": 0.2097,
"step": 16850
},
{
"epoch": 11.69,
"learning_rate": 1.6061538461538462e-06,
"loss": 0.2164,
"step": 16875
},
{
"epoch": 11.71,
"learning_rate": 1.5933333333333335e-06,
"loss": 0.2142,
"step": 16900
},
{
"epoch": 11.73,
"learning_rate": 1.5805128205128207e-06,
"loss": 0.2133,
"step": 16925
},
{
"epoch": 11.75,
"learning_rate": 1.5676923076923078e-06,
"loss": 0.2122,
"step": 16950
},
{
"epoch": 11.76,
"learning_rate": 1.554871794871795e-06,
"loss": 0.2138,
"step": 16975
},
{
"epoch": 11.78,
"learning_rate": 1.5420512820512822e-06,
"loss": 0.216,
"step": 17000
},
{
"epoch": 11.78,
"eval_cer": 17.293891715238704,
"eval_loss": 0.3888736069202423,
"eval_runtime": 140.9328,
"eval_samples_per_second": 13.382,
"eval_steps_per_second": 0.213,
"eval_wer": 45.619401354599084,
"step": 17000
},
{
"epoch": 11.8,
"learning_rate": 1.5292307692307693e-06,
"loss": 0.2154,
"step": 17025
},
{
"epoch": 11.82,
"learning_rate": 1.5164102564102565e-06,
"loss": 0.2075,
"step": 17050
},
{
"epoch": 11.83,
"learning_rate": 1.5035897435897438e-06,
"loss": 0.2186,
"step": 17075
},
{
"epoch": 11.85,
"learning_rate": 1.4907692307692308e-06,
"loss": 0.2173,
"step": 17100
},
{
"epoch": 11.87,
"learning_rate": 1.477948717948718e-06,
"loss": 0.2146,
"step": 17125
},
{
"epoch": 11.88,
"learning_rate": 1.4651282051282053e-06,
"loss": 0.2144,
"step": 17150
},
{
"epoch": 11.9,
"learning_rate": 1.4523076923076923e-06,
"loss": 0.2201,
"step": 17175
},
{
"epoch": 11.92,
"learning_rate": 1.4394871794871796e-06,
"loss": 0.2198,
"step": 17200
},
{
"epoch": 11.94,
"learning_rate": 1.4266666666666668e-06,
"loss": 0.2107,
"step": 17225
},
{
"epoch": 11.95,
"learning_rate": 1.4138461538461539e-06,
"loss": 0.2174,
"step": 17250
},
{
"epoch": 11.97,
"learning_rate": 1.4010256410256411e-06,
"loss": 0.2123,
"step": 17275
},
{
"epoch": 11.99,
"learning_rate": 1.3882051282051284e-06,
"loss": 0.2136,
"step": 17300
},
{
"epoch": 12.01,
"learning_rate": 1.3753846153846154e-06,
"loss": 0.2169,
"step": 17325
},
{
"epoch": 12.02,
"learning_rate": 1.3625641025641027e-06,
"loss": 0.208,
"step": 17350
},
{
"epoch": 12.04,
"learning_rate": 1.34974358974359e-06,
"loss": 0.2108,
"step": 17375
},
{
"epoch": 12.06,
"learning_rate": 1.336923076923077e-06,
"loss": 0.2042,
"step": 17400
},
{
"epoch": 12.08,
"learning_rate": 1.3241025641025642e-06,
"loss": 0.2041,
"step": 17425
},
{
"epoch": 12.09,
"learning_rate": 1.3112820512820514e-06,
"loss": 0.2097,
"step": 17450
},
{
"epoch": 12.11,
"learning_rate": 1.2984615384615385e-06,
"loss": 0.2054,
"step": 17475
},
{
"epoch": 12.13,
"learning_rate": 1.2856410256410257e-06,
"loss": 0.2103,
"step": 17500
},
{
"epoch": 12.14,
"learning_rate": 1.272820512820513e-06,
"loss": 0.2131,
"step": 17525
},
{
"epoch": 12.16,
"learning_rate": 1.26e-06,
"loss": 0.2124,
"step": 17550
},
{
"epoch": 12.18,
"learning_rate": 1.2471794871794873e-06,
"loss": 0.2168,
"step": 17575
},
{
"epoch": 12.2,
"learning_rate": 1.2343589743589745e-06,
"loss": 0.2079,
"step": 17600
},
{
"epoch": 12.21,
"learning_rate": 1.2215384615384618e-06,
"loss": 0.2169,
"step": 17625
},
{
"epoch": 12.23,
"learning_rate": 1.2087179487179488e-06,
"loss": 0.2097,
"step": 17650
},
{
"epoch": 12.25,
"learning_rate": 1.195897435897436e-06,
"loss": 0.2064,
"step": 17675
},
{
"epoch": 12.27,
"learning_rate": 1.1830769230769233e-06,
"loss": 0.2071,
"step": 17700
},
{
"epoch": 12.28,
"learning_rate": 1.1702564102564103e-06,
"loss": 0.2115,
"step": 17725
},
{
"epoch": 12.3,
"learning_rate": 1.1574358974358976e-06,
"loss": 0.2157,
"step": 17750
},
{
"epoch": 12.32,
"learning_rate": 1.1446153846153848e-06,
"loss": 0.212,
"step": 17775
},
{
"epoch": 12.34,
"learning_rate": 1.1317948717948719e-06,
"loss": 0.2123,
"step": 17800
},
{
"epoch": 12.35,
"learning_rate": 1.1194871794871797e-06,
"loss": 0.2149,
"step": 17825
},
{
"epoch": 12.37,
"learning_rate": 1.1066666666666667e-06,
"loss": 0.207,
"step": 17850
},
{
"epoch": 12.39,
"learning_rate": 1.093846153846154e-06,
"loss": 0.2044,
"step": 17875
},
{
"epoch": 12.4,
"learning_rate": 1.0810256410256412e-06,
"loss": 0.2092,
"step": 17900
},
{
"epoch": 12.42,
"learning_rate": 1.0682051282051283e-06,
"loss": 0.2071,
"step": 17925
},
{
"epoch": 12.44,
"learning_rate": 1.0553846153846155e-06,
"loss": 0.2083,
"step": 17950
},
{
"epoch": 12.46,
"learning_rate": 1.0425641025641028e-06,
"loss": 0.2104,
"step": 17975
},
{
"epoch": 12.47,
"learning_rate": 1.0297435897435898e-06,
"loss": 0.2095,
"step": 18000
},
{
"epoch": 12.47,
"eval_cer": 17.443819278326202,
"eval_loss": 0.38952764868736267,
"eval_runtime": 141.0838,
"eval_samples_per_second": 13.368,
"eval_steps_per_second": 0.213,
"eval_wer": 45.78872623989513,
"step": 18000
},
{
"epoch": 12.49,
"learning_rate": 1.016923076923077e-06,
"loss": 0.2086,
"step": 18025
},
{
"epoch": 12.51,
"learning_rate": 1.0041025641025643e-06,
"loss": 0.2032,
"step": 18050
},
{
"epoch": 12.53,
"learning_rate": 9.912820512820513e-07,
"loss": 0.2056,
"step": 18075
},
{
"epoch": 12.54,
"learning_rate": 9.784615384615386e-07,
"loss": 0.2012,
"step": 18100
},
{
"epoch": 12.56,
"learning_rate": 9.656410256410258e-07,
"loss": 0.2045,
"step": 18125
},
{
"epoch": 12.58,
"learning_rate": 9.528205128205129e-07,
"loss": 0.2103,
"step": 18150
},
{
"epoch": 12.6,
"learning_rate": 9.400000000000001e-07,
"loss": 0.211,
"step": 18175
},
{
"epoch": 12.61,
"learning_rate": 9.271794871794874e-07,
"loss": 0.2083,
"step": 18200
},
{
"epoch": 12.63,
"learning_rate": 9.143589743589744e-07,
"loss": 0.2103,
"step": 18225
},
{
"epoch": 12.65,
"learning_rate": 9.015384615384616e-07,
"loss": 0.2058,
"step": 18250
},
{
"epoch": 12.66,
"learning_rate": 8.887179487179489e-07,
"loss": 0.2092,
"step": 18275
},
{
"epoch": 12.68,
"learning_rate": 8.758974358974359e-07,
"loss": 0.2134,
"step": 18300
},
{
"epoch": 12.7,
"learning_rate": 8.630769230769232e-07,
"loss": 0.2139,
"step": 18325
},
{
"epoch": 12.72,
"learning_rate": 8.502564102564104e-07,
"loss": 0.2119,
"step": 18350
},
{
"epoch": 12.73,
"learning_rate": 8.374358974358975e-07,
"loss": 0.2036,
"step": 18375
},
{
"epoch": 12.75,
"learning_rate": 8.246153846153847e-07,
"loss": 0.214,
"step": 18400
},
{
"epoch": 12.77,
"learning_rate": 8.11794871794872e-07,
"loss": 0.2136,
"step": 18425
},
{
"epoch": 12.79,
"learning_rate": 7.98974358974359e-07,
"loss": 0.2084,
"step": 18450
},
{
"epoch": 12.8,
"learning_rate": 7.861538461538462e-07,
"loss": 0.2132,
"step": 18475
},
{
"epoch": 12.82,
"learning_rate": 7.733333333333335e-07,
"loss": 0.2043,
"step": 18500
},
{
"epoch": 12.84,
"learning_rate": 7.605128205128205e-07,
"loss": 0.2136,
"step": 18525
},
{
"epoch": 12.86,
"learning_rate": 7.476923076923078e-07,
"loss": 0.2053,
"step": 18550
},
{
"epoch": 12.87,
"learning_rate": 7.34871794871795e-07,
"loss": 0.2134,
"step": 18575
},
{
"epoch": 12.89,
"learning_rate": 7.22051282051282e-07,
"loss": 0.2126,
"step": 18600
},
{
"epoch": 12.91,
"learning_rate": 7.092307692307693e-07,
"loss": 0.2045,
"step": 18625
},
{
"epoch": 12.92,
"learning_rate": 6.964102564102565e-07,
"loss": 0.2138,
"step": 18650
},
{
"epoch": 12.94,
"learning_rate": 6.835897435897436e-07,
"loss": 0.2157,
"step": 18675
},
{
"epoch": 12.96,
"learning_rate": 6.707692307692308e-07,
"loss": 0.216,
"step": 18700
},
{
"epoch": 12.98,
"learning_rate": 6.579487179487181e-07,
"loss": 0.2097,
"step": 18725
},
{
"epoch": 12.99,
"learning_rate": 6.451282051282051e-07,
"loss": 0.2159,
"step": 18750
},
{
"epoch": 13.01,
"learning_rate": 6.323076923076924e-07,
"loss": 0.1995,
"step": 18775
},
{
"epoch": 13.03,
"learning_rate": 6.194871794871796e-07,
"loss": 0.2117,
"step": 18800
},
{
"epoch": 13.05,
"learning_rate": 6.066666666666668e-07,
"loss": 0.2154,
"step": 18825
},
{
"epoch": 13.06,
"learning_rate": 5.938461538461539e-07,
"loss": 0.2058,
"step": 18850
},
{
"epoch": 13.08,
"learning_rate": 5.810256410256411e-07,
"loss": 0.212,
"step": 18875
},
{
"epoch": 13.1,
"learning_rate": 5.682051282051283e-07,
"loss": 0.2053,
"step": 18900
},
{
"epoch": 13.12,
"learning_rate": 5.553846153846154e-07,
"loss": 0.2022,
"step": 18925
},
{
"epoch": 13.13,
"learning_rate": 5.425641025641027e-07,
"loss": 0.2072,
"step": 18950
},
{
"epoch": 13.15,
"learning_rate": 5.297435897435898e-07,
"loss": 0.2017,
"step": 18975
},
{
"epoch": 13.17,
"learning_rate": 5.16923076923077e-07,
"loss": 0.2056,
"step": 19000
},
{
"epoch": 13.17,
"eval_cer": 17.288837977157105,
"eval_loss": 0.3881835341453552,
"eval_runtime": 141.1347,
"eval_samples_per_second": 13.363,
"eval_steps_per_second": 0.213,
"eval_wer": 45.60847716845095,
"step": 19000
},
{
"epoch": 13.18,
"learning_rate": 5.041025641025642e-07,
"loss": 0.2008,
"step": 19025
},
{
"epoch": 13.2,
"learning_rate": 4.912820512820513e-07,
"loss": 0.2086,
"step": 19050
},
{
"epoch": 13.22,
"learning_rate": 4.784615384615385e-07,
"loss": 0.1969,
"step": 19075
},
{
"epoch": 13.24,
"learning_rate": 4.656410256410257e-07,
"loss": 0.2077,
"step": 19100
},
{
"epoch": 13.25,
"learning_rate": 4.528205128205129e-07,
"loss": 0.2061,
"step": 19125
},
{
"epoch": 13.27,
"learning_rate": 4.4e-07,
"loss": 0.2096,
"step": 19150
},
{
"epoch": 13.29,
"learning_rate": 4.271794871794872e-07,
"loss": 0.205,
"step": 19175
},
{
"epoch": 13.31,
"learning_rate": 4.143589743589744e-07,
"loss": 0.202,
"step": 19200
},
{
"epoch": 13.32,
"learning_rate": 4.0153846153846155e-07,
"loss": 0.2068,
"step": 19225
},
{
"epoch": 13.34,
"learning_rate": 3.8871794871794875e-07,
"loss": 0.2063,
"step": 19250
},
{
"epoch": 13.36,
"learning_rate": 3.7589743589743594e-07,
"loss": 0.2087,
"step": 19275
},
{
"epoch": 13.37,
"learning_rate": 3.630769230769231e-07,
"loss": 0.2052,
"step": 19300
},
{
"epoch": 13.39,
"learning_rate": 3.502564102564103e-07,
"loss": 0.206,
"step": 19325
},
{
"epoch": 13.41,
"learning_rate": 3.374358974358975e-07,
"loss": 0.2082,
"step": 19350
},
{
"epoch": 13.43,
"learning_rate": 3.246153846153846e-07,
"loss": 0.2068,
"step": 19375
},
{
"epoch": 13.44,
"learning_rate": 3.117948717948718e-07,
"loss": 0.2104,
"step": 19400
},
{
"epoch": 13.46,
"learning_rate": 2.98974358974359e-07,
"loss": 0.2128,
"step": 19425
},
{
"epoch": 13.48,
"learning_rate": 2.861538461538462e-07,
"loss": 0.2034,
"step": 19450
},
{
"epoch": 13.5,
"learning_rate": 2.7333333333333335e-07,
"loss": 0.2062,
"step": 19475
},
{
"epoch": 13.51,
"learning_rate": 2.6051282051282054e-07,
"loss": 0.2019,
"step": 19500
},
{
"epoch": 13.53,
"learning_rate": 2.4769230769230774e-07,
"loss": 0.2113,
"step": 19525
},
{
"epoch": 13.55,
"learning_rate": 2.348717948717949e-07,
"loss": 0.2041,
"step": 19550
},
{
"epoch": 13.57,
"learning_rate": 2.2205128205128205e-07,
"loss": 0.2043,
"step": 19575
},
{
"epoch": 13.58,
"learning_rate": 2.0923076923076924e-07,
"loss": 0.2062,
"step": 19600
},
{
"epoch": 13.6,
"learning_rate": 1.9641025641025644e-07,
"loss": 0.2045,
"step": 19625
},
{
"epoch": 13.62,
"learning_rate": 1.8358974358974358e-07,
"loss": 0.207,
"step": 19650
},
{
"epoch": 13.63,
"learning_rate": 1.7076923076923077e-07,
"loss": 0.2088,
"step": 19675
},
{
"epoch": 13.65,
"learning_rate": 1.5794871794871797e-07,
"loss": 0.2085,
"step": 19700
},
{
"epoch": 13.67,
"learning_rate": 1.4512820512820514e-07,
"loss": 0.2049,
"step": 19725
},
{
"epoch": 13.69,
"learning_rate": 1.323076923076923e-07,
"loss": 0.2122,
"step": 19750
},
{
"epoch": 13.7,
"learning_rate": 1.194871794871795e-07,
"loss": 0.2023,
"step": 19775
},
{
"epoch": 13.72,
"learning_rate": 1.0666666666666667e-07,
"loss": 0.2104,
"step": 19800
},
{
"epoch": 13.74,
"learning_rate": 9.384615384615386e-08,
"loss": 0.2012,
"step": 19825
},
{
"epoch": 13.76,
"learning_rate": 8.102564102564103e-08,
"loss": 0.2117,
"step": 19850
},
{
"epoch": 13.77,
"learning_rate": 6.820512820512821e-08,
"loss": 0.2082,
"step": 19875
},
{
"epoch": 13.79,
"learning_rate": 5.538461538461538e-08,
"loss": 0.2046,
"step": 19900
},
{
"epoch": 13.81,
"learning_rate": 4.2564102564102564e-08,
"loss": 0.2088,
"step": 19925
},
{
"epoch": 13.83,
"learning_rate": 2.9743589743589746e-08,
"loss": 0.2068,
"step": 19950
},
{
"epoch": 13.84,
"learning_rate": 1.6923076923076925e-08,
"loss": 0.2098,
"step": 19975
},
{
"epoch": 13.86,
"learning_rate": 4.102564102564102e-09,
"loss": 0.2064,
"step": 20000
},
{
"epoch": 13.86,
"eval_cer": 17.33769077861258,
"eval_loss": 0.3884678781032562,
"eval_runtime": 140.6948,
"eval_samples_per_second": 13.405,
"eval_steps_per_second": 0.213,
"eval_wer": 45.51015949311776,
"step": 20000
},
{
"epoch": 13.86,
"step": 20000,
"total_flos": 3.150929254404096e+19,
"train_loss": 0.3324837454319,
"train_runtime": 17628.1069,
"train_samples_per_second": 72.611,
"train_steps_per_second": 1.135
},
{
"epoch": 13.86,
"eval_cer": 17.33769077861258,
"eval_loss": 0.3884678781032562,
"eval_runtime": 139.1963,
"eval_samples_per_second": 13.549,
"eval_steps_per_second": 0.216,
"eval_wer": 45.51015949311776,
"step": 20000
}
],
"max_steps": 20000,
"num_train_epochs": 14,
"total_flos": 3.150929254404096e+19,
"trial_name": null,
"trial_params": null
}