whisper-base-eu-cv16_1 / trainer_state.json
zuazo's picture
End of training
a267c05 verified
raw
history blame contribute delete
No virus
204 kB
{
"best_metric": 16.17652806002814,
"best_model_checkpoint": "./checkpoint-26000",
"epoch": 400.0,
"eval_steps": 1000,
"global_step": 40000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.25,
"learning_rate": 1.2000000000000002e-06,
"loss": 2.0919,
"step": 25
},
{
"epoch": 0.5,
"learning_rate": 2.4500000000000003e-06,
"loss": 1.6487,
"step": 50
},
{
"epoch": 0.75,
"learning_rate": 3.7e-06,
"loss": 1.1675,
"step": 75
},
{
"epoch": 1.0,
"learning_rate": 4.950000000000001e-06,
"loss": 0.8978,
"step": 100
},
{
"epoch": 1.25,
"learning_rate": 6.2e-06,
"loss": 0.7365,
"step": 125
},
{
"epoch": 1.5,
"learning_rate": 7.45e-06,
"loss": 0.6371,
"step": 150
},
{
"epoch": 1.75,
"learning_rate": 8.7e-06,
"loss": 0.5723,
"step": 175
},
{
"epoch": 2.0,
"learning_rate": 9.950000000000001e-06,
"loss": 0.5174,
"step": 200
},
{
"epoch": 2.25,
"learning_rate": 1.1200000000000001e-05,
"loss": 0.4378,
"step": 225
},
{
"epoch": 2.5,
"learning_rate": 1.2450000000000001e-05,
"loss": 0.4126,
"step": 250
},
{
"epoch": 2.75,
"learning_rate": 1.3700000000000001e-05,
"loss": 0.3876,
"step": 275
},
{
"epoch": 3.0,
"learning_rate": 1.4950000000000001e-05,
"loss": 0.3605,
"step": 300
},
{
"epoch": 3.25,
"learning_rate": 1.62e-05,
"loss": 0.2987,
"step": 325
},
{
"epoch": 3.5,
"learning_rate": 1.745e-05,
"loss": 0.2859,
"step": 350
},
{
"epoch": 3.75,
"learning_rate": 1.87e-05,
"loss": 0.2754,
"step": 375
},
{
"epoch": 4.0,
"learning_rate": 1.995e-05,
"loss": 0.2734,
"step": 400
},
{
"epoch": 4.25,
"learning_rate": 2.12e-05,
"loss": 0.2129,
"step": 425
},
{
"epoch": 4.5,
"learning_rate": 2.245e-05,
"loss": 0.2011,
"step": 450
},
{
"epoch": 4.75,
"learning_rate": 2.37e-05,
"loss": 0.2023,
"step": 475
},
{
"epoch": 5.0,
"learning_rate": 2.495e-05,
"loss": 0.1981,
"step": 500
},
{
"epoch": 5.25,
"learning_rate": 2.498481012658228e-05,
"loss": 0.1425,
"step": 525
},
{
"epoch": 5.5,
"learning_rate": 2.4968987341772155e-05,
"loss": 0.14,
"step": 550
},
{
"epoch": 5.75,
"learning_rate": 2.4953164556962027e-05,
"loss": 0.1406,
"step": 575
},
{
"epoch": 6.0,
"learning_rate": 2.4937341772151902e-05,
"loss": 0.1418,
"step": 600
},
{
"epoch": 6.25,
"learning_rate": 2.4921518987341774e-05,
"loss": 0.0935,
"step": 625
},
{
"epoch": 6.5,
"learning_rate": 2.4905696202531646e-05,
"loss": 0.0949,
"step": 650
},
{
"epoch": 6.75,
"learning_rate": 2.488987341772152e-05,
"loss": 0.0966,
"step": 675
},
{
"epoch": 7.0,
"learning_rate": 2.4874050632911393e-05,
"loss": 0.0951,
"step": 700
},
{
"epoch": 7.25,
"learning_rate": 2.485822784810127e-05,
"loss": 0.0582,
"step": 725
},
{
"epoch": 7.5,
"learning_rate": 2.484240506329114e-05,
"loss": 0.0607,
"step": 750
},
{
"epoch": 7.75,
"learning_rate": 2.4826582278481016e-05,
"loss": 0.0615,
"step": 775
},
{
"epoch": 8.0,
"learning_rate": 2.4810759493670887e-05,
"loss": 0.0622,
"step": 800
},
{
"epoch": 8.25,
"learning_rate": 2.479493670886076e-05,
"loss": 0.0359,
"step": 825
},
{
"epoch": 8.5,
"learning_rate": 2.4779113924050635e-05,
"loss": 0.0361,
"step": 850
},
{
"epoch": 8.75,
"learning_rate": 2.4763291139240506e-05,
"loss": 0.0384,
"step": 875
},
{
"epoch": 9.0,
"learning_rate": 2.474746835443038e-05,
"loss": 0.0376,
"step": 900
},
{
"epoch": 9.25,
"learning_rate": 2.4731645569620254e-05,
"loss": 0.0221,
"step": 925
},
{
"epoch": 9.5,
"learning_rate": 2.471582278481013e-05,
"loss": 0.0217,
"step": 950
},
{
"epoch": 9.75,
"learning_rate": 2.47e-05,
"loss": 0.0225,
"step": 975
},
{
"epoch": 10.0,
"learning_rate": 2.4684177215189873e-05,
"loss": 0.0225,
"step": 1000
},
{
"epoch": 10.0,
"eval_loss": 0.3059324324131012,
"eval_runtime": 169.4514,
"eval_samples_per_second": 75.196,
"eval_steps_per_second": 1.18,
"eval_wer": 19.08120994216039,
"step": 1000
},
{
"epoch": 10.25,
"learning_rate": 2.4668354430379748e-05,
"loss": 0.014,
"step": 1025
},
{
"epoch": 10.5,
"learning_rate": 2.465253164556962e-05,
"loss": 0.0151,
"step": 1050
},
{
"epoch": 10.75,
"learning_rate": 2.4636708860759495e-05,
"loss": 0.0146,
"step": 1075
},
{
"epoch": 11.0,
"learning_rate": 2.4620886075949367e-05,
"loss": 0.014,
"step": 1100
},
{
"epoch": 11.25,
"learning_rate": 2.4605063291139242e-05,
"loss": 0.0101,
"step": 1125
},
{
"epoch": 11.5,
"learning_rate": 2.4589240506329114e-05,
"loss": 0.0098,
"step": 1150
},
{
"epoch": 11.75,
"learning_rate": 2.457341772151899e-05,
"loss": 0.0091,
"step": 1175
},
{
"epoch": 12.0,
"learning_rate": 2.455759493670886e-05,
"loss": 0.0096,
"step": 1200
},
{
"epoch": 12.25,
"learning_rate": 2.4541772151898733e-05,
"loss": 0.0075,
"step": 1225
},
{
"epoch": 12.5,
"learning_rate": 2.4525949367088608e-05,
"loss": 0.007,
"step": 1250
},
{
"epoch": 12.75,
"learning_rate": 2.451012658227848e-05,
"loss": 0.0069,
"step": 1275
},
{
"epoch": 13.0,
"learning_rate": 2.4494303797468355e-05,
"loss": 0.0074,
"step": 1300
},
{
"epoch": 13.25,
"learning_rate": 2.447848101265823e-05,
"loss": 0.0058,
"step": 1325
},
{
"epoch": 13.5,
"learning_rate": 2.4462658227848103e-05,
"loss": 0.0057,
"step": 1350
},
{
"epoch": 13.75,
"learning_rate": 2.4446835443037978e-05,
"loss": 0.0056,
"step": 1375
},
{
"epoch": 14.0,
"learning_rate": 2.443101265822785e-05,
"loss": 0.006,
"step": 1400
},
{
"epoch": 14.25,
"learning_rate": 2.4415189873417725e-05,
"loss": 0.0051,
"step": 1425
},
{
"epoch": 14.5,
"learning_rate": 2.4399367088607597e-05,
"loss": 0.0048,
"step": 1450
},
{
"epoch": 14.75,
"learning_rate": 2.438354430379747e-05,
"loss": 0.0054,
"step": 1475
},
{
"epoch": 15.0,
"learning_rate": 2.4367721518987344e-05,
"loss": 0.0067,
"step": 1500
},
{
"epoch": 15.25,
"learning_rate": 2.4351898734177216e-05,
"loss": 0.0059,
"step": 1525
},
{
"epoch": 15.5,
"learning_rate": 2.433607594936709e-05,
"loss": 0.0053,
"step": 1550
},
{
"epoch": 15.75,
"learning_rate": 2.4320253164556963e-05,
"loss": 0.005,
"step": 1575
},
{
"epoch": 16.0,
"learning_rate": 2.4304430379746838e-05,
"loss": 0.0053,
"step": 1600
},
{
"epoch": 16.25,
"learning_rate": 2.428860759493671e-05,
"loss": 0.0049,
"step": 1625
},
{
"epoch": 16.5,
"learning_rate": 2.4272784810126585e-05,
"loss": 0.0064,
"step": 1650
},
{
"epoch": 16.75,
"learning_rate": 2.4256962025316457e-05,
"loss": 0.0066,
"step": 1675
},
{
"epoch": 17.0,
"learning_rate": 2.424113924050633e-05,
"loss": 0.0071,
"step": 1700
},
{
"epoch": 17.25,
"learning_rate": 2.4225316455696204e-05,
"loss": 0.0069,
"step": 1725
},
{
"epoch": 17.5,
"learning_rate": 2.4209493670886076e-05,
"loss": 0.0063,
"step": 1750
},
{
"epoch": 17.75,
"learning_rate": 2.419367088607595e-05,
"loss": 0.0056,
"step": 1775
},
{
"epoch": 18.0,
"learning_rate": 2.4177848101265823e-05,
"loss": 0.0068,
"step": 1800
},
{
"epoch": 18.25,
"learning_rate": 2.41620253164557e-05,
"loss": 0.0059,
"step": 1825
},
{
"epoch": 18.5,
"learning_rate": 2.414620253164557e-05,
"loss": 0.0052,
"step": 1850
},
{
"epoch": 18.75,
"learning_rate": 2.4130379746835442e-05,
"loss": 0.0052,
"step": 1875
},
{
"epoch": 19.0,
"learning_rate": 2.4114556962025318e-05,
"loss": 0.005,
"step": 1900
},
{
"epoch": 19.25,
"learning_rate": 2.409873417721519e-05,
"loss": 0.0037,
"step": 1925
},
{
"epoch": 19.5,
"learning_rate": 2.4082911392405065e-05,
"loss": 0.0034,
"step": 1950
},
{
"epoch": 19.75,
"learning_rate": 2.4067088607594937e-05,
"loss": 0.0035,
"step": 1975
},
{
"epoch": 20.0,
"learning_rate": 2.4051265822784812e-05,
"loss": 0.0037,
"step": 2000
},
{
"epoch": 20.0,
"eval_loss": 0.35300523042678833,
"eval_runtime": 158.6202,
"eval_samples_per_second": 80.33,
"eval_steps_per_second": 1.261,
"eval_wer": 18.461778958886978,
"step": 2000
},
{
"epoch": 20.25,
"learning_rate": 2.4035443037974684e-05,
"loss": 0.0029,
"step": 2025
},
{
"epoch": 20.5,
"learning_rate": 2.4019620253164556e-05,
"loss": 0.0029,
"step": 2050
},
{
"epoch": 20.75,
"learning_rate": 2.400379746835443e-05,
"loss": 0.0029,
"step": 2075
},
{
"epoch": 21.0,
"learning_rate": 2.3987974683544303e-05,
"loss": 0.0027,
"step": 2100
},
{
"epoch": 21.25,
"learning_rate": 2.3972151898734178e-05,
"loss": 0.0023,
"step": 2125
},
{
"epoch": 21.5,
"learning_rate": 2.3956329113924053e-05,
"loss": 0.0022,
"step": 2150
},
{
"epoch": 21.75,
"learning_rate": 2.3940506329113925e-05,
"loss": 0.0022,
"step": 2175
},
{
"epoch": 22.0,
"learning_rate": 2.39246835443038e-05,
"loss": 0.0024,
"step": 2200
},
{
"epoch": 22.25,
"learning_rate": 2.3908860759493672e-05,
"loss": 0.0019,
"step": 2225
},
{
"epoch": 22.5,
"learning_rate": 2.3893037974683548e-05,
"loss": 0.0017,
"step": 2250
},
{
"epoch": 22.75,
"learning_rate": 2.387721518987342e-05,
"loss": 0.0019,
"step": 2275
},
{
"epoch": 23.0,
"learning_rate": 2.3861392405063295e-05,
"loss": 0.0029,
"step": 2300
},
{
"epoch": 23.25,
"learning_rate": 2.3845569620253167e-05,
"loss": 0.0031,
"step": 2325
},
{
"epoch": 23.5,
"learning_rate": 2.382974683544304e-05,
"loss": 0.003,
"step": 2350
},
{
"epoch": 23.75,
"learning_rate": 2.3813924050632914e-05,
"loss": 0.0033,
"step": 2375
},
{
"epoch": 24.0,
"learning_rate": 2.3798101265822786e-05,
"loss": 0.0037,
"step": 2400
},
{
"epoch": 24.25,
"learning_rate": 2.378227848101266e-05,
"loss": 0.0036,
"step": 2425
},
{
"epoch": 24.5,
"learning_rate": 2.3766455696202533e-05,
"loss": 0.0038,
"step": 2450
},
{
"epoch": 24.75,
"learning_rate": 2.3750632911392408e-05,
"loss": 0.0043,
"step": 2475
},
{
"epoch": 25.0,
"learning_rate": 2.373481012658228e-05,
"loss": 0.005,
"step": 2500
},
{
"epoch": 25.25,
"learning_rate": 2.3718987341772152e-05,
"loss": 0.0043,
"step": 2525
},
{
"epoch": 25.5,
"learning_rate": 2.3703164556962027e-05,
"loss": 0.0042,
"step": 2550
},
{
"epoch": 25.75,
"learning_rate": 2.36873417721519e-05,
"loss": 0.0039,
"step": 2575
},
{
"epoch": 26.0,
"learning_rate": 2.3671518987341774e-05,
"loss": 0.0045,
"step": 2600
},
{
"epoch": 26.25,
"learning_rate": 2.3655696202531646e-05,
"loss": 0.0033,
"step": 2625
},
{
"epoch": 26.5,
"learning_rate": 2.363987341772152e-05,
"loss": 0.0033,
"step": 2650
},
{
"epoch": 26.75,
"learning_rate": 2.3624050632911393e-05,
"loss": 0.0041,
"step": 2675
},
{
"epoch": 27.0,
"learning_rate": 2.3608227848101265e-05,
"loss": 0.0041,
"step": 2700
},
{
"epoch": 27.25,
"learning_rate": 2.359240506329114e-05,
"loss": 0.0035,
"step": 2725
},
{
"epoch": 27.5,
"learning_rate": 2.3576582278481012e-05,
"loss": 0.0035,
"step": 2750
},
{
"epoch": 27.75,
"learning_rate": 2.3560759493670888e-05,
"loss": 0.0028,
"step": 2775
},
{
"epoch": 28.0,
"learning_rate": 2.354493670886076e-05,
"loss": 0.0029,
"step": 2800
},
{
"epoch": 28.25,
"learning_rate": 2.3529113924050635e-05,
"loss": 0.0024,
"step": 2825
},
{
"epoch": 28.5,
"learning_rate": 2.3513291139240507e-05,
"loss": 0.0021,
"step": 2850
},
{
"epoch": 28.75,
"learning_rate": 2.349746835443038e-05,
"loss": 0.002,
"step": 2875
},
{
"epoch": 29.0,
"learning_rate": 2.3481645569620254e-05,
"loss": 0.0019,
"step": 2900
},
{
"epoch": 29.25,
"learning_rate": 2.3465822784810126e-05,
"loss": 0.0015,
"step": 2925
},
{
"epoch": 29.5,
"learning_rate": 2.345e-05,
"loss": 0.0013,
"step": 2950
},
{
"epoch": 29.75,
"learning_rate": 2.3434177215189876e-05,
"loss": 0.0012,
"step": 2975
},
{
"epoch": 30.0,
"learning_rate": 2.3418354430379748e-05,
"loss": 0.0012,
"step": 3000
},
{
"epoch": 30.0,
"eval_loss": 0.37241747975349426,
"eval_runtime": 159.669,
"eval_samples_per_second": 79.803,
"eval_steps_per_second": 1.253,
"eval_wer": 17.93321088010005,
"step": 3000
},
{
"epoch": 30.25,
"learning_rate": 2.3402531645569623e-05,
"loss": 0.001,
"step": 3025
},
{
"epoch": 30.5,
"learning_rate": 2.3386708860759495e-05,
"loss": 0.0009,
"step": 3050
},
{
"epoch": 30.75,
"learning_rate": 2.337088607594937e-05,
"loss": 0.0009,
"step": 3075
},
{
"epoch": 31.0,
"learning_rate": 2.3355063291139242e-05,
"loss": 0.0008,
"step": 3100
},
{
"epoch": 31.25,
"learning_rate": 2.3339240506329117e-05,
"loss": 0.0007,
"step": 3125
},
{
"epoch": 31.5,
"learning_rate": 2.332341772151899e-05,
"loss": 0.0007,
"step": 3150
},
{
"epoch": 31.75,
"learning_rate": 2.330759493670886e-05,
"loss": 0.0007,
"step": 3175
},
{
"epoch": 32.0,
"learning_rate": 2.3291772151898736e-05,
"loss": 0.0007,
"step": 3200
},
{
"epoch": 32.25,
"learning_rate": 2.327594936708861e-05,
"loss": 0.0006,
"step": 3225
},
{
"epoch": 32.5,
"learning_rate": 2.3260126582278484e-05,
"loss": 0.0006,
"step": 3250
},
{
"epoch": 32.75,
"learning_rate": 2.3244303797468355e-05,
"loss": 0.0006,
"step": 3275
},
{
"epoch": 33.0,
"learning_rate": 2.322848101265823e-05,
"loss": 0.0006,
"step": 3300
},
{
"epoch": 33.25,
"learning_rate": 2.3212658227848103e-05,
"loss": 0.0006,
"step": 3325
},
{
"epoch": 33.5,
"learning_rate": 2.3196835443037975e-05,
"loss": 0.0006,
"step": 3350
},
{
"epoch": 33.75,
"learning_rate": 2.318101265822785e-05,
"loss": 0.0006,
"step": 3375
},
{
"epoch": 34.0,
"learning_rate": 2.316518987341772e-05,
"loss": 0.0006,
"step": 3400
},
{
"epoch": 34.25,
"learning_rate": 2.3149367088607597e-05,
"loss": 0.0005,
"step": 3425
},
{
"epoch": 34.5,
"learning_rate": 2.313354430379747e-05,
"loss": 0.0005,
"step": 3450
},
{
"epoch": 34.75,
"learning_rate": 2.3117721518987344e-05,
"loss": 0.0005,
"step": 3475
},
{
"epoch": 35.0,
"learning_rate": 2.3101898734177216e-05,
"loss": 0.0005,
"step": 3500
},
{
"epoch": 35.25,
"learning_rate": 2.3086075949367088e-05,
"loss": 0.0005,
"step": 3525
},
{
"epoch": 35.5,
"learning_rate": 2.3070253164556963e-05,
"loss": 0.0005,
"step": 3550
},
{
"epoch": 35.75,
"learning_rate": 2.3054430379746835e-05,
"loss": 0.0005,
"step": 3575
},
{
"epoch": 36.0,
"learning_rate": 2.303860759493671e-05,
"loss": 0.0005,
"step": 3600
},
{
"epoch": 36.25,
"learning_rate": 2.3022784810126582e-05,
"loss": 0.0005,
"step": 3625
},
{
"epoch": 36.5,
"learning_rate": 2.3006962025316457e-05,
"loss": 0.0004,
"step": 3650
},
{
"epoch": 36.75,
"learning_rate": 2.299113924050633e-05,
"loss": 0.0004,
"step": 3675
},
{
"epoch": 37.0,
"learning_rate": 2.29753164556962e-05,
"loss": 0.0004,
"step": 3700
},
{
"epoch": 37.25,
"learning_rate": 2.2959493670886076e-05,
"loss": 0.0004,
"step": 3725
},
{
"epoch": 37.5,
"learning_rate": 2.2943670886075948e-05,
"loss": 0.0004,
"step": 3750
},
{
"epoch": 37.75,
"learning_rate": 2.2927848101265823e-05,
"loss": 0.0004,
"step": 3775
},
{
"epoch": 38.0,
"learning_rate": 2.29120253164557e-05,
"loss": 0.0004,
"step": 3800
},
{
"epoch": 38.25,
"learning_rate": 2.289620253164557e-05,
"loss": 0.0004,
"step": 3825
},
{
"epoch": 38.5,
"learning_rate": 2.2880379746835446e-05,
"loss": 0.0004,
"step": 3850
},
{
"epoch": 38.75,
"learning_rate": 2.2864556962025318e-05,
"loss": 0.0004,
"step": 3875
},
{
"epoch": 39.0,
"learning_rate": 2.2848734177215193e-05,
"loss": 0.0004,
"step": 3900
},
{
"epoch": 39.25,
"learning_rate": 2.2832911392405065e-05,
"loss": 0.0004,
"step": 3925
},
{
"epoch": 39.5,
"learning_rate": 2.281708860759494e-05,
"loss": 0.0004,
"step": 3950
},
{
"epoch": 39.75,
"learning_rate": 2.2801265822784812e-05,
"loss": 0.0004,
"step": 3975
},
{
"epoch": 40.0,
"learning_rate": 2.2785443037974684e-05,
"loss": 0.0004,
"step": 4000
},
{
"epoch": 40.0,
"eval_loss": 0.4025060534477234,
"eval_runtime": 158.6218,
"eval_samples_per_second": 80.329,
"eval_steps_per_second": 1.261,
"eval_wer": 17.89510708144443,
"step": 4000
},
{
"epoch": 40.25,
"learning_rate": 2.276962025316456e-05,
"loss": 0.0003,
"step": 4025
},
{
"epoch": 40.5,
"learning_rate": 2.275379746835443e-05,
"loss": 0.0003,
"step": 4050
},
{
"epoch": 40.75,
"learning_rate": 2.2737974683544306e-05,
"loss": 0.0003,
"step": 4075
},
{
"epoch": 41.0,
"learning_rate": 2.2722151898734178e-05,
"loss": 0.0004,
"step": 4100
},
{
"epoch": 41.25,
"learning_rate": 2.2706329113924053e-05,
"loss": 0.0003,
"step": 4125
},
{
"epoch": 41.5,
"learning_rate": 2.2690506329113925e-05,
"loss": 0.0003,
"step": 4150
},
{
"epoch": 41.75,
"learning_rate": 2.2674683544303797e-05,
"loss": 0.0003,
"step": 4175
},
{
"epoch": 42.0,
"learning_rate": 2.2658860759493672e-05,
"loss": 0.0003,
"step": 4200
},
{
"epoch": 42.25,
"learning_rate": 2.2643037974683544e-05,
"loss": 0.0003,
"step": 4225
},
{
"epoch": 42.5,
"learning_rate": 2.262721518987342e-05,
"loss": 0.0003,
"step": 4250
},
{
"epoch": 42.75,
"learning_rate": 2.261139240506329e-05,
"loss": 0.0003,
"step": 4275
},
{
"epoch": 43.0,
"learning_rate": 2.2595569620253167e-05,
"loss": 0.0003,
"step": 4300
},
{
"epoch": 43.25,
"learning_rate": 2.257974683544304e-05,
"loss": 0.0003,
"step": 4325
},
{
"epoch": 43.5,
"learning_rate": 2.256392405063291e-05,
"loss": 0.0003,
"step": 4350
},
{
"epoch": 43.75,
"learning_rate": 2.2548101265822786e-05,
"loss": 0.0003,
"step": 4375
},
{
"epoch": 44.0,
"learning_rate": 2.2532278481012658e-05,
"loss": 0.0003,
"step": 4400
},
{
"epoch": 44.25,
"learning_rate": 2.2516455696202533e-05,
"loss": 0.0003,
"step": 4425
},
{
"epoch": 44.5,
"learning_rate": 2.2500632911392405e-05,
"loss": 0.0003,
"step": 4450
},
{
"epoch": 44.75,
"learning_rate": 2.248481012658228e-05,
"loss": 0.0003,
"step": 4475
},
{
"epoch": 45.0,
"learning_rate": 2.2468987341772152e-05,
"loss": 0.0003,
"step": 4500
},
{
"epoch": 45.25,
"learning_rate": 2.2453164556962024e-05,
"loss": 0.0003,
"step": 4525
},
{
"epoch": 45.5,
"learning_rate": 2.24373417721519e-05,
"loss": 0.0003,
"step": 4550
},
{
"epoch": 45.75,
"learning_rate": 2.242151898734177e-05,
"loss": 0.0002,
"step": 4575
},
{
"epoch": 46.0,
"learning_rate": 2.240569620253165e-05,
"loss": 0.0003,
"step": 4600
},
{
"epoch": 46.25,
"learning_rate": 2.238987341772152e-05,
"loss": 0.0002,
"step": 4625
},
{
"epoch": 46.5,
"learning_rate": 2.2374050632911393e-05,
"loss": 0.0002,
"step": 4650
},
{
"epoch": 46.75,
"learning_rate": 2.235822784810127e-05,
"loss": 0.0002,
"step": 4675
},
{
"epoch": 47.0,
"learning_rate": 2.234240506329114e-05,
"loss": 0.0002,
"step": 4700
},
{
"epoch": 47.25,
"learning_rate": 2.2326582278481016e-05,
"loss": 0.0002,
"step": 4725
},
{
"epoch": 47.5,
"learning_rate": 2.2310759493670888e-05,
"loss": 0.0002,
"step": 4750
},
{
"epoch": 47.75,
"learning_rate": 2.2294936708860763e-05,
"loss": 0.0002,
"step": 4775
},
{
"epoch": 48.0,
"learning_rate": 2.2279113924050635e-05,
"loss": 0.0002,
"step": 4800
},
{
"epoch": 48.25,
"learning_rate": 2.2263291139240507e-05,
"loss": 0.0002,
"step": 4825
},
{
"epoch": 48.5,
"learning_rate": 2.2247468354430382e-05,
"loss": 0.0002,
"step": 4850
},
{
"epoch": 48.75,
"learning_rate": 2.2231645569620254e-05,
"loss": 0.0002,
"step": 4875
},
{
"epoch": 49.0,
"learning_rate": 2.221582278481013e-05,
"loss": 0.0002,
"step": 4900
},
{
"epoch": 49.25,
"learning_rate": 2.22e-05,
"loss": 0.0002,
"step": 4925
},
{
"epoch": 49.5,
"learning_rate": 2.2184177215189876e-05,
"loss": 0.0002,
"step": 4950
},
{
"epoch": 49.75,
"learning_rate": 2.2168354430379748e-05,
"loss": 0.0002,
"step": 4975
},
{
"epoch": 50.0,
"learning_rate": 2.215253164556962e-05,
"loss": 0.0002,
"step": 5000
},
{
"epoch": 50.0,
"eval_loss": 0.42450690269470215,
"eval_runtime": 158.7789,
"eval_samples_per_second": 80.25,
"eval_steps_per_second": 1.26,
"eval_wer": 17.89510708144443,
"step": 5000
},
{
"epoch": 50.25,
"learning_rate": 2.2136708860759495e-05,
"loss": 0.0002,
"step": 5025
},
{
"epoch": 50.5,
"learning_rate": 2.2120886075949367e-05,
"loss": 0.0002,
"step": 5050
},
{
"epoch": 50.75,
"learning_rate": 2.2105063291139242e-05,
"loss": 0.0002,
"step": 5075
},
{
"epoch": 51.0,
"learning_rate": 2.2089240506329114e-05,
"loss": 0.0002,
"step": 5100
},
{
"epoch": 51.25,
"learning_rate": 2.207341772151899e-05,
"loss": 0.0002,
"step": 5125
},
{
"epoch": 51.5,
"learning_rate": 2.205759493670886e-05,
"loss": 0.0002,
"step": 5150
},
{
"epoch": 51.75,
"learning_rate": 2.2041772151898733e-05,
"loss": 0.0002,
"step": 5175
},
{
"epoch": 52.0,
"learning_rate": 2.202594936708861e-05,
"loss": 0.0002,
"step": 5200
},
{
"epoch": 52.25,
"learning_rate": 2.201012658227848e-05,
"loss": 0.0002,
"step": 5225
},
{
"epoch": 52.5,
"learning_rate": 2.1994303797468356e-05,
"loss": 0.0002,
"step": 5250
},
{
"epoch": 52.75,
"learning_rate": 2.1978481012658227e-05,
"loss": 0.0002,
"step": 5275
},
{
"epoch": 53.0,
"learning_rate": 2.1962658227848103e-05,
"loss": 0.0002,
"step": 5300
},
{
"epoch": 53.25,
"learning_rate": 2.1946835443037975e-05,
"loss": 0.0002,
"step": 5325
},
{
"epoch": 53.5,
"learning_rate": 2.1931012658227846e-05,
"loss": 0.0002,
"step": 5350
},
{
"epoch": 53.75,
"learning_rate": 2.1915189873417722e-05,
"loss": 0.0002,
"step": 5375
},
{
"epoch": 54.0,
"learning_rate": 2.1899367088607594e-05,
"loss": 0.0002,
"step": 5400
},
{
"epoch": 54.25,
"learning_rate": 2.1883544303797472e-05,
"loss": 0.0002,
"step": 5425
},
{
"epoch": 54.5,
"learning_rate": 2.1867721518987344e-05,
"loss": 0.0002,
"step": 5450
},
{
"epoch": 54.75,
"learning_rate": 2.1851898734177216e-05,
"loss": 0.0002,
"step": 5475
},
{
"epoch": 55.0,
"learning_rate": 2.183607594936709e-05,
"loss": 0.0002,
"step": 5500
},
{
"epoch": 55.25,
"learning_rate": 2.1820253164556963e-05,
"loss": 0.0001,
"step": 5525
},
{
"epoch": 55.5,
"learning_rate": 2.180443037974684e-05,
"loss": 0.0001,
"step": 5550
},
{
"epoch": 55.75,
"learning_rate": 2.178860759493671e-05,
"loss": 0.0001,
"step": 5575
},
{
"epoch": 56.0,
"learning_rate": 2.1772784810126586e-05,
"loss": 0.0002,
"step": 5600
},
{
"epoch": 56.25,
"learning_rate": 2.1756962025316457e-05,
"loss": 0.0001,
"step": 5625
},
{
"epoch": 56.5,
"learning_rate": 2.174113924050633e-05,
"loss": 0.0001,
"step": 5650
},
{
"epoch": 56.75,
"learning_rate": 2.1725316455696205e-05,
"loss": 0.0002,
"step": 5675
},
{
"epoch": 57.0,
"learning_rate": 2.1709493670886076e-05,
"loss": 0.0001,
"step": 5700
},
{
"epoch": 57.25,
"learning_rate": 2.1693670886075952e-05,
"loss": 0.0001,
"step": 5725
},
{
"epoch": 57.5,
"learning_rate": 2.1677848101265824e-05,
"loss": 0.0001,
"step": 5750
},
{
"epoch": 57.75,
"learning_rate": 2.16620253164557e-05,
"loss": 0.0001,
"step": 5775
},
{
"epoch": 58.0,
"learning_rate": 2.164620253164557e-05,
"loss": 0.0001,
"step": 5800
},
{
"epoch": 58.25,
"learning_rate": 2.1630379746835443e-05,
"loss": 0.0001,
"step": 5825
},
{
"epoch": 58.5,
"learning_rate": 2.1614556962025318e-05,
"loss": 0.0001,
"step": 5850
},
{
"epoch": 58.75,
"learning_rate": 2.159873417721519e-05,
"loss": 0.0001,
"step": 5875
},
{
"epoch": 59.0,
"learning_rate": 2.1582911392405065e-05,
"loss": 0.0001,
"step": 5900
},
{
"epoch": 59.25,
"learning_rate": 2.1567088607594937e-05,
"loss": 0.0001,
"step": 5925
},
{
"epoch": 59.5,
"learning_rate": 2.1551265822784812e-05,
"loss": 0.0001,
"step": 5950
},
{
"epoch": 59.75,
"learning_rate": 2.1535443037974684e-05,
"loss": 0.0001,
"step": 5975
},
{
"epoch": 60.0,
"learning_rate": 2.1519620253164556e-05,
"loss": 0.0001,
"step": 6000
},
{
"epoch": 60.0,
"eval_loss": 0.44586753845214844,
"eval_runtime": 159.5286,
"eval_samples_per_second": 79.873,
"eval_steps_per_second": 1.254,
"eval_wer": 17.977176801625763,
"step": 6000
},
{
"epoch": 60.25,
"learning_rate": 2.150379746835443e-05,
"loss": 0.0001,
"step": 6025
},
{
"epoch": 60.5,
"learning_rate": 2.1487974683544303e-05,
"loss": 0.0001,
"step": 6050
},
{
"epoch": 60.75,
"learning_rate": 2.147215189873418e-05,
"loss": 0.0001,
"step": 6075
},
{
"epoch": 61.0,
"learning_rate": 2.145632911392405e-05,
"loss": 0.0001,
"step": 6100
},
{
"epoch": 61.25,
"learning_rate": 2.1440506329113925e-05,
"loss": 0.0001,
"step": 6125
},
{
"epoch": 61.5,
"learning_rate": 2.1424683544303797e-05,
"loss": 0.0001,
"step": 6150
},
{
"epoch": 61.75,
"learning_rate": 2.140886075949367e-05,
"loss": 0.0001,
"step": 6175
},
{
"epoch": 62.0,
"learning_rate": 2.1393037974683544e-05,
"loss": 0.0001,
"step": 6200
},
{
"epoch": 62.25,
"learning_rate": 2.1377215189873416e-05,
"loss": 0.0001,
"step": 6225
},
{
"epoch": 62.5,
"learning_rate": 2.1361392405063295e-05,
"loss": 0.0001,
"step": 6250
},
{
"epoch": 62.75,
"learning_rate": 2.1345569620253167e-05,
"loss": 0.0001,
"step": 6275
},
{
"epoch": 63.0,
"learning_rate": 2.132974683544304e-05,
"loss": 0.0001,
"step": 6300
},
{
"epoch": 63.25,
"learning_rate": 2.1313924050632914e-05,
"loss": 0.0001,
"step": 6325
},
{
"epoch": 63.5,
"learning_rate": 2.1298101265822786e-05,
"loss": 0.0001,
"step": 6350
},
{
"epoch": 63.75,
"learning_rate": 2.128227848101266e-05,
"loss": 0.0001,
"step": 6375
},
{
"epoch": 64.0,
"learning_rate": 2.1266455696202533e-05,
"loss": 0.0001,
"step": 6400
},
{
"epoch": 64.25,
"learning_rate": 2.1250632911392408e-05,
"loss": 0.0001,
"step": 6425
},
{
"epoch": 64.5,
"learning_rate": 2.123481012658228e-05,
"loss": 0.0001,
"step": 6450
},
{
"epoch": 64.75,
"learning_rate": 2.1218987341772152e-05,
"loss": 0.0001,
"step": 6475
},
{
"epoch": 65.0,
"learning_rate": 2.1203164556962027e-05,
"loss": 0.0001,
"step": 6500
},
{
"epoch": 65.25,
"learning_rate": 2.11873417721519e-05,
"loss": 0.0001,
"step": 6525
},
{
"epoch": 65.5,
"learning_rate": 2.1171518987341774e-05,
"loss": 0.0001,
"step": 6550
},
{
"epoch": 65.75,
"learning_rate": 2.1155696202531646e-05,
"loss": 0.0001,
"step": 6575
},
{
"epoch": 66.0,
"learning_rate": 2.113987341772152e-05,
"loss": 0.0001,
"step": 6600
},
{
"epoch": 66.25,
"learning_rate": 2.1124050632911393e-05,
"loss": 0.0001,
"step": 6625
},
{
"epoch": 66.5,
"learning_rate": 2.1108227848101265e-05,
"loss": 0.0001,
"step": 6650
},
{
"epoch": 66.75,
"learning_rate": 2.109240506329114e-05,
"loss": 0.0001,
"step": 6675
},
{
"epoch": 67.0,
"learning_rate": 2.1076582278481012e-05,
"loss": 0.0001,
"step": 6700
},
{
"epoch": 67.25,
"learning_rate": 2.1060759493670888e-05,
"loss": 0.0001,
"step": 6725
},
{
"epoch": 67.5,
"learning_rate": 2.104493670886076e-05,
"loss": 0.0001,
"step": 6750
},
{
"epoch": 67.75,
"learning_rate": 2.1029113924050635e-05,
"loss": 0.0001,
"step": 6775
},
{
"epoch": 68.0,
"learning_rate": 2.1013291139240507e-05,
"loss": 0.0001,
"step": 6800
},
{
"epoch": 68.25,
"learning_rate": 2.099746835443038e-05,
"loss": 0.0001,
"step": 6825
},
{
"epoch": 68.5,
"learning_rate": 2.0981645569620254e-05,
"loss": 0.0001,
"step": 6850
},
{
"epoch": 68.75,
"learning_rate": 2.0965822784810126e-05,
"loss": 0.0001,
"step": 6875
},
{
"epoch": 69.0,
"learning_rate": 2.095e-05,
"loss": 0.0001,
"step": 6900
},
{
"epoch": 69.25,
"learning_rate": 2.0934177215189873e-05,
"loss": 0.0001,
"step": 6925
},
{
"epoch": 69.5,
"learning_rate": 2.0918354430379748e-05,
"loss": 0.0001,
"step": 6950
},
{
"epoch": 69.75,
"learning_rate": 2.090253164556962e-05,
"loss": 0.0001,
"step": 6975
},
{
"epoch": 70.0,
"learning_rate": 2.0886708860759492e-05,
"loss": 0.0001,
"step": 7000
},
{
"epoch": 70.0,
"eval_loss": 0.4665044844150543,
"eval_runtime": 159.7302,
"eval_samples_per_second": 79.772,
"eval_steps_per_second": 1.252,
"eval_wer": 18.01625762075973,
"step": 7000
},
{
"epoch": 70.25,
"learning_rate": 2.0870886075949367e-05,
"loss": 0.0001,
"step": 7025
},
{
"epoch": 70.5,
"learning_rate": 2.085506329113924e-05,
"loss": 0.0001,
"step": 7050
},
{
"epoch": 70.75,
"learning_rate": 2.0839240506329118e-05,
"loss": 0.0001,
"step": 7075
},
{
"epoch": 71.0,
"learning_rate": 2.082341772151899e-05,
"loss": 0.0001,
"step": 7100
},
{
"epoch": 71.25,
"learning_rate": 2.080759493670886e-05,
"loss": 0.0001,
"step": 7125
},
{
"epoch": 71.5,
"learning_rate": 2.0791772151898737e-05,
"loss": 0.0001,
"step": 7150
},
{
"epoch": 71.75,
"learning_rate": 2.077594936708861e-05,
"loss": 0.0001,
"step": 7175
},
{
"epoch": 72.0,
"learning_rate": 2.0760126582278484e-05,
"loss": 0.0001,
"step": 7200
},
{
"epoch": 72.25,
"learning_rate": 2.0744303797468356e-05,
"loss": 0.0001,
"step": 7225
},
{
"epoch": 72.5,
"learning_rate": 2.072848101265823e-05,
"loss": 0.0001,
"step": 7250
},
{
"epoch": 72.75,
"learning_rate": 2.0712658227848103e-05,
"loss": 0.0001,
"step": 7275
},
{
"epoch": 73.0,
"learning_rate": 2.0696835443037975e-05,
"loss": 0.0001,
"step": 7300
},
{
"epoch": 73.25,
"learning_rate": 2.068101265822785e-05,
"loss": 0.0001,
"step": 7325
},
{
"epoch": 73.5,
"learning_rate": 2.0665189873417722e-05,
"loss": 0.0001,
"step": 7350
},
{
"epoch": 73.75,
"learning_rate": 2.0649367088607597e-05,
"loss": 0.0001,
"step": 7375
},
{
"epoch": 74.0,
"learning_rate": 2.063354430379747e-05,
"loss": 0.0001,
"step": 7400
},
{
"epoch": 74.25,
"learning_rate": 2.0617721518987344e-05,
"loss": 0.0001,
"step": 7425
},
{
"epoch": 74.5,
"learning_rate": 2.0601898734177216e-05,
"loss": 0.0001,
"step": 7450
},
{
"epoch": 74.75,
"learning_rate": 2.0586075949367088e-05,
"loss": 0.0001,
"step": 7475
},
{
"epoch": 75.0,
"learning_rate": 2.0570253164556963e-05,
"loss": 0.0001,
"step": 7500
},
{
"epoch": 75.25,
"learning_rate": 2.0554430379746835e-05,
"loss": 0.0001,
"step": 7525
},
{
"epoch": 75.5,
"learning_rate": 2.053860759493671e-05,
"loss": 0.0001,
"step": 7550
},
{
"epoch": 75.75,
"learning_rate": 2.0522784810126582e-05,
"loss": 0.0001,
"step": 7575
},
{
"epoch": 76.0,
"learning_rate": 2.0506962025316458e-05,
"loss": 0.0001,
"step": 7600
},
{
"epoch": 76.25,
"learning_rate": 2.049113924050633e-05,
"loss": 0.0,
"step": 7625
},
{
"epoch": 76.5,
"learning_rate": 2.04753164556962e-05,
"loss": 0.0,
"step": 7650
},
{
"epoch": 76.75,
"learning_rate": 2.0459493670886077e-05,
"loss": 0.0001,
"step": 7675
},
{
"epoch": 77.0,
"learning_rate": 2.044367088607595e-05,
"loss": 0.0,
"step": 7700
},
{
"epoch": 77.25,
"learning_rate": 2.0427848101265824e-05,
"loss": 0.0,
"step": 7725
},
{
"epoch": 77.5,
"learning_rate": 2.0412025316455696e-05,
"loss": 0.0,
"step": 7750
},
{
"epoch": 77.75,
"learning_rate": 2.039620253164557e-05,
"loss": 0.0001,
"step": 7775
},
{
"epoch": 78.0,
"learning_rate": 2.0380379746835443e-05,
"loss": 0.0,
"step": 7800
},
{
"epoch": 78.25,
"learning_rate": 2.0364556962025315e-05,
"loss": 0.0,
"step": 7825
},
{
"epoch": 78.5,
"learning_rate": 2.034873417721519e-05,
"loss": 0.0001,
"step": 7850
},
{
"epoch": 78.75,
"learning_rate": 2.0332911392405062e-05,
"loss": 0.0,
"step": 7875
},
{
"epoch": 79.0,
"learning_rate": 2.031708860759494e-05,
"loss": 0.0001,
"step": 7900
},
{
"epoch": 79.25,
"learning_rate": 2.0301265822784812e-05,
"loss": 0.0,
"step": 7925
},
{
"epoch": 79.5,
"learning_rate": 2.0285443037974684e-05,
"loss": 0.0001,
"step": 7950
},
{
"epoch": 79.75,
"learning_rate": 2.026962025316456e-05,
"loss": 0.0001,
"step": 7975
},
{
"epoch": 80.0,
"learning_rate": 2.025379746835443e-05,
"loss": 0.0,
"step": 8000
},
{
"epoch": 80.0,
"eval_loss": 0.4881844222545624,
"eval_runtime": 159.9181,
"eval_samples_per_second": 79.678,
"eval_steps_per_second": 1.251,
"eval_wer": 18.108097545724558,
"step": 8000
},
{
"epoch": 80.25,
"learning_rate": 2.0237974683544307e-05,
"loss": 0.0,
"step": 8025
},
{
"epoch": 80.5,
"learning_rate": 2.022215189873418e-05,
"loss": 0.0,
"step": 8050
},
{
"epoch": 80.75,
"learning_rate": 2.0206329113924054e-05,
"loss": 0.0001,
"step": 8075
},
{
"epoch": 81.0,
"learning_rate": 2.0190506329113926e-05,
"loss": 0.0,
"step": 8100
},
{
"epoch": 81.25,
"learning_rate": 2.0174683544303797e-05,
"loss": 0.0001,
"step": 8125
},
{
"epoch": 81.5,
"learning_rate": 2.0158860759493673e-05,
"loss": 0.0,
"step": 8150
},
{
"epoch": 81.75,
"learning_rate": 2.0143037974683545e-05,
"loss": 0.0001,
"step": 8175
},
{
"epoch": 82.0,
"learning_rate": 2.0129113924050633e-05,
"loss": 0.0163,
"step": 8200
},
{
"epoch": 82.25,
"learning_rate": 2.0113291139240505e-05,
"loss": 0.0472,
"step": 8225
},
{
"epoch": 82.5,
"learning_rate": 2.009746835443038e-05,
"loss": 0.0499,
"step": 8250
},
{
"epoch": 82.75,
"learning_rate": 2.0081645569620256e-05,
"loss": 0.0423,
"step": 8275
},
{
"epoch": 83.0,
"learning_rate": 2.0065822784810128e-05,
"loss": 0.0335,
"step": 8300
},
{
"epoch": 83.25,
"learning_rate": 2.0050000000000003e-05,
"loss": 0.0196,
"step": 8325
},
{
"epoch": 83.5,
"learning_rate": 2.0034177215189875e-05,
"loss": 0.0161,
"step": 8350
},
{
"epoch": 83.75,
"learning_rate": 2.001835443037975e-05,
"loss": 0.0169,
"step": 8375
},
{
"epoch": 84.0,
"learning_rate": 2.0002531645569622e-05,
"loss": 0.015,
"step": 8400
},
{
"epoch": 84.25,
"learning_rate": 1.9986708860759497e-05,
"loss": 0.0084,
"step": 8425
},
{
"epoch": 84.5,
"learning_rate": 1.997088607594937e-05,
"loss": 0.0072,
"step": 8450
},
{
"epoch": 84.75,
"learning_rate": 1.995506329113924e-05,
"loss": 0.0064,
"step": 8475
},
{
"epoch": 85.0,
"learning_rate": 1.9939240506329116e-05,
"loss": 0.0067,
"step": 8500
},
{
"epoch": 85.25,
"learning_rate": 1.9923417721518988e-05,
"loss": 0.0038,
"step": 8525
},
{
"epoch": 85.5,
"learning_rate": 1.9907594936708863e-05,
"loss": 0.0032,
"step": 8550
},
{
"epoch": 85.75,
"learning_rate": 1.9891772151898735e-05,
"loss": 0.0033,
"step": 8575
},
{
"epoch": 86.0,
"learning_rate": 1.987594936708861e-05,
"loss": 0.0027,
"step": 8600
},
{
"epoch": 86.25,
"learning_rate": 1.9860126582278482e-05,
"loss": 0.0015,
"step": 8625
},
{
"epoch": 86.5,
"learning_rate": 1.9844303797468354e-05,
"loss": 0.0018,
"step": 8650
},
{
"epoch": 86.75,
"learning_rate": 1.982848101265823e-05,
"loss": 0.002,
"step": 8675
},
{
"epoch": 87.0,
"learning_rate": 1.98126582278481e-05,
"loss": 0.002,
"step": 8700
},
{
"epoch": 87.25,
"learning_rate": 1.9796835443037977e-05,
"loss": 0.0011,
"step": 8725
},
{
"epoch": 87.5,
"learning_rate": 1.978101265822785e-05,
"loss": 0.0011,
"step": 8750
},
{
"epoch": 87.75,
"learning_rate": 1.9765189873417724e-05,
"loss": 0.0009,
"step": 8775
},
{
"epoch": 88.0,
"learning_rate": 1.9749367088607596e-05,
"loss": 0.0008,
"step": 8800
},
{
"epoch": 88.25,
"learning_rate": 1.9733544303797467e-05,
"loss": 0.0006,
"step": 8825
},
{
"epoch": 88.5,
"learning_rate": 1.9717721518987343e-05,
"loss": 0.0005,
"step": 8850
},
{
"epoch": 88.75,
"learning_rate": 1.9701898734177215e-05,
"loss": 0.0006,
"step": 8875
},
{
"epoch": 89.0,
"learning_rate": 1.968607594936709e-05,
"loss": 0.0005,
"step": 8900
},
{
"epoch": 89.25,
"learning_rate": 1.9670253164556962e-05,
"loss": 0.0004,
"step": 8925
},
{
"epoch": 89.5,
"learning_rate": 1.9654430379746837e-05,
"loss": 0.0004,
"step": 8950
},
{
"epoch": 89.75,
"learning_rate": 1.963860759493671e-05,
"loss": 0.0003,
"step": 8975
},
{
"epoch": 90.0,
"learning_rate": 1.962278481012658e-05,
"loss": 0.0003,
"step": 9000
},
{
"epoch": 90.0,
"eval_loss": 0.3803234100341797,
"eval_runtime": 158.5126,
"eval_samples_per_second": 80.385,
"eval_steps_per_second": 1.262,
"eval_wer": 16.380725340003128,
"step": 9000
},
{
"epoch": 90.25,
"learning_rate": 1.9606962025316456e-05,
"loss": 0.0002,
"step": 9025
},
{
"epoch": 90.5,
"learning_rate": 1.9591139240506328e-05,
"loss": 0.0002,
"step": 9050
},
{
"epoch": 90.75,
"learning_rate": 1.9575316455696203e-05,
"loss": 0.0002,
"step": 9075
},
{
"epoch": 91.0,
"learning_rate": 1.955949367088608e-05,
"loss": 0.0002,
"step": 9100
},
{
"epoch": 91.25,
"learning_rate": 1.954367088607595e-05,
"loss": 0.0002,
"step": 9125
},
{
"epoch": 91.5,
"learning_rate": 1.9527848101265826e-05,
"loss": 0.0002,
"step": 9150
},
{
"epoch": 91.75,
"learning_rate": 1.9512025316455697e-05,
"loss": 0.0002,
"step": 9175
},
{
"epoch": 92.0,
"learning_rate": 1.9496202531645573e-05,
"loss": 0.0002,
"step": 9200
},
{
"epoch": 92.25,
"learning_rate": 1.9480379746835445e-05,
"loss": 0.0002,
"step": 9225
},
{
"epoch": 92.5,
"learning_rate": 1.946455696202532e-05,
"loss": 0.0002,
"step": 9250
},
{
"epoch": 92.75,
"learning_rate": 1.9448734177215192e-05,
"loss": 0.0002,
"step": 9275
},
{
"epoch": 93.0,
"learning_rate": 1.9432911392405064e-05,
"loss": 0.0002,
"step": 9300
},
{
"epoch": 93.25,
"learning_rate": 1.941708860759494e-05,
"loss": 0.0002,
"step": 9325
},
{
"epoch": 93.5,
"learning_rate": 1.940126582278481e-05,
"loss": 0.0002,
"step": 9350
},
{
"epoch": 93.75,
"learning_rate": 1.9385443037974686e-05,
"loss": 0.0002,
"step": 9375
},
{
"epoch": 94.0,
"learning_rate": 1.9369620253164558e-05,
"loss": 0.0002,
"step": 9400
},
{
"epoch": 94.25,
"learning_rate": 1.9353797468354433e-05,
"loss": 0.0002,
"step": 9425
},
{
"epoch": 94.5,
"learning_rate": 1.9337974683544305e-05,
"loss": 0.0002,
"step": 9450
},
{
"epoch": 94.75,
"learning_rate": 1.9322151898734177e-05,
"loss": 0.0002,
"step": 9475
},
{
"epoch": 95.0,
"learning_rate": 1.9306329113924052e-05,
"loss": 0.0002,
"step": 9500
},
{
"epoch": 95.25,
"learning_rate": 1.9290506329113924e-05,
"loss": 0.0002,
"step": 9525
},
{
"epoch": 95.5,
"learning_rate": 1.92746835443038e-05,
"loss": 0.0002,
"step": 9550
},
{
"epoch": 95.75,
"learning_rate": 1.925886075949367e-05,
"loss": 0.0001,
"step": 9575
},
{
"epoch": 96.0,
"learning_rate": 1.9243037974683546e-05,
"loss": 0.0001,
"step": 9600
},
{
"epoch": 96.25,
"learning_rate": 1.9227215189873418e-05,
"loss": 0.0001,
"step": 9625
},
{
"epoch": 96.5,
"learning_rate": 1.921139240506329e-05,
"loss": 0.0001,
"step": 9650
},
{
"epoch": 96.75,
"learning_rate": 1.9195569620253165e-05,
"loss": 0.0001,
"step": 9675
},
{
"epoch": 97.0,
"learning_rate": 1.9179746835443037e-05,
"loss": 0.0001,
"step": 9700
},
{
"epoch": 97.25,
"learning_rate": 1.9163924050632913e-05,
"loss": 0.0001,
"step": 9725
},
{
"epoch": 97.5,
"learning_rate": 1.9148101265822784e-05,
"loss": 0.0001,
"step": 9750
},
{
"epoch": 97.75,
"learning_rate": 1.913227848101266e-05,
"loss": 0.0001,
"step": 9775
},
{
"epoch": 98.0,
"learning_rate": 1.911645569620253e-05,
"loss": 0.0001,
"step": 9800
},
{
"epoch": 98.25,
"learning_rate": 1.9100632911392403e-05,
"loss": 0.0001,
"step": 9825
},
{
"epoch": 98.5,
"learning_rate": 1.908481012658228e-05,
"loss": 0.0001,
"step": 9850
},
{
"epoch": 98.75,
"learning_rate": 1.906898734177215e-05,
"loss": 0.0001,
"step": 9875
},
{
"epoch": 99.0,
"learning_rate": 1.9053164556962026e-05,
"loss": 0.0001,
"step": 9900
},
{
"epoch": 99.25,
"learning_rate": 1.90373417721519e-05,
"loss": 0.0001,
"step": 9925
},
{
"epoch": 99.5,
"learning_rate": 1.9021518987341773e-05,
"loss": 0.0001,
"step": 9950
},
{
"epoch": 99.75,
"learning_rate": 1.9005696202531648e-05,
"loss": 0.0001,
"step": 9975
},
{
"epoch": 100.0,
"learning_rate": 1.898987341772152e-05,
"loss": 0.0001,
"step": 10000
},
{
"epoch": 100.0,
"eval_loss": 0.4047200679779053,
"eval_runtime": 158.4112,
"eval_samples_per_second": 80.436,
"eval_steps_per_second": 1.263,
"eval_wer": 16.229287165858995,
"step": 10000
},
{
"epoch": 100.25,
"learning_rate": 1.8974050632911395e-05,
"loss": 0.0001,
"step": 10025
},
{
"epoch": 100.5,
"learning_rate": 1.8958227848101267e-05,
"loss": 0.0001,
"step": 10050
},
{
"epoch": 100.75,
"learning_rate": 1.8942405063291143e-05,
"loss": 0.0001,
"step": 10075
},
{
"epoch": 101.0,
"learning_rate": 1.8926582278481014e-05,
"loss": 0.0001,
"step": 10100
},
{
"epoch": 101.25,
"learning_rate": 1.8910759493670886e-05,
"loss": 0.0001,
"step": 10125
},
{
"epoch": 101.5,
"learning_rate": 1.889493670886076e-05,
"loss": 0.0001,
"step": 10150
},
{
"epoch": 101.75,
"learning_rate": 1.8879113924050633e-05,
"loss": 0.0001,
"step": 10175
},
{
"epoch": 102.0,
"learning_rate": 1.886329113924051e-05,
"loss": 0.0001,
"step": 10200
},
{
"epoch": 102.25,
"learning_rate": 1.884746835443038e-05,
"loss": 0.0001,
"step": 10225
},
{
"epoch": 102.5,
"learning_rate": 1.8831645569620256e-05,
"loss": 0.0001,
"step": 10250
},
{
"epoch": 102.75,
"learning_rate": 1.8815822784810128e-05,
"loss": 0.0001,
"step": 10275
},
{
"epoch": 103.0,
"learning_rate": 1.88e-05,
"loss": 0.0001,
"step": 10300
},
{
"epoch": 103.25,
"learning_rate": 1.8784177215189875e-05,
"loss": 0.0001,
"step": 10325
},
{
"epoch": 103.5,
"learning_rate": 1.8768354430379747e-05,
"loss": 0.0001,
"step": 10350
},
{
"epoch": 103.75,
"learning_rate": 1.8752531645569622e-05,
"loss": 0.0001,
"step": 10375
},
{
"epoch": 104.0,
"learning_rate": 1.8736708860759494e-05,
"loss": 0.0001,
"step": 10400
},
{
"epoch": 104.25,
"learning_rate": 1.872088607594937e-05,
"loss": 0.0001,
"step": 10425
},
{
"epoch": 104.5,
"learning_rate": 1.870506329113924e-05,
"loss": 0.0001,
"step": 10450
},
{
"epoch": 104.75,
"learning_rate": 1.8689240506329113e-05,
"loss": 0.0001,
"step": 10475
},
{
"epoch": 105.0,
"learning_rate": 1.8673417721518988e-05,
"loss": 0.0001,
"step": 10500
},
{
"epoch": 105.25,
"learning_rate": 1.865759493670886e-05,
"loss": 0.0001,
"step": 10525
},
{
"epoch": 105.5,
"learning_rate": 1.8641772151898735e-05,
"loss": 0.0001,
"step": 10550
},
{
"epoch": 105.75,
"learning_rate": 1.8625949367088607e-05,
"loss": 0.0001,
"step": 10575
},
{
"epoch": 106.0,
"learning_rate": 1.8610126582278482e-05,
"loss": 0.0001,
"step": 10600
},
{
"epoch": 106.25,
"learning_rate": 1.8594303797468354e-05,
"loss": 0.0001,
"step": 10625
},
{
"epoch": 106.5,
"learning_rate": 1.8578481012658226e-05,
"loss": 0.0001,
"step": 10650
},
{
"epoch": 106.75,
"learning_rate": 1.85626582278481e-05,
"loss": 0.0001,
"step": 10675
},
{
"epoch": 107.0,
"learning_rate": 1.8546835443037973e-05,
"loss": 0.0001,
"step": 10700
},
{
"epoch": 107.25,
"learning_rate": 1.8531012658227852e-05,
"loss": 0.0001,
"step": 10725
},
{
"epoch": 107.5,
"learning_rate": 1.8515189873417724e-05,
"loss": 0.0001,
"step": 10750
},
{
"epoch": 107.75,
"learning_rate": 1.8499367088607596e-05,
"loss": 0.0001,
"step": 10775
},
{
"epoch": 108.0,
"learning_rate": 1.848354430379747e-05,
"loss": 0.0001,
"step": 10800
},
{
"epoch": 108.25,
"learning_rate": 1.8467721518987343e-05,
"loss": 0.0001,
"step": 10825
},
{
"epoch": 108.5,
"learning_rate": 1.8451898734177218e-05,
"loss": 0.0001,
"step": 10850
},
{
"epoch": 108.75,
"learning_rate": 1.843607594936709e-05,
"loss": 0.0001,
"step": 10875
},
{
"epoch": 109.0,
"learning_rate": 1.8420253164556965e-05,
"loss": 0.0001,
"step": 10900
},
{
"epoch": 109.25,
"learning_rate": 1.8404430379746837e-05,
"loss": 0.0001,
"step": 10925
},
{
"epoch": 109.5,
"learning_rate": 1.838860759493671e-05,
"loss": 0.0001,
"step": 10950
},
{
"epoch": 109.75,
"learning_rate": 1.8372784810126584e-05,
"loss": 0.0001,
"step": 10975
},
{
"epoch": 110.0,
"learning_rate": 1.8356962025316456e-05,
"loss": 0.0001,
"step": 11000
},
{
"epoch": 110.0,
"eval_loss": 0.420736163854599,
"eval_runtime": 158.9284,
"eval_samples_per_second": 80.174,
"eval_steps_per_second": 1.258,
"eval_wer": 16.241988432077537,
"step": 11000
},
{
"epoch": 110.25,
"learning_rate": 1.834113924050633e-05,
"loss": 0.0001,
"step": 11025
},
{
"epoch": 110.5,
"learning_rate": 1.8325316455696203e-05,
"loss": 0.0001,
"step": 11050
},
{
"epoch": 110.75,
"learning_rate": 1.830949367088608e-05,
"loss": 0.0001,
"step": 11075
},
{
"epoch": 111.0,
"learning_rate": 1.829367088607595e-05,
"loss": 0.0001,
"step": 11100
},
{
"epoch": 111.25,
"learning_rate": 1.8277848101265822e-05,
"loss": 0.0001,
"step": 11125
},
{
"epoch": 111.5,
"learning_rate": 1.8262025316455698e-05,
"loss": 0.0001,
"step": 11150
},
{
"epoch": 111.75,
"learning_rate": 1.824620253164557e-05,
"loss": 0.0001,
"step": 11175
},
{
"epoch": 112.0,
"learning_rate": 1.8230379746835445e-05,
"loss": 0.0001,
"step": 11200
},
{
"epoch": 112.25,
"learning_rate": 1.8214556962025317e-05,
"loss": 0.0001,
"step": 11225
},
{
"epoch": 112.5,
"learning_rate": 1.8198734177215192e-05,
"loss": 0.0001,
"step": 11250
},
{
"epoch": 112.75,
"learning_rate": 1.8182911392405064e-05,
"loss": 0.0001,
"step": 11275
},
{
"epoch": 113.0,
"learning_rate": 1.8167088607594936e-05,
"loss": 0.0001,
"step": 11300
},
{
"epoch": 113.25,
"learning_rate": 1.815126582278481e-05,
"loss": 0.0001,
"step": 11325
},
{
"epoch": 113.5,
"learning_rate": 1.8135443037974683e-05,
"loss": 0.0001,
"step": 11350
},
{
"epoch": 113.75,
"learning_rate": 1.8119620253164558e-05,
"loss": 0.0001,
"step": 11375
},
{
"epoch": 114.0,
"learning_rate": 1.810379746835443e-05,
"loss": 0.0001,
"step": 11400
},
{
"epoch": 114.25,
"learning_rate": 1.8087974683544305e-05,
"loss": 0.0001,
"step": 11425
},
{
"epoch": 114.5,
"learning_rate": 1.8072151898734177e-05,
"loss": 0.0001,
"step": 11450
},
{
"epoch": 114.75,
"learning_rate": 1.805632911392405e-05,
"loss": 0.0001,
"step": 11475
},
{
"epoch": 115.0,
"learning_rate": 1.8040506329113924e-05,
"loss": 0.0001,
"step": 11500
},
{
"epoch": 115.25,
"learning_rate": 1.8024683544303796e-05,
"loss": 0.0001,
"step": 11525
},
{
"epoch": 115.5,
"learning_rate": 1.8008860759493675e-05,
"loss": 0.0001,
"step": 11550
},
{
"epoch": 115.75,
"learning_rate": 1.7993037974683547e-05,
"loss": 0.0001,
"step": 11575
},
{
"epoch": 116.0,
"learning_rate": 1.797721518987342e-05,
"loss": 0.0001,
"step": 11600
},
{
"epoch": 116.25,
"learning_rate": 1.7961392405063294e-05,
"loss": 0.0001,
"step": 11625
},
{
"epoch": 116.5,
"learning_rate": 1.7945569620253166e-05,
"loss": 0.0001,
"step": 11650
},
{
"epoch": 116.75,
"learning_rate": 1.792974683544304e-05,
"loss": 0.0001,
"step": 11675
},
{
"epoch": 117.0,
"learning_rate": 1.7913924050632913e-05,
"loss": 0.0001,
"step": 11700
},
{
"epoch": 117.25,
"learning_rate": 1.7898101265822788e-05,
"loss": 0.0001,
"step": 11725
},
{
"epoch": 117.5,
"learning_rate": 1.788227848101266e-05,
"loss": 0.0001,
"step": 11750
},
{
"epoch": 117.75,
"learning_rate": 1.786645569620253e-05,
"loss": 0.0001,
"step": 11775
},
{
"epoch": 118.0,
"learning_rate": 1.7850632911392407e-05,
"loss": 0.0001,
"step": 11800
},
{
"epoch": 118.25,
"learning_rate": 1.783481012658228e-05,
"loss": 0.0,
"step": 11825
},
{
"epoch": 118.5,
"learning_rate": 1.7818987341772154e-05,
"loss": 0.0,
"step": 11850
},
{
"epoch": 118.75,
"learning_rate": 1.7803164556962026e-05,
"loss": 0.0001,
"step": 11875
},
{
"epoch": 119.0,
"learning_rate": 1.77873417721519e-05,
"loss": 0.0001,
"step": 11900
},
{
"epoch": 119.25,
"learning_rate": 1.7771518987341773e-05,
"loss": 0.0,
"step": 11925
},
{
"epoch": 119.5,
"learning_rate": 1.7755696202531645e-05,
"loss": 0.0001,
"step": 11950
},
{
"epoch": 119.75,
"learning_rate": 1.773987341772152e-05,
"loss": 0.0,
"step": 11975
},
{
"epoch": 120.0,
"learning_rate": 1.7724050632911392e-05,
"loss": 0.0001,
"step": 12000
},
{
"epoch": 120.0,
"eval_loss": 0.43533626198768616,
"eval_runtime": 158.8725,
"eval_samples_per_second": 80.203,
"eval_steps_per_second": 1.259,
"eval_wer": 16.28790839455995,
"step": 12000
},
{
"epoch": 120.25,
"learning_rate": 1.7708227848101267e-05,
"loss": 0.0001,
"step": 12025
},
{
"epoch": 120.5,
"learning_rate": 1.769240506329114e-05,
"loss": 0.0,
"step": 12050
},
{
"epoch": 120.75,
"learning_rate": 1.7676582278481015e-05,
"loss": 0.0,
"step": 12075
},
{
"epoch": 121.0,
"learning_rate": 1.7660759493670886e-05,
"loss": 0.0001,
"step": 12100
},
{
"epoch": 121.25,
"learning_rate": 1.7644936708860758e-05,
"loss": 0.0,
"step": 12125
},
{
"epoch": 121.5,
"learning_rate": 1.7629113924050634e-05,
"loss": 0.0,
"step": 12150
},
{
"epoch": 121.75,
"learning_rate": 1.7613291139240505e-05,
"loss": 0.0001,
"step": 12175
},
{
"epoch": 122.0,
"learning_rate": 1.759746835443038e-05,
"loss": 0.0,
"step": 12200
},
{
"epoch": 122.25,
"learning_rate": 1.7581645569620253e-05,
"loss": 0.0,
"step": 12225
},
{
"epoch": 122.5,
"learning_rate": 1.7565822784810128e-05,
"loss": 0.0,
"step": 12250
},
{
"epoch": 122.75,
"learning_rate": 1.755e-05,
"loss": 0.0,
"step": 12275
},
{
"epoch": 123.0,
"learning_rate": 1.753417721518987e-05,
"loss": 0.0,
"step": 12300
},
{
"epoch": 123.25,
"learning_rate": 1.7518354430379747e-05,
"loss": 0.0,
"step": 12325
},
{
"epoch": 123.5,
"learning_rate": 1.750253164556962e-05,
"loss": 0.0,
"step": 12350
},
{
"epoch": 123.75,
"learning_rate": 1.7486708860759497e-05,
"loss": 0.0,
"step": 12375
},
{
"epoch": 124.0,
"learning_rate": 1.747088607594937e-05,
"loss": 0.0,
"step": 12400
},
{
"epoch": 124.25,
"learning_rate": 1.745506329113924e-05,
"loss": 0.0,
"step": 12425
},
{
"epoch": 124.5,
"learning_rate": 1.7439240506329116e-05,
"loss": 0.0,
"step": 12450
},
{
"epoch": 124.75,
"learning_rate": 1.7423417721518988e-05,
"loss": 0.0,
"step": 12475
},
{
"epoch": 125.0,
"learning_rate": 1.7407594936708863e-05,
"loss": 0.0,
"step": 12500
},
{
"epoch": 125.25,
"learning_rate": 1.7391772151898735e-05,
"loss": 0.0,
"step": 12525
},
{
"epoch": 125.5,
"learning_rate": 1.737594936708861e-05,
"loss": 0.0,
"step": 12550
},
{
"epoch": 125.75,
"learning_rate": 1.7360126582278483e-05,
"loss": 0.0,
"step": 12575
},
{
"epoch": 126.0,
"learning_rate": 1.7344303797468354e-05,
"loss": 0.0,
"step": 12600
},
{
"epoch": 126.25,
"learning_rate": 1.732848101265823e-05,
"loss": 0.0,
"step": 12625
},
{
"epoch": 126.5,
"learning_rate": 1.73126582278481e-05,
"loss": 0.0,
"step": 12650
},
{
"epoch": 126.75,
"learning_rate": 1.7296835443037977e-05,
"loss": 0.0,
"step": 12675
},
{
"epoch": 127.0,
"learning_rate": 1.728101265822785e-05,
"loss": 0.0,
"step": 12700
},
{
"epoch": 127.25,
"learning_rate": 1.7265189873417724e-05,
"loss": 0.0,
"step": 12725
},
{
"epoch": 127.5,
"learning_rate": 1.7249367088607596e-05,
"loss": 0.0,
"step": 12750
},
{
"epoch": 127.75,
"learning_rate": 1.7233544303797468e-05,
"loss": 0.0001,
"step": 12775
},
{
"epoch": 128.0,
"learning_rate": 1.7217721518987343e-05,
"loss": 0.0,
"step": 12800
},
{
"epoch": 128.25,
"learning_rate": 1.7201898734177215e-05,
"loss": 0.0,
"step": 12825
},
{
"epoch": 128.5,
"learning_rate": 1.718607594936709e-05,
"loss": 0.0,
"step": 12850
},
{
"epoch": 128.75,
"learning_rate": 1.7170253164556962e-05,
"loss": 0.0,
"step": 12875
},
{
"epoch": 129.0,
"learning_rate": 1.7154430379746837e-05,
"loss": 0.0,
"step": 12900
},
{
"epoch": 129.25,
"learning_rate": 1.713860759493671e-05,
"loss": 0.0,
"step": 12925
},
{
"epoch": 129.5,
"learning_rate": 1.712278481012658e-05,
"loss": 0.0,
"step": 12950
},
{
"epoch": 129.75,
"learning_rate": 1.7106962025316456e-05,
"loss": 0.0,
"step": 12975
},
{
"epoch": 130.0,
"learning_rate": 1.7091139240506328e-05,
"loss": 0.0,
"step": 13000
},
{
"epoch": 130.0,
"eval_loss": 0.4501500725746155,
"eval_runtime": 161.2897,
"eval_samples_per_second": 79.001,
"eval_steps_per_second": 1.24,
"eval_wer": 16.369978114741286,
"step": 13000
},
{
"epoch": 130.25,
"learning_rate": 1.7075316455696203e-05,
"loss": 0.0,
"step": 13025
},
{
"epoch": 130.5,
"learning_rate": 1.7059493670886075e-05,
"loss": 0.0,
"step": 13050
},
{
"epoch": 130.75,
"learning_rate": 1.704367088607595e-05,
"loss": 0.0,
"step": 13075
},
{
"epoch": 131.0,
"learning_rate": 1.7027848101265822e-05,
"loss": 0.0,
"step": 13100
},
{
"epoch": 131.25,
"learning_rate": 1.7012025316455694e-05,
"loss": 0.0,
"step": 13125
},
{
"epoch": 131.5,
"learning_rate": 1.699620253164557e-05,
"loss": 0.0,
"step": 13150
},
{
"epoch": 131.75,
"learning_rate": 1.698037974683544e-05,
"loss": 0.0,
"step": 13175
},
{
"epoch": 132.0,
"learning_rate": 1.696455696202532e-05,
"loss": 0.0,
"step": 13200
},
{
"epoch": 132.25,
"learning_rate": 1.6948734177215192e-05,
"loss": 0.0,
"step": 13225
},
{
"epoch": 132.5,
"learning_rate": 1.6932911392405064e-05,
"loss": 0.0,
"step": 13250
},
{
"epoch": 132.75,
"learning_rate": 1.691708860759494e-05,
"loss": 0.0,
"step": 13275
},
{
"epoch": 133.0,
"learning_rate": 1.690126582278481e-05,
"loss": 0.0,
"step": 13300
},
{
"epoch": 133.25,
"learning_rate": 1.6885443037974686e-05,
"loss": 0.0,
"step": 13325
},
{
"epoch": 133.5,
"learning_rate": 1.6869620253164558e-05,
"loss": 0.0,
"step": 13350
},
{
"epoch": 133.75,
"learning_rate": 1.6853797468354433e-05,
"loss": 0.0,
"step": 13375
},
{
"epoch": 134.0,
"learning_rate": 1.6837974683544305e-05,
"loss": 0.0,
"step": 13400
},
{
"epoch": 134.25,
"learning_rate": 1.6822151898734177e-05,
"loss": 0.0,
"step": 13425
},
{
"epoch": 134.5,
"learning_rate": 1.6806329113924052e-05,
"loss": 0.0,
"step": 13450
},
{
"epoch": 134.75,
"learning_rate": 1.6790506329113924e-05,
"loss": 0.0,
"step": 13475
},
{
"epoch": 135.0,
"learning_rate": 1.67746835443038e-05,
"loss": 0.0,
"step": 13500
},
{
"epoch": 135.25,
"learning_rate": 1.675886075949367e-05,
"loss": 0.0,
"step": 13525
},
{
"epoch": 135.5,
"learning_rate": 1.6743037974683547e-05,
"loss": 0.0,
"step": 13550
},
{
"epoch": 135.75,
"learning_rate": 1.672721518987342e-05,
"loss": 0.0,
"step": 13575
},
{
"epoch": 136.0,
"learning_rate": 1.671139240506329e-05,
"loss": 0.0,
"step": 13600
},
{
"epoch": 136.25,
"learning_rate": 1.6695569620253166e-05,
"loss": 0.0,
"step": 13625
},
{
"epoch": 136.5,
"learning_rate": 1.6679746835443038e-05,
"loss": 0.0,
"step": 13650
},
{
"epoch": 136.75,
"learning_rate": 1.6663924050632913e-05,
"loss": 0.0,
"step": 13675
},
{
"epoch": 137.0,
"learning_rate": 1.6648101265822785e-05,
"loss": 0.0,
"step": 13700
},
{
"epoch": 137.25,
"learning_rate": 1.663227848101266e-05,
"loss": 0.0,
"step": 13725
},
{
"epoch": 137.5,
"learning_rate": 1.6616455696202532e-05,
"loss": 0.0,
"step": 13750
},
{
"epoch": 137.75,
"learning_rate": 1.6600632911392404e-05,
"loss": 0.0,
"step": 13775
},
{
"epoch": 138.0,
"learning_rate": 1.658481012658228e-05,
"loss": 0.0,
"step": 13800
},
{
"epoch": 138.25,
"learning_rate": 1.656898734177215e-05,
"loss": 0.0,
"step": 13825
},
{
"epoch": 138.5,
"learning_rate": 1.6553164556962026e-05,
"loss": 0.0,
"step": 13850
},
{
"epoch": 138.75,
"learning_rate": 1.6537341772151898e-05,
"loss": 0.0,
"step": 13875
},
{
"epoch": 139.0,
"learning_rate": 1.6521518987341773e-05,
"loss": 0.0,
"step": 13900
},
{
"epoch": 139.25,
"learning_rate": 1.6505696202531645e-05,
"loss": 0.0,
"step": 13925
},
{
"epoch": 139.5,
"learning_rate": 1.6489873417721517e-05,
"loss": 0.0,
"step": 13950
},
{
"epoch": 139.75,
"learning_rate": 1.6474050632911392e-05,
"loss": 0.0,
"step": 13975
},
{
"epoch": 140.0,
"learning_rate": 1.6458227848101264e-05,
"loss": 0.0,
"step": 14000
},
{
"epoch": 140.0,
"eval_loss": 0.4653187692165375,
"eval_runtime": 162.4767,
"eval_samples_per_second": 78.424,
"eval_steps_per_second": 1.231,
"eval_wer": 16.508715022666877,
"step": 14000
},
{
"epoch": 140.25,
"learning_rate": 1.6442405063291143e-05,
"loss": 0.0,
"step": 14025
},
{
"epoch": 140.5,
"learning_rate": 1.6426582278481015e-05,
"loss": 0.0,
"step": 14050
},
{
"epoch": 140.75,
"learning_rate": 1.6410759493670887e-05,
"loss": 0.0,
"step": 14075
},
{
"epoch": 141.0,
"learning_rate": 1.6394936708860762e-05,
"loss": 0.0,
"step": 14100
},
{
"epoch": 141.25,
"learning_rate": 1.6379113924050634e-05,
"loss": 0.0,
"step": 14125
},
{
"epoch": 141.5,
"learning_rate": 1.636329113924051e-05,
"loss": 0.0,
"step": 14150
},
{
"epoch": 141.75,
"learning_rate": 1.634746835443038e-05,
"loss": 0.0,
"step": 14175
},
{
"epoch": 142.0,
"learning_rate": 1.6331645569620256e-05,
"loss": 0.0,
"step": 14200
},
{
"epoch": 142.25,
"learning_rate": 1.6315822784810128e-05,
"loss": 0.0,
"step": 14225
},
{
"epoch": 142.5,
"learning_rate": 1.63e-05,
"loss": 0.0,
"step": 14250
},
{
"epoch": 142.75,
"learning_rate": 1.6284177215189875e-05,
"loss": 0.0,
"step": 14275
},
{
"epoch": 143.0,
"learning_rate": 1.6268354430379747e-05,
"loss": 0.0,
"step": 14300
},
{
"epoch": 143.25,
"learning_rate": 1.6252531645569622e-05,
"loss": 0.0,
"step": 14325
},
{
"epoch": 143.5,
"learning_rate": 1.6236708860759494e-05,
"loss": 0.0,
"step": 14350
},
{
"epoch": 143.75,
"learning_rate": 1.622088607594937e-05,
"loss": 0.0,
"step": 14375
},
{
"epoch": 144.0,
"learning_rate": 1.620506329113924e-05,
"loss": 0.0,
"step": 14400
},
{
"epoch": 144.25,
"learning_rate": 1.6189240506329113e-05,
"loss": 0.0,
"step": 14425
},
{
"epoch": 144.5,
"learning_rate": 1.617341772151899e-05,
"loss": 0.0,
"step": 14450
},
{
"epoch": 144.75,
"learning_rate": 1.615759493670886e-05,
"loss": 0.0,
"step": 14475
},
{
"epoch": 145.0,
"learning_rate": 1.6141772151898735e-05,
"loss": 0.0,
"step": 14500
},
{
"epoch": 145.25,
"learning_rate": 1.6125949367088607e-05,
"loss": 0.0,
"step": 14525
},
{
"epoch": 145.5,
"learning_rate": 1.6110126582278483e-05,
"loss": 0.0,
"step": 14550
},
{
"epoch": 145.75,
"learning_rate": 1.6094303797468354e-05,
"loss": 0.0,
"step": 14575
},
{
"epoch": 146.0,
"learning_rate": 1.6078481012658226e-05,
"loss": 0.0,
"step": 14600
},
{
"epoch": 146.25,
"learning_rate": 1.60626582278481e-05,
"loss": 0.0,
"step": 14625
},
{
"epoch": 146.5,
"learning_rate": 1.6046835443037974e-05,
"loss": 0.0,
"step": 14650
},
{
"epoch": 146.75,
"learning_rate": 1.603101265822785e-05,
"loss": 0.0,
"step": 14675
},
{
"epoch": 147.0,
"learning_rate": 1.601518987341772e-05,
"loss": 0.0,
"step": 14700
},
{
"epoch": 147.25,
"learning_rate": 1.5999367088607596e-05,
"loss": 0.0,
"step": 14725
},
{
"epoch": 147.5,
"learning_rate": 1.5983544303797468e-05,
"loss": 0.0,
"step": 14750
},
{
"epoch": 147.75,
"learning_rate": 1.5967721518987343e-05,
"loss": 0.0,
"step": 14775
},
{
"epoch": 148.0,
"learning_rate": 1.5951898734177215e-05,
"loss": 0.0,
"step": 14800
},
{
"epoch": 148.25,
"learning_rate": 1.5936075949367087e-05,
"loss": 0.0,
"step": 14825
},
{
"epoch": 148.5,
"learning_rate": 1.5920253164556965e-05,
"loss": 0.0,
"step": 14850
},
{
"epoch": 148.75,
"learning_rate": 1.5904430379746837e-05,
"loss": 0.0,
"step": 14875
},
{
"epoch": 149.0,
"learning_rate": 1.588860759493671e-05,
"loss": 0.0,
"step": 14900
},
{
"epoch": 149.25,
"learning_rate": 1.5872784810126584e-05,
"loss": 0.0,
"step": 14925
},
{
"epoch": 149.5,
"learning_rate": 1.5856962025316456e-05,
"loss": 0.0,
"step": 14950
},
{
"epoch": 149.75,
"learning_rate": 1.584113924050633e-05,
"loss": 0.0,
"step": 14975
},
{
"epoch": 150.0,
"learning_rate": 1.5825316455696203e-05,
"loss": 0.0,
"step": 15000
},
{
"epoch": 150.0,
"eval_loss": 0.4805411398410797,
"eval_runtime": 160.7538,
"eval_samples_per_second": 79.264,
"eval_steps_per_second": 1.244,
"eval_wer": 16.43934656870408,
"step": 15000
},
{
"epoch": 150.25,
"learning_rate": 1.580949367088608e-05,
"loss": 0.0,
"step": 15025
},
{
"epoch": 150.5,
"learning_rate": 1.579367088607595e-05,
"loss": 0.0,
"step": 15050
},
{
"epoch": 150.75,
"learning_rate": 1.5777848101265822e-05,
"loss": 0.0,
"step": 15075
},
{
"epoch": 151.0,
"learning_rate": 1.5762025316455698e-05,
"loss": 0.0,
"step": 15100
},
{
"epoch": 151.25,
"learning_rate": 1.574620253164557e-05,
"loss": 0.0,
"step": 15125
},
{
"epoch": 151.5,
"learning_rate": 1.5730379746835445e-05,
"loss": 0.0,
"step": 15150
},
{
"epoch": 151.75,
"learning_rate": 1.5714556962025317e-05,
"loss": 0.0,
"step": 15175
},
{
"epoch": 152.0,
"learning_rate": 1.5698734177215192e-05,
"loss": 0.0,
"step": 15200
},
{
"epoch": 152.25,
"learning_rate": 1.5682911392405064e-05,
"loss": 0.0,
"step": 15225
},
{
"epoch": 152.5,
"learning_rate": 1.5667088607594936e-05,
"loss": 0.0,
"step": 15250
},
{
"epoch": 152.75,
"learning_rate": 1.565126582278481e-05,
"loss": 0.0,
"step": 15275
},
{
"epoch": 153.0,
"learning_rate": 1.5635443037974683e-05,
"loss": 0.0,
"step": 15300
},
{
"epoch": 153.25,
"learning_rate": 1.5619620253164558e-05,
"loss": 0.0,
"step": 15325
},
{
"epoch": 153.5,
"learning_rate": 1.560379746835443e-05,
"loss": 0.0,
"step": 15350
},
{
"epoch": 153.75,
"learning_rate": 1.5587974683544305e-05,
"loss": 0.0,
"step": 15375
},
{
"epoch": 154.0,
"learning_rate": 1.5572151898734177e-05,
"loss": 0.0,
"step": 15400
},
{
"epoch": 154.25,
"learning_rate": 1.5556329113924052e-05,
"loss": 0.0,
"step": 15425
},
{
"epoch": 154.5,
"learning_rate": 1.5540506329113924e-05,
"loss": 0.0,
"step": 15450
},
{
"epoch": 154.75,
"learning_rate": 1.5524683544303796e-05,
"loss": 0.0,
"step": 15475
},
{
"epoch": 155.0,
"learning_rate": 1.550886075949367e-05,
"loss": 0.0,
"step": 15500
},
{
"epoch": 155.25,
"learning_rate": 1.5493037974683543e-05,
"loss": 0.0,
"step": 15525
},
{
"epoch": 155.5,
"learning_rate": 1.547721518987342e-05,
"loss": 0.0,
"step": 15550
},
{
"epoch": 155.75,
"learning_rate": 1.546139240506329e-05,
"loss": 0.0,
"step": 15575
},
{
"epoch": 156.0,
"learning_rate": 1.5445569620253166e-05,
"loss": 0.0,
"step": 15600
},
{
"epoch": 156.25,
"learning_rate": 1.5429746835443038e-05,
"loss": 0.0,
"step": 15625
},
{
"epoch": 156.5,
"learning_rate": 1.541392405063291e-05,
"loss": 0.0,
"step": 15650
},
{
"epoch": 156.75,
"learning_rate": 1.5398101265822788e-05,
"loss": 0.0,
"step": 15675
},
{
"epoch": 157.0,
"learning_rate": 1.538227848101266e-05,
"loss": 0.0,
"step": 15700
},
{
"epoch": 157.25,
"learning_rate": 1.5366455696202532e-05,
"loss": 0.0,
"step": 15725
},
{
"epoch": 157.5,
"learning_rate": 1.5350632911392407e-05,
"loss": 0.0,
"step": 15750
},
{
"epoch": 157.75,
"learning_rate": 1.533481012658228e-05,
"loss": 0.0,
"step": 15775
},
{
"epoch": 158.0,
"learning_rate": 1.5318987341772154e-05,
"loss": 0.0,
"step": 15800
},
{
"epoch": 158.25,
"learning_rate": 1.5303164556962026e-05,
"loss": 0.0,
"step": 15825
},
{
"epoch": 158.5,
"learning_rate": 1.52873417721519e-05,
"loss": 0.0,
"step": 15850
},
{
"epoch": 158.75,
"learning_rate": 1.5271518987341773e-05,
"loss": 0.0,
"step": 15875
},
{
"epoch": 159.0,
"learning_rate": 1.5255696202531647e-05,
"loss": 0.0,
"step": 15900
},
{
"epoch": 159.25,
"learning_rate": 1.523987341772152e-05,
"loss": 0.0,
"step": 15925
},
{
"epoch": 159.5,
"learning_rate": 1.5224050632911394e-05,
"loss": 0.0,
"step": 15950
},
{
"epoch": 159.75,
"learning_rate": 1.5208227848101268e-05,
"loss": 0.0,
"step": 15975
},
{
"epoch": 160.0,
"learning_rate": 1.519240506329114e-05,
"loss": 0.0,
"step": 16000
},
{
"epoch": 160.0,
"eval_loss": 0.49637511372566223,
"eval_runtime": 159.1982,
"eval_samples_per_second": 80.039,
"eval_steps_per_second": 1.256,
"eval_wer": 16.494059715491638,
"step": 16000
},
{
"epoch": 160.25,
"learning_rate": 1.5176582278481013e-05,
"loss": 0.0,
"step": 16025
},
{
"epoch": 160.5,
"learning_rate": 1.5160759493670887e-05,
"loss": 0.0,
"step": 16050
},
{
"epoch": 160.75,
"learning_rate": 1.514493670886076e-05,
"loss": 0.0,
"step": 16075
},
{
"epoch": 161.0,
"learning_rate": 1.5129113924050634e-05,
"loss": 0.0,
"step": 16100
},
{
"epoch": 161.25,
"learning_rate": 1.5113291139240507e-05,
"loss": 0.0,
"step": 16125
},
{
"epoch": 161.5,
"learning_rate": 1.5097468354430381e-05,
"loss": 0.0,
"step": 16150
},
{
"epoch": 161.75,
"learning_rate": 1.5081645569620253e-05,
"loss": 0.0,
"step": 16175
},
{
"epoch": 162.0,
"learning_rate": 1.5065822784810126e-05,
"loss": 0.0,
"step": 16200
},
{
"epoch": 162.25,
"learning_rate": 1.505e-05,
"loss": 0.0,
"step": 16225
},
{
"epoch": 162.5,
"learning_rate": 1.5034177215189873e-05,
"loss": 0.0,
"step": 16250
},
{
"epoch": 162.75,
"learning_rate": 1.5018354430379747e-05,
"loss": 0.0,
"step": 16275
},
{
"epoch": 163.0,
"learning_rate": 1.500253164556962e-05,
"loss": 0.0,
"step": 16300
},
{
"epoch": 163.25,
"learning_rate": 1.4986708860759494e-05,
"loss": 0.0,
"step": 16325
},
{
"epoch": 163.5,
"learning_rate": 1.4970886075949366e-05,
"loss": 0.0,
"step": 16350
},
{
"epoch": 163.75,
"learning_rate": 1.495506329113924e-05,
"loss": 0.0,
"step": 16375
},
{
"epoch": 164.0,
"learning_rate": 1.4939240506329113e-05,
"loss": 0.0,
"step": 16400
},
{
"epoch": 164.25,
"learning_rate": 1.4923417721518987e-05,
"loss": 0.0,
"step": 16425
},
{
"epoch": 164.5,
"learning_rate": 1.490759493670886e-05,
"loss": 0.0,
"step": 16450
},
{
"epoch": 164.75,
"learning_rate": 1.4891772151898734e-05,
"loss": 0.0,
"step": 16475
},
{
"epoch": 165.0,
"learning_rate": 1.487594936708861e-05,
"loss": 0.0,
"step": 16500
},
{
"epoch": 165.25,
"learning_rate": 1.4860126582278483e-05,
"loss": 0.0,
"step": 16525
},
{
"epoch": 165.5,
"learning_rate": 1.4844303797468356e-05,
"loss": 0.0,
"step": 16550
},
{
"epoch": 165.75,
"learning_rate": 1.482848101265823e-05,
"loss": 0.0,
"step": 16575
},
{
"epoch": 166.0,
"learning_rate": 1.4812658227848103e-05,
"loss": 0.0,
"step": 16600
},
{
"epoch": 166.25,
"learning_rate": 1.4796835443037977e-05,
"loss": 0.0,
"step": 16625
},
{
"epoch": 166.5,
"learning_rate": 1.4781012658227849e-05,
"loss": 0.0,
"step": 16650
},
{
"epoch": 166.75,
"learning_rate": 1.4765189873417722e-05,
"loss": 0.0,
"step": 16675
},
{
"epoch": 167.0,
"learning_rate": 1.4749367088607596e-05,
"loss": 0.0,
"step": 16700
},
{
"epoch": 167.25,
"learning_rate": 1.473354430379747e-05,
"loss": 0.0,
"step": 16725
},
{
"epoch": 167.5,
"learning_rate": 1.4717721518987343e-05,
"loss": 0.0,
"step": 16750
},
{
"epoch": 167.75,
"learning_rate": 1.4701898734177217e-05,
"loss": 0.0,
"step": 16775
},
{
"epoch": 168.0,
"learning_rate": 1.468607594936709e-05,
"loss": 0.0,
"step": 16800
},
{
"epoch": 168.25,
"learning_rate": 1.4670253164556962e-05,
"loss": 0.0,
"step": 16825
},
{
"epoch": 168.5,
"learning_rate": 1.4654430379746836e-05,
"loss": 0.0,
"step": 16850
},
{
"epoch": 168.75,
"learning_rate": 1.463860759493671e-05,
"loss": 0.0,
"step": 16875
},
{
"epoch": 169.0,
"learning_rate": 1.4622784810126583e-05,
"loss": 0.0,
"step": 16900
},
{
"epoch": 169.25,
"learning_rate": 1.4606962025316456e-05,
"loss": 0.0,
"step": 16925
},
{
"epoch": 169.5,
"learning_rate": 1.459113924050633e-05,
"loss": 0.0,
"step": 16950
},
{
"epoch": 169.75,
"learning_rate": 1.4575316455696204e-05,
"loss": 0.0,
"step": 16975
},
{
"epoch": 170.0,
"learning_rate": 1.4559493670886075e-05,
"loss": 0.0,
"step": 17000
},
{
"epoch": 170.0,
"eval_loss": 0.5127857327461243,
"eval_runtime": 157.5862,
"eval_samples_per_second": 80.857,
"eval_steps_per_second": 1.269,
"eval_wer": 16.510669063623574,
"step": 17000
},
{
"epoch": 170.25,
"learning_rate": 1.4543670886075949e-05,
"loss": 0.0,
"step": 17025
},
{
"epoch": 170.5,
"learning_rate": 1.4527848101265823e-05,
"loss": 0.0,
"step": 17050
},
{
"epoch": 170.75,
"learning_rate": 1.4512025316455696e-05,
"loss": 0.0,
"step": 17075
},
{
"epoch": 171.0,
"learning_rate": 1.449620253164557e-05,
"loss": 0.0,
"step": 17100
},
{
"epoch": 171.25,
"learning_rate": 1.4480379746835443e-05,
"loss": 0.0,
"step": 17125
},
{
"epoch": 171.5,
"learning_rate": 1.4464556962025317e-05,
"loss": 0.0,
"step": 17150
},
{
"epoch": 171.75,
"learning_rate": 1.444873417721519e-05,
"loss": 0.0,
"step": 17175
},
{
"epoch": 172.0,
"learning_rate": 1.4432911392405062e-05,
"loss": 0.0,
"step": 17200
},
{
"epoch": 172.25,
"learning_rate": 1.4417088607594936e-05,
"loss": 0.0,
"step": 17225
},
{
"epoch": 172.5,
"learning_rate": 1.440126582278481e-05,
"loss": 0.0,
"step": 17250
},
{
"epoch": 172.75,
"learning_rate": 1.4385443037974683e-05,
"loss": 0.0,
"step": 17275
},
{
"epoch": 173.0,
"learning_rate": 1.4369620253164557e-05,
"loss": 0.0,
"step": 17300
},
{
"epoch": 173.25,
"learning_rate": 1.4353797468354432e-05,
"loss": 0.0,
"step": 17325
},
{
"epoch": 173.5,
"learning_rate": 1.4337974683544305e-05,
"loss": 0.0,
"step": 17350
},
{
"epoch": 173.75,
"learning_rate": 1.4322151898734179e-05,
"loss": 0.0,
"step": 17375
},
{
"epoch": 174.0,
"learning_rate": 1.4306329113924053e-05,
"loss": 0.0,
"step": 17400
},
{
"epoch": 174.25,
"learning_rate": 1.4290506329113926e-05,
"loss": 0.0,
"step": 17425
},
{
"epoch": 174.5,
"learning_rate": 1.42746835443038e-05,
"loss": 0.0,
"step": 17450
},
{
"epoch": 174.75,
"learning_rate": 1.4258860759493672e-05,
"loss": 0.0,
"step": 17475
},
{
"epoch": 175.0,
"learning_rate": 1.4243037974683545e-05,
"loss": 0.0,
"step": 17500
},
{
"epoch": 175.25,
"learning_rate": 1.4227215189873419e-05,
"loss": 0.0,
"step": 17525
},
{
"epoch": 175.5,
"learning_rate": 1.4211392405063292e-05,
"loss": 0.0,
"step": 17550
},
{
"epoch": 175.75,
"learning_rate": 1.4195569620253166e-05,
"loss": 0.0,
"step": 17575
},
{
"epoch": 176.0,
"learning_rate": 1.417974683544304e-05,
"loss": 0.0,
"step": 17600
},
{
"epoch": 176.25,
"learning_rate": 1.4163924050632913e-05,
"loss": 0.0,
"step": 17625
},
{
"epoch": 176.5,
"learning_rate": 1.4148101265822785e-05,
"loss": 0.0,
"step": 17650
},
{
"epoch": 176.75,
"learning_rate": 1.4132278481012658e-05,
"loss": 0.0,
"step": 17675
},
{
"epoch": 177.0,
"learning_rate": 1.4116455696202532e-05,
"loss": 0.0,
"step": 17700
},
{
"epoch": 177.25,
"learning_rate": 1.4100632911392406e-05,
"loss": 0.0,
"step": 17725
},
{
"epoch": 177.5,
"learning_rate": 1.408481012658228e-05,
"loss": 0.0,
"step": 17750
},
{
"epoch": 177.75,
"learning_rate": 1.4068987341772153e-05,
"loss": 0.0,
"step": 17775
},
{
"epoch": 178.0,
"learning_rate": 1.4053164556962026e-05,
"loss": 0.0,
"step": 17800
},
{
"epoch": 178.25,
"learning_rate": 1.40373417721519e-05,
"loss": 0.0,
"step": 17825
},
{
"epoch": 178.5,
"learning_rate": 1.4021518987341772e-05,
"loss": 0.0,
"step": 17850
},
{
"epoch": 178.75,
"learning_rate": 1.4005696202531645e-05,
"loss": 0.0,
"step": 17875
},
{
"epoch": 179.0,
"learning_rate": 1.3989873417721519e-05,
"loss": 0.0,
"step": 17900
},
{
"epoch": 179.25,
"learning_rate": 1.3974050632911392e-05,
"loss": 0.0,
"step": 17925
},
{
"epoch": 179.5,
"learning_rate": 1.3958227848101266e-05,
"loss": 0.0,
"step": 17950
},
{
"epoch": 179.75,
"learning_rate": 1.394240506329114e-05,
"loss": 0.0,
"step": 17975
},
{
"epoch": 180.0,
"learning_rate": 1.3926582278481013e-05,
"loss": 0.0,
"step": 18000
},
{
"epoch": 180.0,
"eval_loss": 0.5284730792045593,
"eval_runtime": 160.4225,
"eval_samples_per_second": 79.428,
"eval_steps_per_second": 1.247,
"eval_wer": 16.637681725808974,
"step": 18000
},
{
"epoch": 180.25,
"learning_rate": 1.3910759493670885e-05,
"loss": 0.0,
"step": 18025
},
{
"epoch": 180.5,
"learning_rate": 1.3894936708860759e-05,
"loss": 0.0,
"step": 18050
},
{
"epoch": 180.75,
"learning_rate": 1.3879113924050632e-05,
"loss": 0.0,
"step": 18075
},
{
"epoch": 181.0,
"learning_rate": 1.3863291139240506e-05,
"loss": 0.0,
"step": 18100
},
{
"epoch": 181.25,
"learning_rate": 1.384746835443038e-05,
"loss": 0.0,
"step": 18125
},
{
"epoch": 181.5,
"learning_rate": 1.3831645569620255e-05,
"loss": 0.0,
"step": 18150
},
{
"epoch": 181.75,
"learning_rate": 1.3815822784810128e-05,
"loss": 0.0,
"step": 18175
},
{
"epoch": 182.0,
"learning_rate": 1.3800000000000002e-05,
"loss": 0.0,
"step": 18200
},
{
"epoch": 182.25,
"learning_rate": 1.3784177215189875e-05,
"loss": 0.0,
"step": 18225
},
{
"epoch": 182.5,
"learning_rate": 1.3768987341772152e-05,
"loss": 0.0,
"step": 18250
},
{
"epoch": 182.75,
"learning_rate": 1.3753164556962026e-05,
"loss": 0.0,
"step": 18275
},
{
"epoch": 183.0,
"learning_rate": 1.37373417721519e-05,
"loss": 0.0,
"step": 18300
},
{
"epoch": 183.25,
"learning_rate": 1.3721518987341773e-05,
"loss": 0.0,
"step": 18325
},
{
"epoch": 183.5,
"learning_rate": 1.3705696202531645e-05,
"loss": 0.0,
"step": 18350
},
{
"epoch": 183.75,
"learning_rate": 1.3689873417721518e-05,
"loss": 0.0,
"step": 18375
},
{
"epoch": 184.0,
"learning_rate": 1.3674050632911392e-05,
"loss": 0.0,
"step": 18400
},
{
"epoch": 184.25,
"learning_rate": 1.3658227848101265e-05,
"loss": 0.0,
"step": 18425
},
{
"epoch": 184.5,
"learning_rate": 1.3642405063291139e-05,
"loss": 0.0,
"step": 18450
},
{
"epoch": 184.75,
"learning_rate": 1.3626582278481013e-05,
"loss": 0.0,
"step": 18475
},
{
"epoch": 185.0,
"learning_rate": 1.3610759493670886e-05,
"loss": 0.0,
"step": 18500
},
{
"epoch": 185.25,
"learning_rate": 1.3594936708860758e-05,
"loss": 0.0,
"step": 18525
},
{
"epoch": 185.5,
"learning_rate": 1.3579113924050635e-05,
"loss": 0.0,
"step": 18550
},
{
"epoch": 185.75,
"learning_rate": 1.3563291139240509e-05,
"loss": 0.0,
"step": 18575
},
{
"epoch": 186.0,
"learning_rate": 1.3547468354430382e-05,
"loss": 0.0,
"step": 18600
},
{
"epoch": 186.25,
"learning_rate": 1.3531645569620254e-05,
"loss": 0.0,
"step": 18625
},
{
"epoch": 186.5,
"learning_rate": 1.3515822784810128e-05,
"loss": 0.0,
"step": 18650
},
{
"epoch": 186.75,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0,
"step": 18675
},
{
"epoch": 187.0,
"learning_rate": 1.3484177215189875e-05,
"loss": 0.0,
"step": 18700
},
{
"epoch": 187.25,
"learning_rate": 1.3468354430379748e-05,
"loss": 0.0,
"step": 18725
},
{
"epoch": 187.5,
"learning_rate": 1.3452531645569622e-05,
"loss": 0.0,
"step": 18750
},
{
"epoch": 187.75,
"learning_rate": 1.3436708860759495e-05,
"loss": 0.0,
"step": 18775
},
{
"epoch": 188.0,
"learning_rate": 1.3420886075949369e-05,
"loss": 0.0,
"step": 18800
},
{
"epoch": 188.25,
"learning_rate": 1.3405063291139241e-05,
"loss": 0.0,
"step": 18825
},
{
"epoch": 188.5,
"learning_rate": 1.3389240506329114e-05,
"loss": 0.0,
"step": 18850
},
{
"epoch": 188.75,
"learning_rate": 1.3373417721518988e-05,
"loss": 0.0,
"step": 18875
},
{
"epoch": 189.0,
"learning_rate": 1.3357594936708862e-05,
"loss": 0.0,
"step": 18900
},
{
"epoch": 189.25,
"learning_rate": 1.3341772151898735e-05,
"loss": 0.0,
"step": 18925
},
{
"epoch": 189.5,
"learning_rate": 1.3325949367088609e-05,
"loss": 0.0,
"step": 18950
},
{
"epoch": 189.75,
"learning_rate": 1.3310126582278482e-05,
"loss": 0.0,
"step": 18975
},
{
"epoch": 190.0,
"learning_rate": 1.3294303797468354e-05,
"loss": 0.0,
"step": 19000
},
{
"epoch": 190.0,
"eval_loss": 0.5456529259681702,
"eval_runtime": 157.826,
"eval_samples_per_second": 80.734,
"eval_steps_per_second": 1.267,
"eval_wer": 16.657222135375957,
"step": 19000
},
{
"epoch": 190.25,
"learning_rate": 1.3278481012658228e-05,
"loss": 0.0,
"step": 19025
},
{
"epoch": 190.5,
"learning_rate": 1.3262658227848101e-05,
"loss": 0.0,
"step": 19050
},
{
"epoch": 190.75,
"learning_rate": 1.3246835443037975e-05,
"loss": 0.0,
"step": 19075
},
{
"epoch": 191.0,
"learning_rate": 1.3231012658227848e-05,
"loss": 0.0,
"step": 19100
},
{
"epoch": 191.25,
"learning_rate": 1.3215189873417722e-05,
"loss": 0.0,
"step": 19125
},
{
"epoch": 191.5,
"learning_rate": 1.3199367088607596e-05,
"loss": 0.0,
"step": 19150
},
{
"epoch": 191.75,
"learning_rate": 1.3183544303797467e-05,
"loss": 0.0,
"step": 19175
},
{
"epoch": 192.0,
"learning_rate": 1.3167721518987341e-05,
"loss": 0.0,
"step": 19200
},
{
"epoch": 192.25,
"learning_rate": 1.3151898734177215e-05,
"loss": 0.0,
"step": 19225
},
{
"epoch": 192.5,
"learning_rate": 1.3136075949367088e-05,
"loss": 0.0,
"step": 19250
},
{
"epoch": 192.75,
"learning_rate": 1.3120253164556962e-05,
"loss": 0.0,
"step": 19275
},
{
"epoch": 193.0,
"learning_rate": 1.3104430379746835e-05,
"loss": 0.0,
"step": 19300
},
{
"epoch": 193.25,
"learning_rate": 1.3088607594936709e-05,
"loss": 0.0,
"step": 19325
},
{
"epoch": 193.5,
"learning_rate": 1.3072784810126584e-05,
"loss": 0.0,
"step": 19350
},
{
"epoch": 193.75,
"learning_rate": 1.3056962025316458e-05,
"loss": 0.0,
"step": 19375
},
{
"epoch": 194.0,
"learning_rate": 1.3041139240506331e-05,
"loss": 0.0,
"step": 19400
},
{
"epoch": 194.25,
"learning_rate": 1.3025316455696205e-05,
"loss": 0.0,
"step": 19425
},
{
"epoch": 194.5,
"learning_rate": 1.3009493670886078e-05,
"loss": 0.0,
"step": 19450
},
{
"epoch": 194.75,
"learning_rate": 1.299367088607595e-05,
"loss": 0.0,
"step": 19475
},
{
"epoch": 195.0,
"learning_rate": 1.2977848101265824e-05,
"loss": 0.0,
"step": 19500
},
{
"epoch": 195.25,
"learning_rate": 1.2962025316455697e-05,
"loss": 0.0,
"step": 19525
},
{
"epoch": 195.5,
"learning_rate": 1.2946202531645571e-05,
"loss": 0.0,
"step": 19550
},
{
"epoch": 195.75,
"learning_rate": 1.2930379746835445e-05,
"loss": 0.0,
"step": 19575
},
{
"epoch": 196.0,
"learning_rate": 1.2914556962025318e-05,
"loss": 0.0,
"step": 19600
},
{
"epoch": 196.25,
"learning_rate": 1.2898734177215192e-05,
"loss": 0.0,
"step": 19625
},
{
"epoch": 196.5,
"learning_rate": 1.2882911392405064e-05,
"loss": 0.0,
"step": 19650
},
{
"epoch": 196.75,
"learning_rate": 1.2867088607594937e-05,
"loss": 0.0,
"step": 19675
},
{
"epoch": 197.0,
"learning_rate": 1.285126582278481e-05,
"loss": 0.0,
"step": 19700
},
{
"epoch": 197.25,
"learning_rate": 1.2835443037974684e-05,
"loss": 0.0,
"step": 19725
},
{
"epoch": 197.5,
"learning_rate": 1.2819620253164558e-05,
"loss": 0.0,
"step": 19750
},
{
"epoch": 197.75,
"learning_rate": 1.2803797468354431e-05,
"loss": 0.0,
"step": 19775
},
{
"epoch": 198.0,
"learning_rate": 1.2787974683544305e-05,
"loss": 0.0,
"step": 19800
},
{
"epoch": 198.25,
"learning_rate": 1.2772151898734177e-05,
"loss": 0.0,
"step": 19825
},
{
"epoch": 198.5,
"learning_rate": 1.275632911392405e-05,
"loss": 0.0,
"step": 19850
},
{
"epoch": 198.75,
"learning_rate": 1.2740506329113924e-05,
"loss": 0.0,
"step": 19875
},
{
"epoch": 199.0,
"learning_rate": 1.2724683544303798e-05,
"loss": 0.0,
"step": 19900
},
{
"epoch": 199.25,
"learning_rate": 1.2711392405063291e-05,
"loss": 0.0184,
"step": 19925
},
{
"epoch": 199.5,
"learning_rate": 1.2695569620253165e-05,
"loss": 0.0165,
"step": 19950
},
{
"epoch": 199.75,
"learning_rate": 1.2679746835443037e-05,
"loss": 0.0147,
"step": 19975
},
{
"epoch": 200.0,
"learning_rate": 1.266392405063291e-05,
"loss": 0.0102,
"step": 20000
},
{
"epoch": 200.0,
"eval_loss": 0.4229086935520172,
"eval_runtime": 160.3396,
"eval_samples_per_second": 79.469,
"eval_steps_per_second": 1.247,
"eval_wer": 18.19016726590589,
"step": 20000
},
{
"epoch": 200.25,
"learning_rate": 1.2648101265822784e-05,
"loss": 0.0075,
"step": 20025
},
{
"epoch": 200.5,
"learning_rate": 1.2632278481012658e-05,
"loss": 0.0064,
"step": 20050
},
{
"epoch": 200.75,
"learning_rate": 1.2616455696202531e-05,
"loss": 0.0052,
"step": 20075
},
{
"epoch": 201.0,
"learning_rate": 1.2600632911392405e-05,
"loss": 0.0047,
"step": 20100
},
{
"epoch": 201.25,
"learning_rate": 1.258481012658228e-05,
"loss": 0.002,
"step": 20125
},
{
"epoch": 201.5,
"learning_rate": 1.2568987341772154e-05,
"loss": 0.0016,
"step": 20150
},
{
"epoch": 201.75,
"learning_rate": 1.2553164556962027e-05,
"loss": 0.0018,
"step": 20175
},
{
"epoch": 202.0,
"learning_rate": 1.25373417721519e-05,
"loss": 0.0014,
"step": 20200
},
{
"epoch": 202.25,
"learning_rate": 1.2521518987341774e-05,
"loss": 0.0006,
"step": 20225
},
{
"epoch": 202.5,
"learning_rate": 1.2505696202531648e-05,
"loss": 0.0008,
"step": 20250
},
{
"epoch": 202.75,
"learning_rate": 1.248987341772152e-05,
"loss": 0.0003,
"step": 20275
},
{
"epoch": 203.0,
"learning_rate": 1.2474050632911392e-05,
"loss": 0.0003,
"step": 20300
},
{
"epoch": 203.25,
"learning_rate": 1.2458227848101267e-05,
"loss": 0.0002,
"step": 20325
},
{
"epoch": 203.5,
"learning_rate": 1.244240506329114e-05,
"loss": 0.0002,
"step": 20350
},
{
"epoch": 203.75,
"learning_rate": 1.2426582278481014e-05,
"loss": 0.0002,
"step": 20375
},
{
"epoch": 204.0,
"learning_rate": 1.2410759493670888e-05,
"loss": 0.0001,
"step": 20400
},
{
"epoch": 204.25,
"learning_rate": 1.2394936708860761e-05,
"loss": 0.0001,
"step": 20425
},
{
"epoch": 204.5,
"learning_rate": 1.2379113924050633e-05,
"loss": 0.0002,
"step": 20450
},
{
"epoch": 204.75,
"learning_rate": 1.2363291139240507e-05,
"loss": 0.0001,
"step": 20475
},
{
"epoch": 205.0,
"learning_rate": 1.234746835443038e-05,
"loss": 0.0001,
"step": 20500
},
{
"epoch": 205.25,
"learning_rate": 1.2331645569620254e-05,
"loss": 0.0001,
"step": 20525
},
{
"epoch": 205.5,
"learning_rate": 1.2315822784810127e-05,
"loss": 0.0001,
"step": 20550
},
{
"epoch": 205.75,
"learning_rate": 1.23e-05,
"loss": 0.0001,
"step": 20575
},
{
"epoch": 206.0,
"learning_rate": 1.2284177215189874e-05,
"loss": 0.0001,
"step": 20600
},
{
"epoch": 206.25,
"learning_rate": 1.2268354430379746e-05,
"loss": 0.0001,
"step": 20625
},
{
"epoch": 206.5,
"learning_rate": 1.225253164556962e-05,
"loss": 0.0001,
"step": 20650
},
{
"epoch": 206.75,
"learning_rate": 1.2236708860759493e-05,
"loss": 0.0,
"step": 20675
},
{
"epoch": 207.0,
"learning_rate": 1.2220886075949367e-05,
"loss": 0.0,
"step": 20700
},
{
"epoch": 207.25,
"learning_rate": 1.220506329113924e-05,
"loss": 0.0,
"step": 20725
},
{
"epoch": 207.5,
"learning_rate": 1.2189240506329116e-05,
"loss": 0.0,
"step": 20750
},
{
"epoch": 207.75,
"learning_rate": 1.2173417721518988e-05,
"loss": 0.0,
"step": 20775
},
{
"epoch": 208.0,
"learning_rate": 1.2157594936708861e-05,
"loss": 0.0,
"step": 20800
},
{
"epoch": 208.25,
"learning_rate": 1.2141772151898735e-05,
"loss": 0.0,
"step": 20825
},
{
"epoch": 208.5,
"learning_rate": 1.2125949367088608e-05,
"loss": 0.0,
"step": 20850
},
{
"epoch": 208.75,
"learning_rate": 1.2110126582278482e-05,
"loss": 0.0,
"step": 20875
},
{
"epoch": 209.0,
"learning_rate": 1.2094303797468356e-05,
"loss": 0.0,
"step": 20900
},
{
"epoch": 209.25,
"learning_rate": 1.2078481012658229e-05,
"loss": 0.0,
"step": 20925
},
{
"epoch": 209.5,
"learning_rate": 1.2062658227848101e-05,
"loss": 0.0,
"step": 20950
},
{
"epoch": 209.75,
"learning_rate": 1.2046835443037975e-05,
"loss": 0.0,
"step": 20975
},
{
"epoch": 210.0,
"learning_rate": 1.2031012658227848e-05,
"loss": 0.0,
"step": 21000
},
{
"epoch": 210.0,
"eval_loss": 0.4498037099838257,
"eval_runtime": 159.2513,
"eval_samples_per_second": 80.012,
"eval_steps_per_second": 1.256,
"eval_wer": 16.21170079724871,
"step": 21000
},
{
"epoch": 210.25,
"learning_rate": 1.2015189873417722e-05,
"loss": 0.0,
"step": 21025
},
{
"epoch": 210.5,
"learning_rate": 1.1999367088607595e-05,
"loss": 0.0,
"step": 21050
},
{
"epoch": 210.75,
"learning_rate": 1.1983544303797469e-05,
"loss": 0.0,
"step": 21075
},
{
"epoch": 211.0,
"learning_rate": 1.1967721518987342e-05,
"loss": 0.0,
"step": 21100
},
{
"epoch": 211.25,
"learning_rate": 1.1951898734177216e-05,
"loss": 0.0,
"step": 21125
},
{
"epoch": 211.5,
"learning_rate": 1.193607594936709e-05,
"loss": 0.0,
"step": 21150
},
{
"epoch": 211.75,
"learning_rate": 1.1920253164556963e-05,
"loss": 0.0,
"step": 21175
},
{
"epoch": 212.0,
"learning_rate": 1.1904430379746837e-05,
"loss": 0.0001,
"step": 21200
},
{
"epoch": 212.25,
"learning_rate": 1.188860759493671e-05,
"loss": 0.0,
"step": 21225
},
{
"epoch": 212.5,
"learning_rate": 1.1872784810126584e-05,
"loss": 0.0,
"step": 21250
},
{
"epoch": 212.75,
"learning_rate": 1.1856962025316456e-05,
"loss": 0.0,
"step": 21275
},
{
"epoch": 213.0,
"learning_rate": 1.184113924050633e-05,
"loss": 0.0,
"step": 21300
},
{
"epoch": 213.25,
"learning_rate": 1.1825316455696203e-05,
"loss": 0.0,
"step": 21325
},
{
"epoch": 213.5,
"learning_rate": 1.1809493670886076e-05,
"loss": 0.0,
"step": 21350
},
{
"epoch": 213.75,
"learning_rate": 1.179367088607595e-05,
"loss": 0.0,
"step": 21375
},
{
"epoch": 214.0,
"learning_rate": 1.1777848101265824e-05,
"loss": 0.0,
"step": 21400
},
{
"epoch": 214.25,
"learning_rate": 1.1762025316455697e-05,
"loss": 0.0,
"step": 21425
},
{
"epoch": 214.5,
"learning_rate": 1.174620253164557e-05,
"loss": 0.0,
"step": 21450
},
{
"epoch": 214.75,
"learning_rate": 1.1730379746835443e-05,
"loss": 0.0,
"step": 21475
},
{
"epoch": 215.0,
"learning_rate": 1.1714556962025316e-05,
"loss": 0.0,
"step": 21500
},
{
"epoch": 215.25,
"learning_rate": 1.169873417721519e-05,
"loss": 0.0,
"step": 21525
},
{
"epoch": 215.5,
"learning_rate": 1.1682911392405063e-05,
"loss": 0.0,
"step": 21550
},
{
"epoch": 215.75,
"learning_rate": 1.1667088607594939e-05,
"loss": 0.0,
"step": 21575
},
{
"epoch": 216.0,
"learning_rate": 1.165126582278481e-05,
"loss": 0.0,
"step": 21600
},
{
"epoch": 216.25,
"learning_rate": 1.1635443037974684e-05,
"loss": 0.0,
"step": 21625
},
{
"epoch": 216.5,
"learning_rate": 1.1619620253164558e-05,
"loss": 0.0,
"step": 21650
},
{
"epoch": 216.75,
"learning_rate": 1.1603797468354431e-05,
"loss": 0.0,
"step": 21675
},
{
"epoch": 217.0,
"learning_rate": 1.1587974683544305e-05,
"loss": 0.0,
"step": 21700
},
{
"epoch": 217.25,
"learning_rate": 1.1572151898734178e-05,
"loss": 0.0,
"step": 21725
},
{
"epoch": 217.5,
"learning_rate": 1.1556329113924052e-05,
"loss": 0.0,
"step": 21750
},
{
"epoch": 217.75,
"learning_rate": 1.1540506329113925e-05,
"loss": 0.0,
"step": 21775
},
{
"epoch": 218.0,
"learning_rate": 1.1524683544303797e-05,
"loss": 0.0,
"step": 21800
},
{
"epoch": 218.25,
"learning_rate": 1.150886075949367e-05,
"loss": 0.0,
"step": 21825
},
{
"epoch": 218.5,
"learning_rate": 1.1493037974683544e-05,
"loss": 0.0,
"step": 21850
},
{
"epoch": 218.75,
"learning_rate": 1.1477215189873418e-05,
"loss": 0.0,
"step": 21875
},
{
"epoch": 219.0,
"learning_rate": 1.1461392405063292e-05,
"loss": 0.0,
"step": 21900
},
{
"epoch": 219.25,
"learning_rate": 1.1445569620253165e-05,
"loss": 0.0,
"step": 21925
},
{
"epoch": 219.5,
"learning_rate": 1.1429746835443039e-05,
"loss": 0.0,
"step": 21950
},
{
"epoch": 219.75,
"learning_rate": 1.1413924050632912e-05,
"loss": 0.0,
"step": 21975
},
{
"epoch": 220.0,
"learning_rate": 1.1398101265822786e-05,
"loss": 0.0,
"step": 22000
},
{
"epoch": 220.0,
"eval_loss": 0.4645980894565582,
"eval_runtime": 159.2078,
"eval_samples_per_second": 80.034,
"eval_steps_per_second": 1.256,
"eval_wer": 16.21463185868376,
"step": 22000
},
{
"epoch": 220.25,
"learning_rate": 1.138227848101266e-05,
"loss": 0.0,
"step": 22025
},
{
"epoch": 220.5,
"learning_rate": 1.1366455696202533e-05,
"loss": 0.0,
"step": 22050
},
{
"epoch": 220.75,
"learning_rate": 1.1350632911392407e-05,
"loss": 0.0,
"step": 22075
},
{
"epoch": 221.0,
"learning_rate": 1.133481012658228e-05,
"loss": 0.0,
"step": 22100
},
{
"epoch": 221.25,
"learning_rate": 1.1318987341772152e-05,
"loss": 0.0,
"step": 22125
},
{
"epoch": 221.5,
"learning_rate": 1.1303164556962026e-05,
"loss": 0.0,
"step": 22150
},
{
"epoch": 221.75,
"learning_rate": 1.1287341772151899e-05,
"loss": 0.0,
"step": 22175
},
{
"epoch": 222.0,
"learning_rate": 1.1271518987341773e-05,
"loss": 0.0,
"step": 22200
},
{
"epoch": 222.25,
"learning_rate": 1.1255696202531646e-05,
"loss": 0.0,
"step": 22225
},
{
"epoch": 222.5,
"learning_rate": 1.123987341772152e-05,
"loss": 0.0,
"step": 22250
},
{
"epoch": 222.75,
"learning_rate": 1.1224050632911393e-05,
"loss": 0.0,
"step": 22275
},
{
"epoch": 223.0,
"learning_rate": 1.1208227848101265e-05,
"loss": 0.0,
"step": 22300
},
{
"epoch": 223.25,
"learning_rate": 1.1192405063291139e-05,
"loss": 0.0,
"step": 22325
},
{
"epoch": 223.5,
"learning_rate": 1.1176582278481012e-05,
"loss": 0.0,
"step": 22350
},
{
"epoch": 223.75,
"learning_rate": 1.1160759493670888e-05,
"loss": 0.0,
"step": 22375
},
{
"epoch": 224.0,
"learning_rate": 1.1144936708860761e-05,
"loss": 0.0,
"step": 22400
},
{
"epoch": 224.25,
"learning_rate": 1.1129113924050635e-05,
"loss": 0.0,
"step": 22425
},
{
"epoch": 224.5,
"learning_rate": 1.1113291139240507e-05,
"loss": 0.0,
"step": 22450
},
{
"epoch": 224.75,
"learning_rate": 1.109746835443038e-05,
"loss": 0.0,
"step": 22475
},
{
"epoch": 225.0,
"learning_rate": 1.1081645569620254e-05,
"loss": 0.0,
"step": 22500
},
{
"epoch": 225.25,
"learning_rate": 1.1065822784810127e-05,
"loss": 0.0,
"step": 22525
},
{
"epoch": 225.5,
"learning_rate": 1.1050000000000001e-05,
"loss": 0.0,
"step": 22550
},
{
"epoch": 225.75,
"learning_rate": 1.1034177215189874e-05,
"loss": 0.0,
"step": 22575
},
{
"epoch": 226.0,
"learning_rate": 1.1018354430379748e-05,
"loss": 0.0,
"step": 22600
},
{
"epoch": 226.25,
"learning_rate": 1.100253164556962e-05,
"loss": 0.0,
"step": 22625
},
{
"epoch": 226.5,
"learning_rate": 1.0986708860759494e-05,
"loss": 0.0,
"step": 22650
},
{
"epoch": 226.75,
"learning_rate": 1.0970886075949367e-05,
"loss": 0.0,
"step": 22675
},
{
"epoch": 227.0,
"learning_rate": 1.095506329113924e-05,
"loss": 0.0,
"step": 22700
},
{
"epoch": 227.25,
"learning_rate": 1.0939240506329114e-05,
"loss": 0.0,
"step": 22725
},
{
"epoch": 227.5,
"learning_rate": 1.0923417721518988e-05,
"loss": 0.0,
"step": 22750
},
{
"epoch": 227.75,
"learning_rate": 1.0907594936708861e-05,
"loss": 0.0,
"step": 22775
},
{
"epoch": 228.0,
"learning_rate": 1.0891772151898735e-05,
"loss": 0.0,
"step": 22800
},
{
"epoch": 228.25,
"learning_rate": 1.0875949367088608e-05,
"loss": 0.0,
"step": 22825
},
{
"epoch": 228.5,
"learning_rate": 1.0860126582278482e-05,
"loss": 0.0,
"step": 22850
},
{
"epoch": 228.75,
"learning_rate": 1.0844303797468356e-05,
"loss": 0.0,
"step": 22875
},
{
"epoch": 229.0,
"learning_rate": 1.082848101265823e-05,
"loss": 0.0,
"step": 22900
},
{
"epoch": 229.25,
"learning_rate": 1.0812658227848103e-05,
"loss": 0.0,
"step": 22925
},
{
"epoch": 229.5,
"learning_rate": 1.0796835443037975e-05,
"loss": 0.0,
"step": 22950
},
{
"epoch": 229.75,
"learning_rate": 1.0781012658227848e-05,
"loss": 0.0,
"step": 22975
},
{
"epoch": 230.0,
"learning_rate": 1.0765189873417722e-05,
"loss": 0.0,
"step": 23000
},
{
"epoch": 230.0,
"eval_loss": 0.4754066467285156,
"eval_runtime": 159.5663,
"eval_samples_per_second": 79.854,
"eval_steps_per_second": 1.253,
"eval_wer": 16.196068469595122,
"step": 23000
},
{
"epoch": 230.25,
"learning_rate": 1.0749367088607595e-05,
"loss": 0.0,
"step": 23025
},
{
"epoch": 230.5,
"learning_rate": 1.0733544303797469e-05,
"loss": 0.0,
"step": 23050
},
{
"epoch": 230.75,
"learning_rate": 1.0717721518987342e-05,
"loss": 0.0,
"step": 23075
},
{
"epoch": 231.0,
"learning_rate": 1.0701898734177216e-05,
"loss": 0.0,
"step": 23100
},
{
"epoch": 231.25,
"learning_rate": 1.0686075949367088e-05,
"loss": 0.0,
"step": 23125
},
{
"epoch": 231.5,
"learning_rate": 1.0670253164556962e-05,
"loss": 0.0,
"step": 23150
},
{
"epoch": 231.75,
"learning_rate": 1.0654430379746835e-05,
"loss": 0.0,
"step": 23175
},
{
"epoch": 232.0,
"learning_rate": 1.063860759493671e-05,
"loss": 0.0,
"step": 23200
},
{
"epoch": 232.25,
"learning_rate": 1.0622784810126584e-05,
"loss": 0.0,
"step": 23225
},
{
"epoch": 232.5,
"learning_rate": 1.0606962025316457e-05,
"loss": 0.0,
"step": 23250
},
{
"epoch": 232.75,
"learning_rate": 1.059113924050633e-05,
"loss": 0.0,
"step": 23275
},
{
"epoch": 233.0,
"learning_rate": 1.0575316455696203e-05,
"loss": 0.0,
"step": 23300
},
{
"epoch": 233.25,
"learning_rate": 1.0559493670886076e-05,
"loss": 0.0,
"step": 23325
},
{
"epoch": 233.5,
"learning_rate": 1.054367088607595e-05,
"loss": 0.0,
"step": 23350
},
{
"epoch": 233.75,
"learning_rate": 1.0527848101265824e-05,
"loss": 0.0,
"step": 23375
},
{
"epoch": 234.0,
"learning_rate": 1.0512025316455697e-05,
"loss": 0.0,
"step": 23400
},
{
"epoch": 234.25,
"learning_rate": 1.049620253164557e-05,
"loss": 0.0,
"step": 23425
},
{
"epoch": 234.5,
"learning_rate": 1.0480379746835443e-05,
"loss": 0.0,
"step": 23450
},
{
"epoch": 234.75,
"learning_rate": 1.0464556962025316e-05,
"loss": 0.0,
"step": 23475
},
{
"epoch": 235.0,
"learning_rate": 1.044873417721519e-05,
"loss": 0.0,
"step": 23500
},
{
"epoch": 235.25,
"learning_rate": 1.0432911392405063e-05,
"loss": 0.0,
"step": 23525
},
{
"epoch": 235.5,
"learning_rate": 1.0417088607594937e-05,
"loss": 0.0,
"step": 23550
},
{
"epoch": 235.75,
"learning_rate": 1.040126582278481e-05,
"loss": 0.0,
"step": 23575
},
{
"epoch": 236.0,
"learning_rate": 1.0385443037974684e-05,
"loss": 0.0,
"step": 23600
},
{
"epoch": 236.25,
"learning_rate": 1.0369620253164558e-05,
"loss": 0.0,
"step": 23625
},
{
"epoch": 236.5,
"learning_rate": 1.0353797468354431e-05,
"loss": 0.0,
"step": 23650
},
{
"epoch": 236.75,
"learning_rate": 1.0337974683544305e-05,
"loss": 0.0,
"step": 23675
},
{
"epoch": 237.0,
"learning_rate": 1.0322151898734178e-05,
"loss": 0.0,
"step": 23700
},
{
"epoch": 237.25,
"learning_rate": 1.0306329113924052e-05,
"loss": 0.0,
"step": 23725
},
{
"epoch": 237.5,
"learning_rate": 1.0290506329113925e-05,
"loss": 0.0,
"step": 23750
},
{
"epoch": 237.75,
"learning_rate": 1.0274683544303797e-05,
"loss": 0.0,
"step": 23775
},
{
"epoch": 238.0,
"learning_rate": 1.0258860759493671e-05,
"loss": 0.0,
"step": 23800
},
{
"epoch": 238.25,
"learning_rate": 1.0243037974683544e-05,
"loss": 0.0,
"step": 23825
},
{
"epoch": 238.5,
"learning_rate": 1.0227215189873418e-05,
"loss": 0.0,
"step": 23850
},
{
"epoch": 238.75,
"learning_rate": 1.0211392405063292e-05,
"loss": 0.0,
"step": 23875
},
{
"epoch": 239.0,
"learning_rate": 1.0195569620253165e-05,
"loss": 0.0,
"step": 23900
},
{
"epoch": 239.25,
"learning_rate": 1.0179746835443039e-05,
"loss": 0.0,
"step": 23925
},
{
"epoch": 239.5,
"learning_rate": 1.016392405063291e-05,
"loss": 0.0,
"step": 23950
},
{
"epoch": 239.75,
"learning_rate": 1.0148101265822784e-05,
"loss": 0.0,
"step": 23975
},
{
"epoch": 240.0,
"learning_rate": 1.0132278481012658e-05,
"loss": 0.0,
"step": 24000
},
{
"epoch": 240.0,
"eval_loss": 0.48526978492736816,
"eval_runtime": 158.4647,
"eval_samples_per_second": 80.409,
"eval_steps_per_second": 1.262,
"eval_wer": 16.18629826481163,
"step": 24000
},
{
"epoch": 240.25,
"learning_rate": 1.0116455696202533e-05,
"loss": 0.0,
"step": 24025
},
{
"epoch": 240.5,
"learning_rate": 1.0100632911392407e-05,
"loss": 0.0,
"step": 24050
},
{
"epoch": 240.75,
"learning_rate": 1.008481012658228e-05,
"loss": 0.0,
"step": 24075
},
{
"epoch": 241.0,
"learning_rate": 1.0068987341772152e-05,
"loss": 0.0,
"step": 24100
},
{
"epoch": 241.25,
"learning_rate": 1.0053164556962026e-05,
"loss": 0.0,
"step": 24125
},
{
"epoch": 241.5,
"learning_rate": 1.00373417721519e-05,
"loss": 0.0,
"step": 24150
},
{
"epoch": 241.75,
"learning_rate": 1.0021518987341773e-05,
"loss": 0.0,
"step": 24175
},
{
"epoch": 242.0,
"learning_rate": 1.0005696202531646e-05,
"loss": 0.0,
"step": 24200
},
{
"epoch": 242.25,
"learning_rate": 9.98987341772152e-06,
"loss": 0.0,
"step": 24225
},
{
"epoch": 242.5,
"learning_rate": 9.974050632911393e-06,
"loss": 0.0,
"step": 24250
},
{
"epoch": 242.75,
"learning_rate": 9.958227848101265e-06,
"loss": 0.0,
"step": 24275
},
{
"epoch": 243.0,
"learning_rate": 9.942405063291139e-06,
"loss": 0.0,
"step": 24300
},
{
"epoch": 243.25,
"learning_rate": 9.926582278481012e-06,
"loss": 0.0,
"step": 24325
},
{
"epoch": 243.5,
"learning_rate": 9.910759493670886e-06,
"loss": 0.0,
"step": 24350
},
{
"epoch": 243.75,
"learning_rate": 9.89493670886076e-06,
"loss": 0.0,
"step": 24375
},
{
"epoch": 244.0,
"learning_rate": 9.879113924050633e-06,
"loss": 0.0,
"step": 24400
},
{
"epoch": 244.25,
"learning_rate": 9.863291139240507e-06,
"loss": 0.0,
"step": 24425
},
{
"epoch": 244.5,
"learning_rate": 9.84746835443038e-06,
"loss": 0.0,
"step": 24450
},
{
"epoch": 244.75,
"learning_rate": 9.831645569620254e-06,
"loss": 0.0,
"step": 24475
},
{
"epoch": 245.0,
"learning_rate": 9.815822784810127e-06,
"loss": 0.0,
"step": 24500
},
{
"epoch": 245.25,
"learning_rate": 9.800000000000001e-06,
"loss": 0.0,
"step": 24525
},
{
"epoch": 245.5,
"learning_rate": 9.784177215189875e-06,
"loss": 0.0,
"step": 24550
},
{
"epoch": 245.75,
"learning_rate": 9.768354430379748e-06,
"loss": 0.0,
"step": 24575
},
{
"epoch": 246.0,
"learning_rate": 9.75253164556962e-06,
"loss": 0.0,
"step": 24600
},
{
"epoch": 246.25,
"learning_rate": 9.736708860759494e-06,
"loss": 0.0,
"step": 24625
},
{
"epoch": 246.5,
"learning_rate": 9.720886075949367e-06,
"loss": 0.0,
"step": 24650
},
{
"epoch": 246.75,
"learning_rate": 9.70506329113924e-06,
"loss": 0.0,
"step": 24675
},
{
"epoch": 247.0,
"learning_rate": 9.689240506329114e-06,
"loss": 0.0,
"step": 24700
},
{
"epoch": 247.25,
"learning_rate": 9.673417721518988e-06,
"loss": 0.0,
"step": 24725
},
{
"epoch": 247.5,
"learning_rate": 9.657594936708861e-06,
"loss": 0.0,
"step": 24750
},
{
"epoch": 247.75,
"learning_rate": 9.641772151898733e-06,
"loss": 0.0,
"step": 24775
},
{
"epoch": 248.0,
"learning_rate": 9.625949367088607e-06,
"loss": 0.0,
"step": 24800
},
{
"epoch": 248.25,
"learning_rate": 9.61012658227848e-06,
"loss": 0.0,
"step": 24825
},
{
"epoch": 248.5,
"learning_rate": 9.594303797468356e-06,
"loss": 0.0,
"step": 24850
},
{
"epoch": 248.75,
"learning_rate": 9.57848101265823e-06,
"loss": 0.0,
"step": 24875
},
{
"epoch": 249.0,
"learning_rate": 9.562658227848103e-06,
"loss": 0.0,
"step": 24900
},
{
"epoch": 249.25,
"learning_rate": 9.546835443037975e-06,
"loss": 0.0,
"step": 24925
},
{
"epoch": 249.5,
"learning_rate": 9.531012658227848e-06,
"loss": 0.0,
"step": 24950
},
{
"epoch": 249.75,
"learning_rate": 9.515189873417722e-06,
"loss": 0.0,
"step": 24975
},
{
"epoch": 250.0,
"learning_rate": 9.499367088607595e-06,
"loss": 0.0,
"step": 25000
},
{
"epoch": 250.0,
"eval_loss": 0.49457526206970215,
"eval_runtime": 159.1963,
"eval_samples_per_second": 80.04,
"eval_steps_per_second": 1.256,
"eval_wer": 16.191183367203376,
"step": 25000
},
{
"epoch": 250.25,
"learning_rate": 9.483544303797469e-06,
"loss": 0.0,
"step": 25025
},
{
"epoch": 250.5,
"learning_rate": 9.467721518987343e-06,
"loss": 0.0,
"step": 25050
},
{
"epoch": 250.75,
"learning_rate": 9.451898734177216e-06,
"loss": 0.0,
"step": 25075
},
{
"epoch": 251.0,
"learning_rate": 9.436075949367088e-06,
"loss": 0.0,
"step": 25100
},
{
"epoch": 251.25,
"learning_rate": 9.420253164556962e-06,
"loss": 0.0,
"step": 25125
},
{
"epoch": 251.5,
"learning_rate": 9.404430379746835e-06,
"loss": 0.0,
"step": 25150
},
{
"epoch": 251.75,
"learning_rate": 9.388607594936709e-06,
"loss": 0.0,
"step": 25175
},
{
"epoch": 252.0,
"learning_rate": 9.372784810126582e-06,
"loss": 0.0,
"step": 25200
},
{
"epoch": 252.25,
"learning_rate": 9.356962025316456e-06,
"loss": 0.0,
"step": 25225
},
{
"epoch": 252.5,
"learning_rate": 9.34113924050633e-06,
"loss": 0.0,
"step": 25250
},
{
"epoch": 252.75,
"learning_rate": 9.325316455696203e-06,
"loss": 0.0,
"step": 25275
},
{
"epoch": 253.0,
"learning_rate": 9.309493670886077e-06,
"loss": 0.0,
"step": 25300
},
{
"epoch": 253.25,
"learning_rate": 9.29367088607595e-06,
"loss": 0.0,
"step": 25325
},
{
"epoch": 253.5,
"learning_rate": 9.277848101265824e-06,
"loss": 0.0,
"step": 25350
},
{
"epoch": 253.75,
"learning_rate": 9.262025316455697e-06,
"loss": 0.0,
"step": 25375
},
{
"epoch": 254.0,
"learning_rate": 9.246202531645571e-06,
"loss": 0.0,
"step": 25400
},
{
"epoch": 254.25,
"learning_rate": 9.230379746835443e-06,
"loss": 0.0,
"step": 25425
},
{
"epoch": 254.5,
"learning_rate": 9.214556962025316e-06,
"loss": 0.0,
"step": 25450
},
{
"epoch": 254.75,
"learning_rate": 9.19873417721519e-06,
"loss": 0.0,
"step": 25475
},
{
"epoch": 255.0,
"learning_rate": 9.182911392405063e-06,
"loss": 0.0,
"step": 25500
},
{
"epoch": 255.25,
"learning_rate": 9.167088607594937e-06,
"loss": 0.0,
"step": 25525
},
{
"epoch": 255.5,
"learning_rate": 9.15126582278481e-06,
"loss": 0.0,
"step": 25550
},
{
"epoch": 255.75,
"learning_rate": 9.135443037974684e-06,
"loss": 0.0,
"step": 25575
},
{
"epoch": 256.0,
"learning_rate": 9.119620253164558e-06,
"loss": 0.0,
"step": 25600
},
{
"epoch": 256.25,
"learning_rate": 9.10379746835443e-06,
"loss": 0.0,
"step": 25625
},
{
"epoch": 256.5,
"learning_rate": 9.087974683544303e-06,
"loss": 0.0,
"step": 25650
},
{
"epoch": 256.75,
"learning_rate": 9.072151898734178e-06,
"loss": 0.0,
"step": 25675
},
{
"epoch": 257.0,
"learning_rate": 9.056329113924052e-06,
"loss": 0.0,
"step": 25700
},
{
"epoch": 257.25,
"learning_rate": 9.040506329113926e-06,
"loss": 0.0,
"step": 25725
},
{
"epoch": 257.5,
"learning_rate": 9.0246835443038e-06,
"loss": 0.0,
"step": 25750
},
{
"epoch": 257.75,
"learning_rate": 9.008860759493671e-06,
"loss": 0.0,
"step": 25775
},
{
"epoch": 258.0,
"learning_rate": 8.993037974683545e-06,
"loss": 0.0,
"step": 25800
},
{
"epoch": 258.25,
"learning_rate": 8.977215189873418e-06,
"loss": 0.0,
"step": 25825
},
{
"epoch": 258.5,
"learning_rate": 8.961392405063292e-06,
"loss": 0.0,
"step": 25850
},
{
"epoch": 258.75,
"learning_rate": 8.945569620253165e-06,
"loss": 0.0,
"step": 25875
},
{
"epoch": 259.0,
"learning_rate": 8.929746835443039e-06,
"loss": 0.0,
"step": 25900
},
{
"epoch": 259.25,
"learning_rate": 8.913924050632912e-06,
"loss": 0.0,
"step": 25925
},
{
"epoch": 259.5,
"learning_rate": 8.898101265822784e-06,
"loss": 0.0,
"step": 25950
},
{
"epoch": 259.75,
"learning_rate": 8.882278481012658e-06,
"loss": 0.0,
"step": 25975
},
{
"epoch": 260.0,
"learning_rate": 8.866455696202531e-06,
"loss": 0.0,
"step": 26000
},
{
"epoch": 260.0,
"eval_loss": 0.5037948489189148,
"eval_runtime": 159.0614,
"eval_samples_per_second": 80.107,
"eval_steps_per_second": 1.257,
"eval_wer": 16.17652806002814,
"step": 26000
},
{
"epoch": 260.25,
"learning_rate": 8.850632911392405e-06,
"loss": 0.0,
"step": 26025
},
{
"epoch": 260.5,
"learning_rate": 8.834810126582279e-06,
"loss": 0.0,
"step": 26050
},
{
"epoch": 260.75,
"learning_rate": 8.818987341772152e-06,
"loss": 0.0,
"step": 26075
},
{
"epoch": 261.0,
"learning_rate": 8.803164556962026e-06,
"loss": 0.0,
"step": 26100
},
{
"epoch": 261.25,
"learning_rate": 8.7873417721519e-06,
"loss": 0.0,
"step": 26125
},
{
"epoch": 261.5,
"learning_rate": 8.771518987341773e-06,
"loss": 0.0,
"step": 26150
},
{
"epoch": 261.75,
"learning_rate": 8.755696202531646e-06,
"loss": 0.0,
"step": 26175
},
{
"epoch": 262.0,
"learning_rate": 8.73987341772152e-06,
"loss": 0.0,
"step": 26200
},
{
"epoch": 262.25,
"learning_rate": 8.724050632911394e-06,
"loss": 0.0,
"step": 26225
},
{
"epoch": 262.5,
"learning_rate": 8.708227848101267e-06,
"loss": 0.0,
"step": 26250
},
{
"epoch": 262.75,
"learning_rate": 8.692405063291139e-06,
"loss": 0.0,
"step": 26275
},
{
"epoch": 263.0,
"learning_rate": 8.676582278481013e-06,
"loss": 0.0,
"step": 26300
},
{
"epoch": 263.25,
"learning_rate": 8.660759493670886e-06,
"loss": 0.0,
"step": 26325
},
{
"epoch": 263.5,
"learning_rate": 8.64493670886076e-06,
"loss": 0.0,
"step": 26350
},
{
"epoch": 263.75,
"learning_rate": 8.629113924050633e-06,
"loss": 0.0,
"step": 26375
},
{
"epoch": 264.0,
"learning_rate": 8.613291139240507e-06,
"loss": 0.0,
"step": 26400
},
{
"epoch": 264.25,
"learning_rate": 8.59746835443038e-06,
"loss": 0.0,
"step": 26425
},
{
"epoch": 264.5,
"learning_rate": 8.581645569620252e-06,
"loss": 0.0,
"step": 26450
},
{
"epoch": 264.75,
"learning_rate": 8.565822784810126e-06,
"loss": 0.0,
"step": 26475
},
{
"epoch": 265.0,
"learning_rate": 8.550000000000001e-06,
"loss": 0.0,
"step": 26500
},
{
"epoch": 265.25,
"learning_rate": 8.534177215189875e-06,
"loss": 0.0,
"step": 26525
},
{
"epoch": 265.5,
"learning_rate": 8.518354430379748e-06,
"loss": 0.0,
"step": 26550
},
{
"epoch": 265.75,
"learning_rate": 8.502531645569622e-06,
"loss": 0.0,
"step": 26575
},
{
"epoch": 266.0,
"learning_rate": 8.486708860759494e-06,
"loss": 0.0,
"step": 26600
},
{
"epoch": 266.25,
"learning_rate": 8.470886075949367e-06,
"loss": 0.0,
"step": 26625
},
{
"epoch": 266.5,
"learning_rate": 8.455063291139241e-06,
"loss": 0.0,
"step": 26650
},
{
"epoch": 266.75,
"learning_rate": 8.439240506329114e-06,
"loss": 0.0,
"step": 26675
},
{
"epoch": 267.0,
"learning_rate": 8.423417721518988e-06,
"loss": 0.0,
"step": 26700
},
{
"epoch": 267.25,
"learning_rate": 8.407594936708862e-06,
"loss": 0.0,
"step": 26725
},
{
"epoch": 267.5,
"learning_rate": 8.391772151898735e-06,
"loss": 0.0,
"step": 26750
},
{
"epoch": 267.75,
"learning_rate": 8.375949367088607e-06,
"loss": 0.0,
"step": 26775
},
{
"epoch": 268.0,
"learning_rate": 8.36012658227848e-06,
"loss": 0.0,
"step": 26800
},
{
"epoch": 268.25,
"learning_rate": 8.344303797468354e-06,
"loss": 0.0,
"step": 26825
},
{
"epoch": 268.5,
"learning_rate": 8.328481012658228e-06,
"loss": 0.0,
"step": 26850
},
{
"epoch": 268.75,
"learning_rate": 8.312658227848101e-06,
"loss": 0.0,
"step": 26875
},
{
"epoch": 269.0,
"learning_rate": 8.296835443037977e-06,
"loss": 0.0,
"step": 26900
},
{
"epoch": 269.25,
"learning_rate": 8.281012658227848e-06,
"loss": 0.0,
"step": 26925
},
{
"epoch": 269.5,
"learning_rate": 8.265189873417722e-06,
"loss": 0.0,
"step": 26950
},
{
"epoch": 269.75,
"learning_rate": 8.249367088607596e-06,
"loss": 0.0,
"step": 26975
},
{
"epoch": 270.0,
"learning_rate": 8.233544303797469e-06,
"loss": 0.0,
"step": 27000
},
{
"epoch": 270.0,
"eval_loss": 0.5133084654808044,
"eval_runtime": 159.394,
"eval_samples_per_second": 79.94,
"eval_steps_per_second": 1.255,
"eval_wer": 16.221471002032203,
"step": 27000
},
{
"epoch": 270.25,
"learning_rate": 8.217721518987343e-06,
"loss": 0.0,
"step": 27025
},
{
"epoch": 270.5,
"learning_rate": 8.201898734177216e-06,
"loss": 0.0,
"step": 27050
},
{
"epoch": 270.75,
"learning_rate": 8.18607594936709e-06,
"loss": 0.0,
"step": 27075
},
{
"epoch": 271.0,
"learning_rate": 8.170253164556962e-06,
"loss": 0.0,
"step": 27100
},
{
"epoch": 271.25,
"learning_rate": 8.154430379746835e-06,
"loss": 0.0,
"step": 27125
},
{
"epoch": 271.5,
"learning_rate": 8.138607594936709e-06,
"loss": 0.0,
"step": 27150
},
{
"epoch": 271.75,
"learning_rate": 8.122784810126582e-06,
"loss": 0.0,
"step": 27175
},
{
"epoch": 272.0,
"learning_rate": 8.106962025316456e-06,
"loss": 0.0,
"step": 27200
},
{
"epoch": 272.25,
"learning_rate": 8.09113924050633e-06,
"loss": 0.0,
"step": 27225
},
{
"epoch": 272.5,
"learning_rate": 8.075316455696203e-06,
"loss": 0.0,
"step": 27250
},
{
"epoch": 272.75,
"learning_rate": 8.059493670886075e-06,
"loss": 0.0,
"step": 27275
},
{
"epoch": 273.0,
"learning_rate": 8.043670886075949e-06,
"loss": 0.0,
"step": 27300
},
{
"epoch": 273.25,
"learning_rate": 8.027848101265824e-06,
"loss": 0.0,
"step": 27325
},
{
"epoch": 273.5,
"learning_rate": 8.012025316455697e-06,
"loss": 0.0,
"step": 27350
},
{
"epoch": 273.75,
"learning_rate": 7.996202531645571e-06,
"loss": 0.0,
"step": 27375
},
{
"epoch": 274.0,
"learning_rate": 7.980379746835445e-06,
"loss": 0.0,
"step": 27400
},
{
"epoch": 274.25,
"learning_rate": 7.964556962025316e-06,
"loss": 0.0,
"step": 27425
},
{
"epoch": 274.5,
"learning_rate": 7.94873417721519e-06,
"loss": 0.0,
"step": 27450
},
{
"epoch": 274.75,
"learning_rate": 7.932911392405064e-06,
"loss": 0.0,
"step": 27475
},
{
"epoch": 275.0,
"learning_rate": 7.917088607594937e-06,
"loss": 0.0,
"step": 27500
},
{
"epoch": 275.25,
"learning_rate": 7.90126582278481e-06,
"loss": 0.0,
"step": 27525
},
{
"epoch": 275.5,
"learning_rate": 7.885443037974684e-06,
"loss": 0.0,
"step": 27550
},
{
"epoch": 275.75,
"learning_rate": 7.869620253164558e-06,
"loss": 0.0,
"step": 27575
},
{
"epoch": 276.0,
"learning_rate": 7.85379746835443e-06,
"loss": 0.0,
"step": 27600
},
{
"epoch": 276.25,
"learning_rate": 7.837974683544303e-06,
"loss": 0.0,
"step": 27625
},
{
"epoch": 276.5,
"learning_rate": 7.822151898734177e-06,
"loss": 0.0,
"step": 27650
},
{
"epoch": 276.75,
"learning_rate": 7.80632911392405e-06,
"loss": 0.0,
"step": 27675
},
{
"epoch": 277.0,
"learning_rate": 7.790506329113924e-06,
"loss": 0.0,
"step": 27700
},
{
"epoch": 277.25,
"learning_rate": 7.7746835443038e-06,
"loss": 0.0,
"step": 27725
},
{
"epoch": 277.5,
"learning_rate": 7.758860759493671e-06,
"loss": 0.0,
"step": 27750
},
{
"epoch": 277.75,
"learning_rate": 7.743037974683545e-06,
"loss": 0.0,
"step": 27775
},
{
"epoch": 278.0,
"learning_rate": 7.727215189873418e-06,
"loss": 0.0,
"step": 27800
},
{
"epoch": 278.25,
"learning_rate": 7.711392405063292e-06,
"loss": 0.0,
"step": 27825
},
{
"epoch": 278.5,
"learning_rate": 7.695569620253165e-06,
"loss": 0.0,
"step": 27850
},
{
"epoch": 278.75,
"learning_rate": 7.679746835443039e-06,
"loss": 0.0,
"step": 27875
},
{
"epoch": 279.0,
"learning_rate": 7.663924050632913e-06,
"loss": 0.0,
"step": 27900
},
{
"epoch": 279.25,
"learning_rate": 7.648101265822784e-06,
"loss": 0.0,
"step": 27925
},
{
"epoch": 279.5,
"learning_rate": 7.632278481012658e-06,
"loss": 0.0,
"step": 27950
},
{
"epoch": 279.75,
"learning_rate": 7.6164556962025316e-06,
"loss": 0.0,
"step": 27975
},
{
"epoch": 280.0,
"learning_rate": 7.600632911392405e-06,
"loss": 0.0,
"step": 28000
},
{
"epoch": 280.0,
"eval_loss": 0.5228456258773804,
"eval_runtime": 158.9726,
"eval_samples_per_second": 80.152,
"eval_steps_per_second": 1.258,
"eval_wer": 16.22244802251055,
"step": 28000
},
{
"epoch": 280.25,
"learning_rate": 7.584810126582279e-06,
"loss": 0.0,
"step": 28025
},
{
"epoch": 280.5,
"learning_rate": 7.568987341772152e-06,
"loss": 0.0,
"step": 28050
},
{
"epoch": 280.75,
"learning_rate": 7.553164556962025e-06,
"loss": 0.0,
"step": 28075
},
{
"epoch": 281.0,
"learning_rate": 7.5373417721518986e-06,
"loss": 0.0,
"step": 28100
},
{
"epoch": 281.25,
"learning_rate": 7.521518987341772e-06,
"loss": 0.0,
"step": 28125
},
{
"epoch": 281.5,
"learning_rate": 7.5056962025316466e-06,
"loss": 0.0,
"step": 28150
},
{
"epoch": 281.75,
"learning_rate": 7.48987341772152e-06,
"loss": 0.0,
"step": 28175
},
{
"epoch": 282.0,
"learning_rate": 7.474050632911393e-06,
"loss": 0.0,
"step": 28200
},
{
"epoch": 282.25,
"learning_rate": 7.458227848101266e-06,
"loss": 0.0,
"step": 28225
},
{
"epoch": 282.5,
"learning_rate": 7.44240506329114e-06,
"loss": 0.0,
"step": 28250
},
{
"epoch": 282.75,
"learning_rate": 7.4265822784810136e-06,
"loss": 0.0,
"step": 28275
},
{
"epoch": 283.0,
"learning_rate": 7.410759493670886e-06,
"loss": 0.0,
"step": 28300
},
{
"epoch": 283.25,
"learning_rate": 7.39493670886076e-06,
"loss": 0.0,
"step": 28325
},
{
"epoch": 283.5,
"learning_rate": 7.379113924050633e-06,
"loss": 0.0,
"step": 28350
},
{
"epoch": 283.75,
"learning_rate": 7.363291139240507e-06,
"loss": 0.0,
"step": 28375
},
{
"epoch": 284.0,
"learning_rate": 7.34746835443038e-06,
"loss": 0.0,
"step": 28400
},
{
"epoch": 284.25,
"learning_rate": 7.331645569620253e-06,
"loss": 0.0,
"step": 28425
},
{
"epoch": 284.5,
"learning_rate": 7.315822784810127e-06,
"loss": 0.0,
"step": 28450
},
{
"epoch": 284.75,
"learning_rate": 7.2999999999999996e-06,
"loss": 0.0,
"step": 28475
},
{
"epoch": 285.0,
"learning_rate": 7.284177215189873e-06,
"loss": 0.0,
"step": 28500
},
{
"epoch": 285.25,
"learning_rate": 7.268354430379747e-06,
"loss": 0.0,
"step": 28525
},
{
"epoch": 285.5,
"learning_rate": 7.252531645569621e-06,
"loss": 0.0,
"step": 28550
},
{
"epoch": 285.75,
"learning_rate": 7.236708860759495e-06,
"loss": 0.0,
"step": 28575
},
{
"epoch": 286.0,
"learning_rate": 7.220886075949368e-06,
"loss": 0.0,
"step": 28600
},
{
"epoch": 286.25,
"learning_rate": 7.205063291139241e-06,
"loss": 0.0,
"step": 28625
},
{
"epoch": 286.5,
"learning_rate": 7.1892405063291145e-06,
"loss": 0.0,
"step": 28650
},
{
"epoch": 286.75,
"learning_rate": 7.173417721518988e-06,
"loss": 0.0,
"step": 28675
},
{
"epoch": 287.0,
"learning_rate": 7.157594936708862e-06,
"loss": 0.0,
"step": 28700
},
{
"epoch": 287.25,
"learning_rate": 7.141772151898734e-06,
"loss": 0.0,
"step": 28725
},
{
"epoch": 287.5,
"learning_rate": 7.125949367088608e-06,
"loss": 0.0,
"step": 28750
},
{
"epoch": 287.75,
"learning_rate": 7.1101265822784815e-06,
"loss": 0.0,
"step": 28775
},
{
"epoch": 288.0,
"learning_rate": 7.094303797468354e-06,
"loss": 0.0,
"step": 28800
},
{
"epoch": 288.25,
"learning_rate": 7.078481012658228e-06,
"loss": 0.0,
"step": 28825
},
{
"epoch": 288.5,
"learning_rate": 7.062658227848101e-06,
"loss": 0.0,
"step": 28850
},
{
"epoch": 288.75,
"learning_rate": 7.046835443037975e-06,
"loss": 0.0,
"step": 28875
},
{
"epoch": 289.0,
"learning_rate": 7.031012658227848e-06,
"loss": 0.0,
"step": 28900
},
{
"epoch": 289.25,
"learning_rate": 7.015189873417721e-06,
"loss": 0.0,
"step": 28925
},
{
"epoch": 289.5,
"learning_rate": 6.999367088607595e-06,
"loss": 0.0,
"step": 28950
},
{
"epoch": 289.75,
"learning_rate": 6.983544303797469e-06,
"loss": 0.0,
"step": 28975
},
{
"epoch": 290.0,
"learning_rate": 6.967721518987343e-06,
"loss": 0.0,
"step": 29000
},
{
"epoch": 290.0,
"eval_loss": 0.5326051712036133,
"eval_runtime": 158.9966,
"eval_samples_per_second": 80.14,
"eval_steps_per_second": 1.258,
"eval_wer": 16.255666718774425,
"step": 29000
},
{
"epoch": 290.25,
"learning_rate": 6.951898734177216e-06,
"loss": 0.0,
"step": 29025
},
{
"epoch": 290.5,
"learning_rate": 6.936075949367089e-06,
"loss": 0.0,
"step": 29050
},
{
"epoch": 290.75,
"learning_rate": 6.920253164556963e-06,
"loss": 0.0,
"step": 29075
},
{
"epoch": 291.0,
"learning_rate": 6.904430379746836e-06,
"loss": 0.0,
"step": 29100
},
{
"epoch": 291.25,
"learning_rate": 6.888607594936709e-06,
"loss": 0.0,
"step": 29125
},
{
"epoch": 291.5,
"learning_rate": 6.8727848101265825e-06,
"loss": 0.0,
"step": 29150
},
{
"epoch": 291.75,
"learning_rate": 6.856962025316456e-06,
"loss": 0.0,
"step": 29175
},
{
"epoch": 292.0,
"learning_rate": 6.84113924050633e-06,
"loss": 0.0,
"step": 29200
},
{
"epoch": 292.25,
"learning_rate": 6.825316455696202e-06,
"loss": 0.0,
"step": 29225
},
{
"epoch": 292.5,
"learning_rate": 6.809493670886076e-06,
"loss": 0.0,
"step": 29250
},
{
"epoch": 292.75,
"learning_rate": 6.7936708860759495e-06,
"loss": 0.0,
"step": 29275
},
{
"epoch": 293.0,
"learning_rate": 6.777848101265822e-06,
"loss": 0.0,
"step": 29300
},
{
"epoch": 293.25,
"learning_rate": 6.762025316455696e-06,
"loss": 0.0,
"step": 29325
},
{
"epoch": 293.5,
"learning_rate": 6.746202531645569e-06,
"loss": 0.0,
"step": 29350
},
{
"epoch": 293.75,
"learning_rate": 6.730379746835444e-06,
"loss": 0.0,
"step": 29375
},
{
"epoch": 294.0,
"learning_rate": 6.714556962025317e-06,
"loss": 0.0,
"step": 29400
},
{
"epoch": 294.25,
"learning_rate": 6.698734177215191e-06,
"loss": 0.0,
"step": 29425
},
{
"epoch": 294.5,
"learning_rate": 6.682911392405064e-06,
"loss": 0.0,
"step": 29450
},
{
"epoch": 294.75,
"learning_rate": 6.667088607594937e-06,
"loss": 0.0,
"step": 29475
},
{
"epoch": 295.0,
"learning_rate": 6.651265822784811e-06,
"loss": 0.0,
"step": 29500
},
{
"epoch": 295.25,
"learning_rate": 6.635443037974684e-06,
"loss": 0.0,
"step": 29525
},
{
"epoch": 295.5,
"learning_rate": 6.619620253164557e-06,
"loss": 0.0,
"step": 29550
},
{
"epoch": 295.75,
"learning_rate": 6.603797468354431e-06,
"loss": 0.0,
"step": 29575
},
{
"epoch": 296.0,
"learning_rate": 6.587974683544304e-06,
"loss": 0.0,
"step": 29600
},
{
"epoch": 296.25,
"learning_rate": 6.572151898734177e-06,
"loss": 0.0,
"step": 29625
},
{
"epoch": 296.5,
"learning_rate": 6.5563291139240505e-06,
"loss": 0.0,
"step": 29650
},
{
"epoch": 296.75,
"learning_rate": 6.540506329113924e-06,
"loss": 0.0,
"step": 29675
},
{
"epoch": 297.0,
"learning_rate": 6.524683544303798e-06,
"loss": 0.0,
"step": 29700
},
{
"epoch": 297.25,
"learning_rate": 6.50886075949367e-06,
"loss": 0.0,
"step": 29725
},
{
"epoch": 297.5,
"learning_rate": 6.493037974683544e-06,
"loss": 0.0,
"step": 29750
},
{
"epoch": 297.75,
"learning_rate": 6.4772151898734175e-06,
"loss": 0.0,
"step": 29775
},
{
"epoch": 298.0,
"learning_rate": 6.461392405063292e-06,
"loss": 0.0,
"step": 29800
},
{
"epoch": 298.25,
"learning_rate": 6.4455696202531655e-06,
"loss": 0.0,
"step": 29825
},
{
"epoch": 298.5,
"learning_rate": 6.429746835443039e-06,
"loss": 0.0,
"step": 29850
},
{
"epoch": 298.75,
"learning_rate": 6.413924050632912e-06,
"loss": 0.0,
"step": 29875
},
{
"epoch": 299.0,
"learning_rate": 6.398101265822785e-06,
"loss": 0.0,
"step": 29900
},
{
"epoch": 299.25,
"learning_rate": 6.382278481012659e-06,
"loss": 0.0,
"step": 29925
},
{
"epoch": 299.5,
"learning_rate": 6.366455696202532e-06,
"loss": 0.0,
"step": 29950
},
{
"epoch": 299.75,
"learning_rate": 6.350632911392405e-06,
"loss": 0.0,
"step": 29975
},
{
"epoch": 300.0,
"learning_rate": 6.334810126582279e-06,
"loss": 0.0,
"step": 30000
},
{
"epoch": 300.0,
"eval_loss": 0.5426864624023438,
"eval_runtime": 157.5522,
"eval_samples_per_second": 80.875,
"eval_steps_per_second": 1.269,
"eval_wer": 16.241988432077537,
"step": 30000
},
{
"epoch": 300.25,
"learning_rate": 6.318987341772152e-06,
"loss": 0.0,
"step": 30025
},
{
"epoch": 300.5,
"learning_rate": 6.303164556962025e-06,
"loss": 0.0,
"step": 30050
},
{
"epoch": 300.75,
"learning_rate": 6.287341772151899e-06,
"loss": 0.0,
"step": 30075
},
{
"epoch": 301.0,
"learning_rate": 6.271518987341772e-06,
"loss": 0.0,
"step": 30100
},
{
"epoch": 301.25,
"learning_rate": 6.255696202531646e-06,
"loss": 0.0,
"step": 30125
},
{
"epoch": 301.5,
"learning_rate": 6.239873417721519e-06,
"loss": 0.0,
"step": 30150
},
{
"epoch": 301.75,
"learning_rate": 6.224050632911393e-06,
"loss": 0.0,
"step": 30175
},
{
"epoch": 302.0,
"learning_rate": 6.208227848101266e-06,
"loss": 0.0,
"step": 30200
},
{
"epoch": 302.25,
"learning_rate": 6.192405063291139e-06,
"loss": 0.0,
"step": 30225
},
{
"epoch": 302.5,
"learning_rate": 6.176582278481013e-06,
"loss": 0.0,
"step": 30250
},
{
"epoch": 302.75,
"learning_rate": 6.160759493670886e-06,
"loss": 0.0,
"step": 30275
},
{
"epoch": 303.0,
"learning_rate": 6.14493670886076e-06,
"loss": 0.0,
"step": 30300
},
{
"epoch": 303.25,
"learning_rate": 6.1291139240506335e-06,
"loss": 0.0,
"step": 30325
},
{
"epoch": 303.5,
"learning_rate": 6.113924050632912e-06,
"loss": 0.0,
"step": 30350
},
{
"epoch": 303.75,
"learning_rate": 6.098101265822785e-06,
"loss": 0.0,
"step": 30375
},
{
"epoch": 304.0,
"learning_rate": 6.0822784810126584e-06,
"loss": 0.0,
"step": 30400
},
{
"epoch": 304.25,
"learning_rate": 6.066455696202532e-06,
"loss": 0.0,
"step": 30425
},
{
"epoch": 304.5,
"learning_rate": 6.050632911392405e-06,
"loss": 0.0,
"step": 30450
},
{
"epoch": 304.75,
"learning_rate": 6.034810126582278e-06,
"loss": 0.0,
"step": 30475
},
{
"epoch": 305.0,
"learning_rate": 6.018987341772153e-06,
"loss": 0.0,
"step": 30500
},
{
"epoch": 305.25,
"learning_rate": 6.0031645569620254e-06,
"loss": 0.0,
"step": 30525
},
{
"epoch": 305.5,
"learning_rate": 5.987341772151899e-06,
"loss": 0.0,
"step": 30550
},
{
"epoch": 305.75,
"learning_rate": 5.971518987341773e-06,
"loss": 0.0,
"step": 30575
},
{
"epoch": 306.0,
"learning_rate": 5.955696202531646e-06,
"loss": 0.0,
"step": 30600
},
{
"epoch": 306.25,
"learning_rate": 5.939873417721519e-06,
"loss": 0.0,
"step": 30625
},
{
"epoch": 306.5,
"learning_rate": 5.9240506329113924e-06,
"loss": 0.0,
"step": 30650
},
{
"epoch": 306.75,
"learning_rate": 5.908227848101266e-06,
"loss": 0.0,
"step": 30675
},
{
"epoch": 307.0,
"learning_rate": 5.8924050632911396e-06,
"loss": 0.0,
"step": 30700
},
{
"epoch": 307.25,
"learning_rate": 5.876582278481013e-06,
"loss": 0.0,
"step": 30725
},
{
"epoch": 307.5,
"learning_rate": 5.860759493670887e-06,
"loss": 0.0,
"step": 30750
},
{
"epoch": 307.75,
"learning_rate": 5.8449367088607594e-06,
"loss": 0.0,
"step": 30775
},
{
"epoch": 308.0,
"learning_rate": 5.829113924050633e-06,
"loss": 0.0,
"step": 30800
},
{
"epoch": 308.25,
"learning_rate": 5.8132911392405066e-06,
"loss": 0.0,
"step": 30825
},
{
"epoch": 308.5,
"learning_rate": 5.79746835443038e-06,
"loss": 0.0,
"step": 30850
},
{
"epoch": 308.75,
"learning_rate": 5.781645569620253e-06,
"loss": 0.0,
"step": 30875
},
{
"epoch": 309.0,
"learning_rate": 5.765822784810127e-06,
"loss": 0.0,
"step": 30900
},
{
"epoch": 309.25,
"learning_rate": 5.750000000000001e-06,
"loss": 0.0,
"step": 30925
},
{
"epoch": 309.5,
"learning_rate": 5.7341772151898736e-06,
"loss": 0.0,
"step": 30950
},
{
"epoch": 309.75,
"learning_rate": 5.718354430379747e-06,
"loss": 0.0,
"step": 30975
},
{
"epoch": 310.0,
"learning_rate": 5.702531645569621e-06,
"loss": 0.0,
"step": 31000
},
{
"epoch": 310.0,
"eval_loss": 0.5525209307670593,
"eval_runtime": 158.5191,
"eval_samples_per_second": 80.382,
"eval_steps_per_second": 1.262,
"eval_wer": 16.263482882601217,
"step": 31000
},
{
"epoch": 310.25,
"learning_rate": 5.6867088607594934e-06,
"loss": 0.0,
"step": 31025
},
{
"epoch": 310.5,
"learning_rate": 5.670886075949367e-06,
"loss": 0.0,
"step": 31050
},
{
"epoch": 310.75,
"learning_rate": 5.6550632911392406e-06,
"loss": 0.0,
"step": 31075
},
{
"epoch": 311.0,
"learning_rate": 5.639240506329114e-06,
"loss": 0.0,
"step": 31100
},
{
"epoch": 311.25,
"learning_rate": 5.623417721518988e-06,
"loss": 0.0,
"step": 31125
},
{
"epoch": 311.5,
"learning_rate": 5.607594936708861e-06,
"loss": 0.0,
"step": 31150
},
{
"epoch": 311.75,
"learning_rate": 5.591772151898735e-06,
"loss": 0.0,
"step": 31175
},
{
"epoch": 312.0,
"learning_rate": 5.5759493670886076e-06,
"loss": 0.0,
"step": 31200
},
{
"epoch": 312.25,
"learning_rate": 5.560126582278481e-06,
"loss": 0.0,
"step": 31225
},
{
"epoch": 312.5,
"learning_rate": 5.544303797468355e-06,
"loss": 0.0,
"step": 31250
},
{
"epoch": 312.75,
"learning_rate": 5.528481012658228e-06,
"loss": 0.0,
"step": 31275
},
{
"epoch": 313.0,
"learning_rate": 5.512658227848101e-06,
"loss": 0.0,
"step": 31300
},
{
"epoch": 313.25,
"learning_rate": 5.496835443037975e-06,
"loss": 0.0,
"step": 31325
},
{
"epoch": 313.5,
"learning_rate": 5.481012658227849e-06,
"loss": 0.0,
"step": 31350
},
{
"epoch": 313.75,
"learning_rate": 5.465189873417722e-06,
"loss": 0.0,
"step": 31375
},
{
"epoch": 314.0,
"learning_rate": 5.449367088607595e-06,
"loss": 0.0,
"step": 31400
},
{
"epoch": 314.25,
"learning_rate": 5.433544303797469e-06,
"loss": 0.0,
"step": 31425
},
{
"epoch": 314.5,
"learning_rate": 5.4177215189873416e-06,
"loss": 0.0,
"step": 31450
},
{
"epoch": 314.75,
"learning_rate": 5.401898734177215e-06,
"loss": 0.0,
"step": 31475
},
{
"epoch": 315.0,
"learning_rate": 5.386075949367089e-06,
"loss": 0.0,
"step": 31500
},
{
"epoch": 315.25,
"learning_rate": 5.370253164556962e-06,
"loss": 0.0,
"step": 31525
},
{
"epoch": 315.5,
"learning_rate": 5.354430379746836e-06,
"loss": 0.0,
"step": 31550
},
{
"epoch": 315.75,
"learning_rate": 5.338607594936709e-06,
"loss": 0.0,
"step": 31575
},
{
"epoch": 316.0,
"learning_rate": 5.322784810126583e-06,
"loss": 0.0,
"step": 31600
},
{
"epoch": 316.25,
"learning_rate": 5.306962025316456e-06,
"loss": 0.0,
"step": 31625
},
{
"epoch": 316.5,
"learning_rate": 5.291139240506329e-06,
"loss": 0.0,
"step": 31650
},
{
"epoch": 316.75,
"learning_rate": 5.275316455696203e-06,
"loss": 0.0,
"step": 31675
},
{
"epoch": 317.0,
"learning_rate": 5.2594936708860756e-06,
"loss": 0.0,
"step": 31700
},
{
"epoch": 317.25,
"learning_rate": 5.24367088607595e-06,
"loss": 0.0,
"step": 31725
},
{
"epoch": 317.5,
"learning_rate": 5.2278481012658236e-06,
"loss": 0.0,
"step": 31750
},
{
"epoch": 317.75,
"learning_rate": 5.212025316455696e-06,
"loss": 0.0,
"step": 31775
},
{
"epoch": 318.0,
"learning_rate": 5.19620253164557e-06,
"loss": 0.0,
"step": 31800
},
{
"epoch": 318.25,
"learning_rate": 5.180379746835443e-06,
"loss": 0.0,
"step": 31825
},
{
"epoch": 318.5,
"learning_rate": 5.164556962025317e-06,
"loss": 0.0,
"step": 31850
},
{
"epoch": 318.75,
"learning_rate": 5.14873417721519e-06,
"loss": 0.0,
"step": 31875
},
{
"epoch": 319.0,
"learning_rate": 5.132911392405063e-06,
"loss": 0.0,
"step": 31900
},
{
"epoch": 319.25,
"learning_rate": 5.117088607594938e-06,
"loss": 0.0,
"step": 31925
},
{
"epoch": 319.5,
"learning_rate": 5.10126582278481e-06,
"loss": 0.0,
"step": 31950
},
{
"epoch": 319.75,
"learning_rate": 5.085443037974684e-06,
"loss": 0.0,
"step": 31975
},
{
"epoch": 320.0,
"learning_rate": 5.0696202531645576e-06,
"loss": 0.0,
"step": 32000
},
{
"epoch": 320.0,
"eval_loss": 0.5624327659606934,
"eval_runtime": 158.6013,
"eval_samples_per_second": 80.34,
"eval_steps_per_second": 1.261,
"eval_wer": 16.29572455838674,
"step": 32000
},
{
"epoch": 320.25,
"learning_rate": 5.05379746835443e-06,
"loss": 0.0,
"step": 32025
},
{
"epoch": 320.5,
"learning_rate": 5.037974683544304e-06,
"loss": 0.0,
"step": 32050
},
{
"epoch": 320.75,
"learning_rate": 5.022151898734177e-06,
"loss": 0.0,
"step": 32075
},
{
"epoch": 321.0,
"learning_rate": 5.006329113924051e-06,
"loss": 0.0,
"step": 32100
},
{
"epoch": 321.25,
"learning_rate": 4.990506329113924e-06,
"loss": 0.0,
"step": 32125
},
{
"epoch": 321.5,
"learning_rate": 4.974683544303798e-06,
"loss": 0.0,
"step": 32150
},
{
"epoch": 321.75,
"learning_rate": 4.958860759493672e-06,
"loss": 0.0,
"step": 32175
},
{
"epoch": 322.0,
"learning_rate": 4.943037974683544e-06,
"loss": 0.0,
"step": 32200
},
{
"epoch": 322.25,
"learning_rate": 4.927215189873418e-06,
"loss": 0.0,
"step": 32225
},
{
"epoch": 322.5,
"learning_rate": 4.9113924050632915e-06,
"loss": 0.0,
"step": 32250
},
{
"epoch": 322.75,
"learning_rate": 4.895569620253164e-06,
"loss": 0.0,
"step": 32275
},
{
"epoch": 323.0,
"learning_rate": 4.879746835443038e-06,
"loss": 0.0,
"step": 32300
},
{
"epoch": 323.25,
"learning_rate": 4.863924050632911e-06,
"loss": 0.0,
"step": 32325
},
{
"epoch": 323.5,
"learning_rate": 4.848101265822785e-06,
"loss": 0.0,
"step": 32350
},
{
"epoch": 323.75,
"learning_rate": 4.8322784810126585e-06,
"loss": 0.0,
"step": 32375
},
{
"epoch": 324.0,
"learning_rate": 4.816455696202532e-06,
"loss": 0.0,
"step": 32400
},
{
"epoch": 324.25,
"learning_rate": 4.800632911392406e-06,
"loss": 0.0,
"step": 32425
},
{
"epoch": 324.5,
"learning_rate": 4.784810126582278e-06,
"loss": 0.0,
"step": 32450
},
{
"epoch": 324.75,
"learning_rate": 4.768987341772152e-06,
"loss": 0.0,
"step": 32475
},
{
"epoch": 325.0,
"learning_rate": 4.7531645569620255e-06,
"loss": 0.0,
"step": 32500
},
{
"epoch": 325.25,
"learning_rate": 4.737341772151898e-06,
"loss": 0.0,
"step": 32525
},
{
"epoch": 325.5,
"learning_rate": 4.721518987341773e-06,
"loss": 0.0,
"step": 32550
},
{
"epoch": 325.75,
"learning_rate": 4.705696202531646e-06,
"loss": 0.0,
"step": 32575
},
{
"epoch": 326.0,
"learning_rate": 4.689873417721519e-06,
"loss": 0.0,
"step": 32600
},
{
"epoch": 326.25,
"learning_rate": 4.6740506329113925e-06,
"loss": 0.0,
"step": 32625
},
{
"epoch": 326.5,
"learning_rate": 4.658227848101266e-06,
"loss": 0.0,
"step": 32650
},
{
"epoch": 326.75,
"learning_rate": 4.64240506329114e-06,
"loss": 0.0,
"step": 32675
},
{
"epoch": 327.0,
"learning_rate": 4.626582278481012e-06,
"loss": 0.0,
"step": 32700
},
{
"epoch": 327.25,
"learning_rate": 4.610759493670886e-06,
"loss": 0.0,
"step": 32725
},
{
"epoch": 327.5,
"learning_rate": 4.59493670886076e-06,
"loss": 0.0,
"step": 32750
},
{
"epoch": 327.75,
"learning_rate": 4.579113924050633e-06,
"loss": 0.0,
"step": 32775
},
{
"epoch": 328.0,
"learning_rate": 4.563291139240507e-06,
"loss": 0.0,
"step": 32800
},
{
"epoch": 328.25,
"learning_rate": 4.54746835443038e-06,
"loss": 0.0,
"step": 32825
},
{
"epoch": 328.5,
"learning_rate": 4.531645569620253e-06,
"loss": 0.0,
"step": 32850
},
{
"epoch": 328.75,
"learning_rate": 4.5158227848101265e-06,
"loss": 0.0,
"step": 32875
},
{
"epoch": 329.0,
"learning_rate": 4.5e-06,
"loss": 0.0,
"step": 32900
},
{
"epoch": 329.25,
"learning_rate": 4.484177215189874e-06,
"loss": 0.0,
"step": 32925
},
{
"epoch": 329.5,
"learning_rate": 4.468354430379746e-06,
"loss": 0.0,
"step": 32950
},
{
"epoch": 329.75,
"learning_rate": 4.452531645569621e-06,
"loss": 0.0,
"step": 32975
},
{
"epoch": 330.0,
"learning_rate": 4.436708860759494e-06,
"loss": 0.0,
"step": 33000
},
{
"epoch": 330.0,
"eval_loss": 0.5705838203430176,
"eval_runtime": 157.8203,
"eval_samples_per_second": 80.737,
"eval_steps_per_second": 1.267,
"eval_wer": 16.329920275128966,
"step": 33000
},
{
"epoch": 330.25,
"learning_rate": 4.420886075949367e-06,
"loss": 0.0,
"step": 33025
},
{
"epoch": 330.5,
"learning_rate": 4.405063291139241e-06,
"loss": 0.0,
"step": 33050
},
{
"epoch": 330.75,
"learning_rate": 4.389240506329114e-06,
"loss": 0.0,
"step": 33075
},
{
"epoch": 331.0,
"learning_rate": 4.373417721518988e-06,
"loss": 0.0,
"step": 33100
},
{
"epoch": 331.25,
"learning_rate": 4.3575949367088605e-06,
"loss": 0.0,
"step": 33125
},
{
"epoch": 331.5,
"learning_rate": 4.341772151898734e-06,
"loss": 0.0,
"step": 33150
},
{
"epoch": 331.75,
"learning_rate": 4.325949367088608e-06,
"loss": 0.0,
"step": 33175
},
{
"epoch": 332.0,
"learning_rate": 4.310126582278481e-06,
"loss": 0.0,
"step": 33200
},
{
"epoch": 332.25,
"learning_rate": 4.294303797468355e-06,
"loss": 0.0,
"step": 33225
},
{
"epoch": 332.5,
"learning_rate": 4.278481012658228e-06,
"loss": 0.0,
"step": 33250
},
{
"epoch": 332.75,
"learning_rate": 4.262658227848101e-06,
"loss": 0.0,
"step": 33275
},
{
"epoch": 333.0,
"learning_rate": 4.246835443037975e-06,
"loss": 0.0,
"step": 33300
},
{
"epoch": 333.25,
"learning_rate": 4.231012658227848e-06,
"loss": 0.0,
"step": 33325
},
{
"epoch": 333.5,
"learning_rate": 4.215189873417722e-06,
"loss": 0.0,
"step": 33350
},
{
"epoch": 333.75,
"learning_rate": 4.199367088607595e-06,
"loss": 0.0,
"step": 33375
},
{
"epoch": 334.0,
"learning_rate": 4.183544303797469e-06,
"loss": 0.0,
"step": 33400
},
{
"epoch": 334.25,
"learning_rate": 4.1677215189873425e-06,
"loss": 0.0,
"step": 33425
},
{
"epoch": 334.5,
"learning_rate": 4.151898734177215e-06,
"loss": 0.0,
"step": 33450
},
{
"epoch": 334.75,
"learning_rate": 4.136075949367089e-06,
"loss": 0.0,
"step": 33475
},
{
"epoch": 335.0,
"learning_rate": 4.120253164556962e-06,
"loss": 0.0,
"step": 33500
},
{
"epoch": 335.25,
"learning_rate": 4.104430379746835e-06,
"loss": 0.0,
"step": 33525
},
{
"epoch": 335.5,
"learning_rate": 4.088607594936709e-06,
"loss": 0.0,
"step": 33550
},
{
"epoch": 335.75,
"learning_rate": 4.072784810126583e-06,
"loss": 0.0,
"step": 33575
},
{
"epoch": 336.0,
"learning_rate": 4.056962025316456e-06,
"loss": 0.0,
"step": 33600
},
{
"epoch": 336.25,
"learning_rate": 4.041139240506329e-06,
"loss": 0.0,
"step": 33625
},
{
"epoch": 336.5,
"learning_rate": 4.025316455696203e-06,
"loss": 0.0,
"step": 33650
},
{
"epoch": 336.75,
"learning_rate": 4.0094936708860765e-06,
"loss": 0.0,
"step": 33675
},
{
"epoch": 337.0,
"learning_rate": 3.993670886075949e-06,
"loss": 0.0,
"step": 33700
},
{
"epoch": 337.25,
"learning_rate": 3.977848101265823e-06,
"loss": 0.0,
"step": 33725
},
{
"epoch": 337.5,
"learning_rate": 3.962025316455696e-06,
"loss": 0.0,
"step": 33750
},
{
"epoch": 337.75,
"learning_rate": 3.946202531645569e-06,
"loss": 0.0,
"step": 33775
},
{
"epoch": 338.0,
"learning_rate": 3.9303797468354435e-06,
"loss": 0.0,
"step": 33800
},
{
"epoch": 338.25,
"learning_rate": 3.914556962025317e-06,
"loss": 0.0,
"step": 33825
},
{
"epoch": 338.5,
"learning_rate": 3.89873417721519e-06,
"loss": 0.0,
"step": 33850
},
{
"epoch": 338.75,
"learning_rate": 3.882911392405063e-06,
"loss": 0.0,
"step": 33875
},
{
"epoch": 339.0,
"learning_rate": 3.867088607594937e-06,
"loss": 0.0,
"step": 33900
},
{
"epoch": 339.25,
"learning_rate": 3.8512658227848105e-06,
"loss": 0.0,
"step": 33925
},
{
"epoch": 339.5,
"learning_rate": 3.835443037974683e-06,
"loss": 0.0,
"step": 33950
},
{
"epoch": 339.75,
"learning_rate": 3.819620253164557e-06,
"loss": 0.0,
"step": 33975
},
{
"epoch": 340.0,
"learning_rate": 3.803797468354431e-06,
"loss": 0.0,
"step": 34000
},
{
"epoch": 340.0,
"eval_loss": 0.5797959566116333,
"eval_runtime": 158.034,
"eval_samples_per_second": 80.628,
"eval_steps_per_second": 1.266,
"eval_wer": 16.353368766609346,
"step": 34000
},
{
"epoch": 340.25,
"learning_rate": 3.7879746835443044e-06,
"loss": 0.0,
"step": 34025
},
{
"epoch": 340.5,
"learning_rate": 3.7721518987341775e-06,
"loss": 0.0,
"step": 34050
},
{
"epoch": 340.75,
"learning_rate": 3.7563291139240507e-06,
"loss": 0.0,
"step": 34075
},
{
"epoch": 341.0,
"learning_rate": 3.7405063291139242e-06,
"loss": 0.0,
"step": 34100
},
{
"epoch": 341.25,
"learning_rate": 3.7246835443037974e-06,
"loss": 0.0,
"step": 34125
},
{
"epoch": 341.5,
"learning_rate": 3.708860759493671e-06,
"loss": 0.0,
"step": 34150
},
{
"epoch": 341.75,
"learning_rate": 3.693037974683544e-06,
"loss": 0.0,
"step": 34175
},
{
"epoch": 342.0,
"learning_rate": 3.677215189873418e-06,
"loss": 0.0,
"step": 34200
},
{
"epoch": 342.25,
"learning_rate": 3.6613924050632917e-06,
"loss": 0.0,
"step": 34225
},
{
"epoch": 342.5,
"learning_rate": 3.645569620253165e-06,
"loss": 0.0,
"step": 34250
},
{
"epoch": 342.75,
"learning_rate": 3.6297468354430384e-06,
"loss": 0.0,
"step": 34275
},
{
"epoch": 343.0,
"learning_rate": 3.6139240506329115e-06,
"loss": 0.0,
"step": 34300
},
{
"epoch": 343.25,
"learning_rate": 3.5981012658227847e-06,
"loss": 0.0,
"step": 34325
},
{
"epoch": 343.5,
"learning_rate": 3.5822784810126582e-06,
"loss": 0.0,
"step": 34350
},
{
"epoch": 343.75,
"learning_rate": 3.5670886075949364e-06,
"loss": 0.0,
"step": 34375
},
{
"epoch": 344.0,
"learning_rate": 3.5512658227848104e-06,
"loss": 0.0,
"step": 34400
},
{
"epoch": 344.25,
"learning_rate": 3.535443037974684e-06,
"loss": 0.0,
"step": 34425
},
{
"epoch": 344.5,
"learning_rate": 3.519620253164557e-06,
"loss": 0.0,
"step": 34450
},
{
"epoch": 344.75,
"learning_rate": 3.5037974683544307e-06,
"loss": 0.0,
"step": 34475
},
{
"epoch": 345.0,
"learning_rate": 3.487974683544304e-06,
"loss": 0.0,
"step": 34500
},
{
"epoch": 345.25,
"learning_rate": 3.4721518987341774e-06,
"loss": 0.0,
"step": 34525
},
{
"epoch": 345.5,
"learning_rate": 3.4563291139240506e-06,
"loss": 0.0,
"step": 34550
},
{
"epoch": 345.75,
"learning_rate": 3.4405063291139237e-06,
"loss": 0.0,
"step": 34575
},
{
"epoch": 346.0,
"learning_rate": 3.4246835443037977e-06,
"loss": 0.0,
"step": 34600
},
{
"epoch": 346.25,
"learning_rate": 3.4088607594936713e-06,
"loss": 0.0,
"step": 34625
},
{
"epoch": 346.5,
"learning_rate": 3.3930379746835444e-06,
"loss": 0.0,
"step": 34650
},
{
"epoch": 346.75,
"learning_rate": 3.377215189873418e-06,
"loss": 0.0,
"step": 34675
},
{
"epoch": 347.0,
"learning_rate": 3.361392405063291e-06,
"loss": 0.0,
"step": 34700
},
{
"epoch": 347.25,
"learning_rate": 3.3455696202531647e-06,
"loss": 0.0,
"step": 34725
},
{
"epoch": 347.5,
"learning_rate": 3.329746835443038e-06,
"loss": 0.0,
"step": 34750
},
{
"epoch": 347.75,
"learning_rate": 3.3139240506329114e-06,
"loss": 0.0,
"step": 34775
},
{
"epoch": 348.0,
"learning_rate": 3.2981012658227854e-06,
"loss": 0.0,
"step": 34800
},
{
"epoch": 348.25,
"learning_rate": 3.2822784810126586e-06,
"loss": 0.0,
"step": 34825
},
{
"epoch": 348.5,
"learning_rate": 3.266455696202532e-06,
"loss": 0.0,
"step": 34850
},
{
"epoch": 348.75,
"learning_rate": 3.2506329113924053e-06,
"loss": 0.0,
"step": 34875
},
{
"epoch": 349.0,
"learning_rate": 3.2348101265822784e-06,
"loss": 0.0,
"step": 34900
},
{
"epoch": 349.25,
"learning_rate": 3.218987341772152e-06,
"loss": 0.0,
"step": 34925
},
{
"epoch": 349.5,
"learning_rate": 3.203164556962025e-06,
"loss": 0.0,
"step": 34950
},
{
"epoch": 349.75,
"learning_rate": 3.1873417721518987e-06,
"loss": 0.0,
"step": 34975
},
{
"epoch": 350.0,
"learning_rate": 3.1715189873417727e-06,
"loss": 0.0,
"step": 35000
},
{
"epoch": 350.0,
"eval_loss": 0.5880439281463623,
"eval_runtime": 159.3626,
"eval_samples_per_second": 79.956,
"eval_steps_per_second": 1.255,
"eval_wer": 16.349460684695952,
"step": 35000
},
{
"epoch": 350.25,
"learning_rate": 3.155696202531646e-06,
"loss": 0.0,
"step": 35025
},
{
"epoch": 350.5,
"learning_rate": 3.1398734177215194e-06,
"loss": 0.0,
"step": 35050
},
{
"epoch": 350.75,
"learning_rate": 3.1240506329113926e-06,
"loss": 0.0,
"step": 35075
},
{
"epoch": 351.0,
"learning_rate": 3.108227848101266e-06,
"loss": 0.0,
"step": 35100
},
{
"epoch": 351.25,
"learning_rate": 3.0924050632911393e-06,
"loss": 0.0,
"step": 35125
},
{
"epoch": 351.5,
"learning_rate": 3.076582278481013e-06,
"loss": 0.0,
"step": 35150
},
{
"epoch": 351.75,
"learning_rate": 3.0607594936708864e-06,
"loss": 0.0,
"step": 35175
},
{
"epoch": 352.0,
"learning_rate": 3.0449367088607596e-06,
"loss": 0.0,
"step": 35200
},
{
"epoch": 352.25,
"learning_rate": 3.029113924050633e-06,
"loss": 0.0,
"step": 35225
},
{
"epoch": 352.5,
"learning_rate": 3.0132911392405063e-06,
"loss": 0.0,
"step": 35250
},
{
"epoch": 352.75,
"learning_rate": 2.99746835443038e-06,
"loss": 0.0,
"step": 35275
},
{
"epoch": 353.0,
"learning_rate": 2.9816455696202534e-06,
"loss": 0.0,
"step": 35300
},
{
"epoch": 353.25,
"learning_rate": 2.9658227848101266e-06,
"loss": 0.0,
"step": 35325
},
{
"epoch": 353.5,
"learning_rate": 2.95e-06,
"loss": 0.0,
"step": 35350
},
{
"epoch": 353.75,
"learning_rate": 2.9341772151898737e-06,
"loss": 0.0,
"step": 35375
},
{
"epoch": 354.0,
"learning_rate": 2.918354430379747e-06,
"loss": 0.0,
"step": 35400
},
{
"epoch": 354.25,
"learning_rate": 2.9025316455696204e-06,
"loss": 0.0,
"step": 35425
},
{
"epoch": 354.5,
"learning_rate": 2.8867088607594936e-06,
"loss": 0.0,
"step": 35450
},
{
"epoch": 354.75,
"learning_rate": 2.8708860759493676e-06,
"loss": 0.0,
"step": 35475
},
{
"epoch": 355.0,
"learning_rate": 2.8550632911392407e-06,
"loss": 0.0,
"step": 35500
},
{
"epoch": 355.25,
"learning_rate": 2.839240506329114e-06,
"loss": 0.0,
"step": 35525
},
{
"epoch": 355.5,
"learning_rate": 2.8234177215189874e-06,
"loss": 0.0,
"step": 35550
},
{
"epoch": 355.75,
"learning_rate": 2.807594936708861e-06,
"loss": 0.0,
"step": 35575
},
{
"epoch": 356.0,
"learning_rate": 2.7917721518987346e-06,
"loss": 0.0,
"step": 35600
},
{
"epoch": 356.25,
"learning_rate": 2.7759493670886077e-06,
"loss": 0.0,
"step": 35625
},
{
"epoch": 356.5,
"learning_rate": 2.760126582278481e-06,
"loss": 0.0,
"step": 35650
},
{
"epoch": 356.75,
"learning_rate": 2.744303797468355e-06,
"loss": 0.0,
"step": 35675
},
{
"epoch": 357.0,
"learning_rate": 2.728481012658228e-06,
"loss": 0.0,
"step": 35700
},
{
"epoch": 357.25,
"learning_rate": 2.7126582278481016e-06,
"loss": 0.0,
"step": 35725
},
{
"epoch": 357.5,
"learning_rate": 2.6968354430379747e-06,
"loss": 0.0,
"step": 35750
},
{
"epoch": 357.75,
"learning_rate": 2.6810126582278483e-06,
"loss": 0.0,
"step": 35775
},
{
"epoch": 358.0,
"learning_rate": 2.665189873417722e-06,
"loss": 0.0,
"step": 35800
},
{
"epoch": 358.25,
"learning_rate": 2.649367088607595e-06,
"loss": 0.0,
"step": 35825
},
{
"epoch": 358.5,
"learning_rate": 2.6335443037974686e-06,
"loss": 0.0,
"step": 35850
},
{
"epoch": 358.75,
"learning_rate": 2.617721518987342e-06,
"loss": 0.0,
"step": 35875
},
{
"epoch": 359.0,
"learning_rate": 2.6018987341772153e-06,
"loss": 0.0,
"step": 35900
},
{
"epoch": 359.25,
"learning_rate": 2.586075949367089e-06,
"loss": 0.0,
"step": 35925
},
{
"epoch": 359.5,
"learning_rate": 2.570253164556962e-06,
"loss": 0.0,
"step": 35950
},
{
"epoch": 359.75,
"learning_rate": 2.5544303797468355e-06,
"loss": 0.0,
"step": 35975
},
{
"epoch": 360.0,
"learning_rate": 2.538607594936709e-06,
"loss": 0.0,
"step": 36000
},
{
"epoch": 360.0,
"eval_loss": 0.5948340892791748,
"eval_runtime": 159.034,
"eval_samples_per_second": 80.121,
"eval_steps_per_second": 1.258,
"eval_wer": 16.36216195091449,
"step": 36000
},
{
"epoch": 360.25,
"learning_rate": 2.5227848101265823e-06,
"loss": 0.0,
"step": 36025
},
{
"epoch": 360.5,
"learning_rate": 2.506962025316456e-06,
"loss": 0.0,
"step": 36050
},
{
"epoch": 360.75,
"learning_rate": 2.491139240506329e-06,
"loss": 0.0,
"step": 36075
},
{
"epoch": 361.0,
"learning_rate": 2.4753164556962025e-06,
"loss": 0.0,
"step": 36100
},
{
"epoch": 361.25,
"learning_rate": 2.459493670886076e-06,
"loss": 0.0,
"step": 36125
},
{
"epoch": 361.5,
"learning_rate": 2.4436708860759493e-06,
"loss": 0.0,
"step": 36150
},
{
"epoch": 361.75,
"learning_rate": 2.427848101265823e-06,
"loss": 0.0,
"step": 36175
},
{
"epoch": 362.0,
"learning_rate": 2.4120253164556964e-06,
"loss": 0.0,
"step": 36200
},
{
"epoch": 362.25,
"learning_rate": 2.3962025316455695e-06,
"loss": 0.0,
"step": 36225
},
{
"epoch": 362.5,
"learning_rate": 2.380379746835443e-06,
"loss": 0.0,
"step": 36250
},
{
"epoch": 362.75,
"learning_rate": 2.3645569620253163e-06,
"loss": 0.0,
"step": 36275
},
{
"epoch": 363.0,
"learning_rate": 2.3487341772151903e-06,
"loss": 0.0,
"step": 36300
},
{
"epoch": 363.25,
"learning_rate": 2.3329113924050634e-06,
"loss": 0.0,
"step": 36325
},
{
"epoch": 363.5,
"learning_rate": 2.317088607594937e-06,
"loss": 0.0,
"step": 36350
},
{
"epoch": 363.75,
"learning_rate": 2.30126582278481e-06,
"loss": 0.0,
"step": 36375
},
{
"epoch": 364.0,
"learning_rate": 2.2860759493670887e-06,
"loss": 0.0,
"step": 36400
},
{
"epoch": 364.25,
"learning_rate": 2.2702531645569623e-06,
"loss": 0.0,
"step": 36425
},
{
"epoch": 364.5,
"learning_rate": 2.2544303797468355e-06,
"loss": 0.0,
"step": 36450
},
{
"epoch": 364.75,
"learning_rate": 2.238607594936709e-06,
"loss": 0.0,
"step": 36475
},
{
"epoch": 365.0,
"learning_rate": 2.2227848101265826e-06,
"loss": 0.0,
"step": 36500
},
{
"epoch": 365.25,
"learning_rate": 2.2069620253164557e-06,
"loss": 0.0,
"step": 36525
},
{
"epoch": 365.5,
"learning_rate": 2.1911392405063293e-06,
"loss": 0.0,
"step": 36550
},
{
"epoch": 365.75,
"learning_rate": 2.175316455696203e-06,
"loss": 0.0,
"step": 36575
},
{
"epoch": 366.0,
"learning_rate": 2.159493670886076e-06,
"loss": 0.0,
"step": 36600
},
{
"epoch": 366.25,
"learning_rate": 2.1436708860759496e-06,
"loss": 0.0,
"step": 36625
},
{
"epoch": 366.5,
"learning_rate": 2.1278481012658227e-06,
"loss": 0.0,
"step": 36650
},
{
"epoch": 366.75,
"learning_rate": 2.1120253164556963e-06,
"loss": 0.0,
"step": 36675
},
{
"epoch": 367.0,
"learning_rate": 2.09620253164557e-06,
"loss": 0.0,
"step": 36700
},
{
"epoch": 367.25,
"learning_rate": 2.080379746835443e-06,
"loss": 0.0,
"step": 36725
},
{
"epoch": 367.5,
"learning_rate": 2.0645569620253166e-06,
"loss": 0.0,
"step": 36750
},
{
"epoch": 367.75,
"learning_rate": 2.0487341772151897e-06,
"loss": 0.0,
"step": 36775
},
{
"epoch": 368.0,
"learning_rate": 2.0329113924050633e-06,
"loss": 0.0,
"step": 36800
},
{
"epoch": 368.25,
"learning_rate": 2.017088607594937e-06,
"loss": 0.0,
"step": 36825
},
{
"epoch": 368.5,
"learning_rate": 2.00126582278481e-06,
"loss": 0.0,
"step": 36850
},
{
"epoch": 368.75,
"learning_rate": 1.9854430379746836e-06,
"loss": 0.0,
"step": 36875
},
{
"epoch": 369.0,
"learning_rate": 1.969620253164557e-06,
"loss": 0.0,
"step": 36900
},
{
"epoch": 369.25,
"learning_rate": 1.9537974683544303e-06,
"loss": 0.0,
"step": 36925
},
{
"epoch": 369.5,
"learning_rate": 1.937974683544304e-06,
"loss": 0.0,
"step": 36950
},
{
"epoch": 369.75,
"learning_rate": 1.922151898734177e-06,
"loss": 0.0,
"step": 36975
},
{
"epoch": 370.0,
"learning_rate": 1.9063291139240508e-06,
"loss": 0.0,
"step": 37000
},
{
"epoch": 370.0,
"eval_loss": 0.6004884839057922,
"eval_runtime": 157.7534,
"eval_samples_per_second": 80.772,
"eval_steps_per_second": 1.268,
"eval_wer": 16.393426606221666,
"step": 37000
},
{
"epoch": 370.25,
"learning_rate": 1.8905063291139242e-06,
"loss": 0.0,
"step": 37025
},
{
"epoch": 370.5,
"learning_rate": 1.8746835443037975e-06,
"loss": 0.0,
"step": 37050
},
{
"epoch": 370.75,
"learning_rate": 1.8588607594936709e-06,
"loss": 0.0,
"step": 37075
},
{
"epoch": 371.0,
"learning_rate": 1.8430379746835444e-06,
"loss": 0.0,
"step": 37100
},
{
"epoch": 371.25,
"learning_rate": 1.8272151898734178e-06,
"loss": 0.0,
"step": 37125
},
{
"epoch": 371.5,
"learning_rate": 1.8113924050632912e-06,
"loss": 0.0,
"step": 37150
},
{
"epoch": 371.75,
"learning_rate": 1.7955696202531645e-06,
"loss": 0.0,
"step": 37175
},
{
"epoch": 372.0,
"learning_rate": 1.7797468354430383e-06,
"loss": 0.0,
"step": 37200
},
{
"epoch": 372.25,
"learning_rate": 1.7639240506329114e-06,
"loss": 0.0,
"step": 37225
},
{
"epoch": 372.5,
"learning_rate": 1.7481012658227848e-06,
"loss": 0.0,
"step": 37250
},
{
"epoch": 372.75,
"learning_rate": 1.7322784810126582e-06,
"loss": 0.0,
"step": 37275
},
{
"epoch": 373.0,
"learning_rate": 1.716455696202532e-06,
"loss": 0.0,
"step": 37300
},
{
"epoch": 373.25,
"learning_rate": 1.7006329113924053e-06,
"loss": 0.0,
"step": 37325
},
{
"epoch": 373.5,
"learning_rate": 1.6848101265822784e-06,
"loss": 0.0,
"step": 37350
},
{
"epoch": 373.75,
"learning_rate": 1.6689873417721518e-06,
"loss": 0.0,
"step": 37375
},
{
"epoch": 374.0,
"learning_rate": 1.6531645569620256e-06,
"loss": 0.0,
"step": 37400
},
{
"epoch": 374.25,
"learning_rate": 1.637341772151899e-06,
"loss": 0.0,
"step": 37425
},
{
"epoch": 374.5,
"learning_rate": 1.6215189873417723e-06,
"loss": 0.0,
"step": 37450
},
{
"epoch": 374.75,
"learning_rate": 1.6056962025316457e-06,
"loss": 0.0,
"step": 37475
},
{
"epoch": 375.0,
"learning_rate": 1.5898734177215188e-06,
"loss": 0.0,
"step": 37500
},
{
"epoch": 375.25,
"learning_rate": 1.5740506329113926e-06,
"loss": 0.0,
"step": 37525
},
{
"epoch": 375.5,
"learning_rate": 1.558227848101266e-06,
"loss": 0.0,
"step": 37550
},
{
"epoch": 375.75,
"learning_rate": 1.5424050632911393e-06,
"loss": 0.0,
"step": 37575
},
{
"epoch": 376.0,
"learning_rate": 1.5265822784810127e-06,
"loss": 0.0,
"step": 37600
},
{
"epoch": 376.25,
"learning_rate": 1.510759493670886e-06,
"loss": 0.0,
"step": 37625
},
{
"epoch": 376.5,
"learning_rate": 1.4949367088607596e-06,
"loss": 0.0,
"step": 37650
},
{
"epoch": 376.75,
"learning_rate": 1.479113924050633e-06,
"loss": 0.0,
"step": 37675
},
{
"epoch": 377.0,
"learning_rate": 1.4632911392405065e-06,
"loss": 0.0,
"step": 37700
},
{
"epoch": 377.25,
"learning_rate": 1.4474683544303797e-06,
"loss": 0.0,
"step": 37725
},
{
"epoch": 377.5,
"learning_rate": 1.4316455696202532e-06,
"loss": 0.0,
"step": 37750
},
{
"epoch": 377.75,
"learning_rate": 1.4158227848101266e-06,
"loss": 0.0,
"step": 37775
},
{
"epoch": 378.0,
"learning_rate": 1.4000000000000001e-06,
"loss": 0.0,
"step": 37800
},
{
"epoch": 378.25,
"learning_rate": 1.3841772151898735e-06,
"loss": 0.0,
"step": 37825
},
{
"epoch": 378.5,
"learning_rate": 1.3683544303797469e-06,
"loss": 0.0,
"step": 37850
},
{
"epoch": 378.75,
"learning_rate": 1.3525316455696202e-06,
"loss": 0.0,
"step": 37875
},
{
"epoch": 379.0,
"learning_rate": 1.3367088607594938e-06,
"loss": 0.0,
"step": 37900
},
{
"epoch": 379.25,
"learning_rate": 1.3208860759493671e-06,
"loss": 0.0,
"step": 37925
},
{
"epoch": 379.5,
"learning_rate": 1.3050632911392407e-06,
"loss": 0.0,
"step": 37950
},
{
"epoch": 379.75,
"learning_rate": 1.2892405063291139e-06,
"loss": 0.0,
"step": 37975
},
{
"epoch": 380.0,
"learning_rate": 1.2734177215189874e-06,
"loss": 0.0,
"step": 38000
},
{
"epoch": 380.0,
"eval_loss": 0.6044662594795227,
"eval_runtime": 158.9961,
"eval_samples_per_second": 80.14,
"eval_steps_per_second": 1.258,
"eval_wer": 16.38756448335157,
"step": 38000
},
{
"epoch": 380.25,
"learning_rate": 1.2575949367088608e-06,
"loss": 0.0,
"step": 38025
},
{
"epoch": 380.5,
"learning_rate": 1.2417721518987344e-06,
"loss": 0.0,
"step": 38050
},
{
"epoch": 380.75,
"learning_rate": 1.2259493670886077e-06,
"loss": 0.0,
"step": 38075
},
{
"epoch": 381.0,
"learning_rate": 1.210126582278481e-06,
"loss": 0.0,
"step": 38100
},
{
"epoch": 381.25,
"learning_rate": 1.1943037974683544e-06,
"loss": 0.0,
"step": 38125
},
{
"epoch": 381.5,
"learning_rate": 1.178481012658228e-06,
"loss": 0.0,
"step": 38150
},
{
"epoch": 381.75,
"learning_rate": 1.1626582278481014e-06,
"loss": 0.0,
"step": 38175
},
{
"epoch": 382.0,
"learning_rate": 1.1468354430379747e-06,
"loss": 0.0,
"step": 38200
},
{
"epoch": 382.25,
"learning_rate": 1.131012658227848e-06,
"loss": 0.0,
"step": 38225
},
{
"epoch": 382.5,
"learning_rate": 1.1151898734177216e-06,
"loss": 0.0,
"step": 38250
},
{
"epoch": 382.75,
"learning_rate": 1.099367088607595e-06,
"loss": 0.0,
"step": 38275
},
{
"epoch": 383.0,
"learning_rate": 1.0835443037974686e-06,
"loss": 0.0,
"step": 38300
},
{
"epoch": 383.25,
"learning_rate": 1.0677215189873417e-06,
"loss": 0.0,
"step": 38325
},
{
"epoch": 383.5,
"learning_rate": 1.0518987341772153e-06,
"loss": 0.0,
"step": 38350
},
{
"epoch": 383.75,
"learning_rate": 1.0360759493670886e-06,
"loss": 0.0,
"step": 38375
},
{
"epoch": 384.0,
"learning_rate": 1.020253164556962e-06,
"loss": 0.0,
"step": 38400
},
{
"epoch": 384.25,
"learning_rate": 1.0050632911392404e-06,
"loss": 0.0,
"step": 38425
},
{
"epoch": 384.5,
"learning_rate": 9.89240506329114e-07,
"loss": 0.0,
"step": 38450
},
{
"epoch": 384.75,
"learning_rate": 9.734177215189873e-07,
"loss": 0.0,
"step": 38475
},
{
"epoch": 385.0,
"learning_rate": 9.57594936708861e-07,
"loss": 0.0,
"step": 38500
},
{
"epoch": 385.25,
"learning_rate": 9.417721518987342e-07,
"loss": 0.0,
"step": 38525
},
{
"epoch": 385.5,
"learning_rate": 9.259493670886077e-07,
"loss": 0.0,
"step": 38550
},
{
"epoch": 385.75,
"learning_rate": 9.10126582278481e-07,
"loss": 0.0,
"step": 38575
},
{
"epoch": 386.0,
"learning_rate": 8.943037974683546e-07,
"loss": 0.0,
"step": 38600
},
{
"epoch": 386.25,
"learning_rate": 8.784810126582279e-07,
"loss": 0.0,
"step": 38625
},
{
"epoch": 386.5,
"learning_rate": 8.626582278481014e-07,
"loss": 0.0,
"step": 38650
},
{
"epoch": 386.75,
"learning_rate": 8.468354430379747e-07,
"loss": 0.0,
"step": 38675
},
{
"epoch": 387.0,
"learning_rate": 8.310126582278482e-07,
"loss": 0.0,
"step": 38700
},
{
"epoch": 387.25,
"learning_rate": 8.151898734177215e-07,
"loss": 0.0,
"step": 38725
},
{
"epoch": 387.5,
"learning_rate": 7.99367088607595e-07,
"loss": 0.0,
"step": 38750
},
{
"epoch": 387.75,
"learning_rate": 7.835443037974684e-07,
"loss": 0.0,
"step": 38775
},
{
"epoch": 388.0,
"learning_rate": 7.677215189873418e-07,
"loss": 0.0,
"step": 38800
},
{
"epoch": 388.25,
"learning_rate": 7.518987341772152e-07,
"loss": 0.0,
"step": 38825
},
{
"epoch": 388.5,
"learning_rate": 7.360759493670887e-07,
"loss": 0.0,
"step": 38850
},
{
"epoch": 388.75,
"learning_rate": 7.20253164556962e-07,
"loss": 0.0,
"step": 38875
},
{
"epoch": 389.0,
"learning_rate": 7.044303797468355e-07,
"loss": 0.0,
"step": 38900
},
{
"epoch": 389.25,
"learning_rate": 6.886075949367089e-07,
"loss": 0.0,
"step": 38925
},
{
"epoch": 389.5,
"learning_rate": 6.727848101265823e-07,
"loss": 0.0,
"step": 38950
},
{
"epoch": 389.75,
"learning_rate": 6.569620253164558e-07,
"loss": 0.0,
"step": 38975
},
{
"epoch": 390.0,
"learning_rate": 6.411392405063291e-07,
"loss": 0.0,
"step": 39000
},
{
"epoch": 390.0,
"eval_loss": 0.6074256300926208,
"eval_runtime": 159.2979,
"eval_samples_per_second": 79.989,
"eval_steps_per_second": 1.256,
"eval_wer": 16.432507425355634,
"step": 39000
},
{
"epoch": 390.25,
"learning_rate": 6.253164556962026e-07,
"loss": 0.0,
"step": 39025
},
{
"epoch": 390.5,
"learning_rate": 6.094936708860759e-07,
"loss": 0.0,
"step": 39050
},
{
"epoch": 390.75,
"learning_rate": 5.936708860759494e-07,
"loss": 0.0,
"step": 39075
},
{
"epoch": 391.0,
"learning_rate": 5.778481012658229e-07,
"loss": 0.0,
"step": 39100
},
{
"epoch": 391.25,
"learning_rate": 5.620253164556962e-07,
"loss": 0.0,
"step": 39125
},
{
"epoch": 391.5,
"learning_rate": 5.462025316455697e-07,
"loss": 0.0,
"step": 39150
},
{
"epoch": 391.75,
"learning_rate": 5.30379746835443e-07,
"loss": 0.0,
"step": 39175
},
{
"epoch": 392.0,
"learning_rate": 5.145569620253165e-07,
"loss": 0.0,
"step": 39200
},
{
"epoch": 392.25,
"learning_rate": 4.9873417721519e-07,
"loss": 0.0,
"step": 39225
},
{
"epoch": 392.5,
"learning_rate": 4.829113924050633e-07,
"loss": 0.0,
"step": 39250
},
{
"epoch": 392.75,
"learning_rate": 4.670886075949368e-07,
"loss": 0.0,
"step": 39275
},
{
"epoch": 393.0,
"learning_rate": 4.512658227848102e-07,
"loss": 0.0,
"step": 39300
},
{
"epoch": 393.25,
"learning_rate": 4.354430379746836e-07,
"loss": 0.0,
"step": 39325
},
{
"epoch": 393.5,
"learning_rate": 4.19620253164557e-07,
"loss": 0.0,
"step": 39350
},
{
"epoch": 393.75,
"learning_rate": 4.0379746835443043e-07,
"loss": 0.0,
"step": 39375
},
{
"epoch": 394.0,
"learning_rate": 3.8797468354430384e-07,
"loss": 0.0,
"step": 39400
},
{
"epoch": 394.25,
"learning_rate": 3.7215189873417725e-07,
"loss": 0.0,
"step": 39425
},
{
"epoch": 394.5,
"learning_rate": 3.5632911392405066e-07,
"loss": 0.0,
"step": 39450
},
{
"epoch": 394.75,
"learning_rate": 3.4050632911392407e-07,
"loss": 0.0,
"step": 39475
},
{
"epoch": 395.0,
"learning_rate": 3.246835443037975e-07,
"loss": 0.0,
"step": 39500
},
{
"epoch": 395.25,
"learning_rate": 3.088607594936709e-07,
"loss": 0.0,
"step": 39525
},
{
"epoch": 395.5,
"learning_rate": 2.9303797468354436e-07,
"loss": 0.0,
"step": 39550
},
{
"epoch": 395.75,
"learning_rate": 2.7721518987341777e-07,
"loss": 0.0,
"step": 39575
},
{
"epoch": 396.0,
"learning_rate": 2.613924050632912e-07,
"loss": 0.0,
"step": 39600
},
{
"epoch": 396.25,
"learning_rate": 2.4556962025316454e-07,
"loss": 0.0,
"step": 39625
},
{
"epoch": 396.5,
"learning_rate": 2.2974683544303797e-07,
"loss": 0.0,
"step": 39650
},
{
"epoch": 396.75,
"learning_rate": 2.1392405063291138e-07,
"loss": 0.0,
"step": 39675
},
{
"epoch": 397.0,
"learning_rate": 1.9810126582278482e-07,
"loss": 0.0,
"step": 39700
},
{
"epoch": 397.25,
"learning_rate": 1.8227848101265823e-07,
"loss": 0.0,
"step": 39725
},
{
"epoch": 397.5,
"learning_rate": 1.6645569620253164e-07,
"loss": 0.0,
"step": 39750
},
{
"epoch": 397.75,
"learning_rate": 1.5063291139240508e-07,
"loss": 0.0,
"step": 39775
},
{
"epoch": 398.0,
"learning_rate": 1.348101265822785e-07,
"loss": 0.0,
"step": 39800
},
{
"epoch": 398.25,
"learning_rate": 1.189873417721519e-07,
"loss": 0.0,
"step": 39825
},
{
"epoch": 398.5,
"learning_rate": 1.0316455696202532e-07,
"loss": 0.0,
"step": 39850
},
{
"epoch": 398.75,
"learning_rate": 8.734177215189874e-08,
"loss": 0.0,
"step": 39875
},
{
"epoch": 399.0,
"learning_rate": 7.151898734177216e-08,
"loss": 0.0,
"step": 39900
},
{
"epoch": 399.25,
"learning_rate": 5.569620253164557e-08,
"loss": 0.0,
"step": 39925
},
{
"epoch": 399.5,
"learning_rate": 3.987341772151899e-08,
"loss": 0.0,
"step": 39950
},
{
"epoch": 399.75,
"learning_rate": 2.4050632911392406e-08,
"loss": 0.0,
"step": 39975
},
{
"epoch": 400.0,
"learning_rate": 8.227848101265823e-09,
"loss": 0.0,
"step": 40000
},
{
"epoch": 400.0,
"eval_loss": 0.6085276007652283,
"eval_runtime": 158.0696,
"eval_samples_per_second": 80.61,
"eval_steps_per_second": 1.265,
"eval_wer": 16.431530404877286,
"step": 40000
},
{
"epoch": 400.0,
"step": 40000,
"total_flos": 6.61156856856576e+20,
"train_loss": 0.008819907821263906,
"train_runtime": 68982.7856,
"train_samples_per_second": 148.443,
"train_steps_per_second": 0.58
}
],
"logging_steps": 25,
"max_steps": 40000,
"num_input_tokens_seen": 0,
"num_train_epochs": 400,
"save_steps": 1000,
"total_flos": 6.61156856856576e+20,
"train_batch_size": 128,
"trial_name": null,
"trial_params": null
}