whisper-base-nl-3 / trainer_state.json
SuperKogito's picture
End of training
82c80ef
{
"best_metric": 18.48141795311607,
"best_model_checkpoint": "whisper-base-nl-3/checkpoint-29000",
"epoch": 49.07306434023991,
"global_step": 45000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 4.0000000000000003e-07,
"loss": 1.3847,
"step": 25
},
{
"epoch": 0.0,
"learning_rate": 9.000000000000001e-07,
"loss": 1.4601,
"step": 50
},
{
"epoch": 0.0,
"learning_rate": 1.4000000000000001e-06,
"loss": 1.3556,
"step": 75
},
{
"epoch": 0.01,
"learning_rate": 1.9000000000000002e-06,
"loss": 1.1454,
"step": 100
},
{
"epoch": 0.01,
"learning_rate": 2.4000000000000003e-06,
"loss": 1.2552,
"step": 125
},
{
"epoch": 0.01,
"learning_rate": 2.9e-06,
"loss": 1.1695,
"step": 150
},
{
"epoch": 0.01,
"learning_rate": 3.4000000000000005e-06,
"loss": 0.9503,
"step": 175
},
{
"epoch": 0.01,
"learning_rate": 3.900000000000001e-06,
"loss": 0.9096,
"step": 200
},
{
"epoch": 0.01,
"learning_rate": 4.4e-06,
"loss": 0.8853,
"step": 225
},
{
"epoch": 0.02,
"learning_rate": 4.9000000000000005e-06,
"loss": 0.833,
"step": 250
},
{
"epoch": 0.02,
"learning_rate": 5.400000000000001e-06,
"loss": 0.8597,
"step": 275
},
{
"epoch": 0.02,
"learning_rate": 5.9e-06,
"loss": 0.8199,
"step": 300
},
{
"epoch": 0.02,
"learning_rate": 6.4000000000000006e-06,
"loss": 0.7158,
"step": 325
},
{
"epoch": 0.02,
"learning_rate": 6.9e-06,
"loss": 0.6896,
"step": 350
},
{
"epoch": 0.02,
"learning_rate": 7.4e-06,
"loss": 0.662,
"step": 375
},
{
"epoch": 0.03,
"learning_rate": 7.9e-06,
"loss": 0.8284,
"step": 400
},
{
"epoch": 0.03,
"learning_rate": 8.400000000000001e-06,
"loss": 0.6544,
"step": 425
},
{
"epoch": 0.03,
"learning_rate": 8.900000000000001e-06,
"loss": 0.7486,
"step": 450
},
{
"epoch": 0.03,
"learning_rate": 9.4e-06,
"loss": 0.5652,
"step": 475
},
{
"epoch": 0.03,
"learning_rate": 9.9e-06,
"loss": 0.6604,
"step": 500
},
{
"epoch": 0.03,
"learning_rate": 9.994202898550725e-06,
"loss": 0.7287,
"step": 525
},
{
"epoch": 0.04,
"learning_rate": 9.986956521739132e-06,
"loss": 0.6413,
"step": 550
},
{
"epoch": 0.04,
"learning_rate": 9.979710144927537e-06,
"loss": 0.6762,
"step": 575
},
{
"epoch": 0.04,
"learning_rate": 9.972463768115943e-06,
"loss": 0.6882,
"step": 600
},
{
"epoch": 0.04,
"learning_rate": 9.965217391304348e-06,
"loss": 0.7015,
"step": 625
},
{
"epoch": 0.04,
"learning_rate": 9.957971014492755e-06,
"loss": 0.6145,
"step": 650
},
{
"epoch": 0.04,
"learning_rate": 9.95072463768116e-06,
"loss": 0.6674,
"step": 675
},
{
"epoch": 0.05,
"learning_rate": 9.943478260869565e-06,
"loss": 0.5915,
"step": 700
},
{
"epoch": 0.05,
"learning_rate": 9.936231884057972e-06,
"loss": 0.6632,
"step": 725
},
{
"epoch": 0.05,
"learning_rate": 9.928985507246378e-06,
"loss": 0.6157,
"step": 750
},
{
"epoch": 0.05,
"learning_rate": 9.921739130434783e-06,
"loss": 0.7222,
"step": 775
},
{
"epoch": 0.05,
"learning_rate": 9.91449275362319e-06,
"loss": 0.6447,
"step": 800
},
{
"epoch": 0.05,
"learning_rate": 9.907246376811595e-06,
"loss": 0.6848,
"step": 825
},
{
"epoch": 0.06,
"learning_rate": 9.9e-06,
"loss": 0.6391,
"step": 850
},
{
"epoch": 0.06,
"learning_rate": 9.892753623188407e-06,
"loss": 0.6543,
"step": 875
},
{
"epoch": 0.06,
"learning_rate": 9.885507246376812e-06,
"loss": 0.5579,
"step": 900
},
{
"epoch": 0.06,
"learning_rate": 9.878260869565218e-06,
"loss": 0.5699,
"step": 925
},
{
"epoch": 0.06,
"learning_rate": 9.871014492753625e-06,
"loss": 0.5404,
"step": 950
},
{
"epoch": 0.06,
"learning_rate": 9.86376811594203e-06,
"loss": 0.6237,
"step": 975
},
{
"epoch": 0.06,
"learning_rate": 9.856521739130435e-06,
"loss": 0.5761,
"step": 1000
},
{
"epoch": 0.06,
"eval_cer": 10.115352452161936,
"eval_loss": 0.5675458908081055,
"eval_runtime": 3220.6897,
"eval_samples_per_second": 0.771,
"eval_steps_per_second": 0.385,
"eval_wer": 28.15323041738136,
"step": 1000
},
{
"epoch": 0.07,
"learning_rate": 9.84927536231884e-06,
"loss": 0.6175,
"step": 1025
},
{
"epoch": 0.07,
"learning_rate": 9.842028985507247e-06,
"loss": 0.6934,
"step": 1050
},
{
"epoch": 0.07,
"learning_rate": 9.834782608695654e-06,
"loss": 0.5818,
"step": 1075
},
{
"epoch": 0.07,
"learning_rate": 9.827536231884059e-06,
"loss": 0.6175,
"step": 1100
},
{
"epoch": 0.07,
"learning_rate": 9.820289855072465e-06,
"loss": 0.4952,
"step": 1125
},
{
"epoch": 0.07,
"learning_rate": 9.81304347826087e-06,
"loss": 0.6194,
"step": 1150
},
{
"epoch": 0.08,
"learning_rate": 9.805797101449275e-06,
"loss": 0.5897,
"step": 1175
},
{
"epoch": 0.08,
"learning_rate": 9.798550724637682e-06,
"loss": 0.5356,
"step": 1200
},
{
"epoch": 0.08,
"learning_rate": 9.791304347826089e-06,
"loss": 0.5805,
"step": 1225
},
{
"epoch": 0.08,
"learning_rate": 9.784057971014494e-06,
"loss": 0.5446,
"step": 1250
},
{
"epoch": 0.08,
"learning_rate": 9.776811594202899e-06,
"loss": 0.6734,
"step": 1275
},
{
"epoch": 0.08,
"learning_rate": 9.769565217391305e-06,
"loss": 0.5457,
"step": 1300
},
{
"epoch": 0.09,
"learning_rate": 9.76231884057971e-06,
"loss": 0.4686,
"step": 1325
},
{
"epoch": 0.09,
"learning_rate": 9.755072463768117e-06,
"loss": 0.5954,
"step": 1350
},
{
"epoch": 0.09,
"learning_rate": 9.747826086956522e-06,
"loss": 0.4973,
"step": 1375
},
{
"epoch": 0.09,
"learning_rate": 9.740579710144929e-06,
"loss": 0.5727,
"step": 1400
},
{
"epoch": 0.09,
"learning_rate": 9.733333333333334e-06,
"loss": 0.5767,
"step": 1425
},
{
"epoch": 0.09,
"learning_rate": 9.726086956521739e-06,
"loss": 0.4814,
"step": 1450
},
{
"epoch": 0.1,
"learning_rate": 9.718840579710146e-06,
"loss": 0.5544,
"step": 1475
},
{
"epoch": 0.1,
"learning_rate": 9.71159420289855e-06,
"loss": 0.5281,
"step": 1500
},
{
"epoch": 0.1,
"learning_rate": 9.704347826086957e-06,
"loss": 0.612,
"step": 1525
},
{
"epoch": 0.1,
"learning_rate": 9.697101449275364e-06,
"loss": 0.5293,
"step": 1550
},
{
"epoch": 0.1,
"learning_rate": 9.689855072463769e-06,
"loss": 0.5881,
"step": 1575
},
{
"epoch": 0.1,
"learning_rate": 9.682608695652174e-06,
"loss": 0.5571,
"step": 1600
},
{
"epoch": 0.11,
"learning_rate": 9.67536231884058e-06,
"loss": 0.429,
"step": 1625
},
{
"epoch": 0.11,
"learning_rate": 9.668115942028986e-06,
"loss": 0.4661,
"step": 1650
},
{
"epoch": 0.11,
"learning_rate": 9.660869565217392e-06,
"loss": 0.5181,
"step": 1675
},
{
"epoch": 0.11,
"learning_rate": 9.653623188405797e-06,
"loss": 0.5188,
"step": 1700
},
{
"epoch": 0.11,
"learning_rate": 9.646376811594204e-06,
"loss": 0.4881,
"step": 1725
},
{
"epoch": 0.11,
"learning_rate": 9.639130434782609e-06,
"loss": 0.6319,
"step": 1750
},
{
"epoch": 0.11,
"learning_rate": 9.631884057971014e-06,
"loss": 0.6,
"step": 1775
},
{
"epoch": 0.12,
"learning_rate": 9.624637681159421e-06,
"loss": 0.5251,
"step": 1800
},
{
"epoch": 0.12,
"learning_rate": 9.617391304347828e-06,
"loss": 0.4999,
"step": 1825
},
{
"epoch": 0.12,
"learning_rate": 9.610144927536233e-06,
"loss": 0.5612,
"step": 1850
},
{
"epoch": 0.12,
"learning_rate": 9.60289855072464e-06,
"loss": 0.456,
"step": 1875
},
{
"epoch": 0.12,
"learning_rate": 9.595652173913044e-06,
"loss": 0.5589,
"step": 1900
},
{
"epoch": 0.12,
"learning_rate": 9.58840579710145e-06,
"loss": 0.396,
"step": 1925
},
{
"epoch": 0.13,
"learning_rate": 9.581159420289856e-06,
"loss": 0.4713,
"step": 1950
},
{
"epoch": 0.13,
"learning_rate": 9.573913043478261e-06,
"loss": 0.5178,
"step": 1975
},
{
"epoch": 0.13,
"learning_rate": 9.566666666666668e-06,
"loss": 0.48,
"step": 2000
},
{
"epoch": 0.13,
"eval_cer": 9.69108170593733,
"eval_loss": 0.5239235162734985,
"eval_runtime": 3297.9692,
"eval_samples_per_second": 0.753,
"eval_steps_per_second": 0.376,
"eval_wer": 26.436439870402133,
"step": 2000
},
{
"epoch": 0.13,
"learning_rate": 9.559420289855074e-06,
"loss": 0.5154,
"step": 2025
},
{
"epoch": 0.13,
"learning_rate": 9.55217391304348e-06,
"loss": 0.5715,
"step": 2050
},
{
"epoch": 0.13,
"learning_rate": 9.545217391304349e-06,
"loss": 0.5522,
"step": 2075
},
{
"epoch": 0.14,
"learning_rate": 9.537971014492754e-06,
"loss": 0.5205,
"step": 2100
},
{
"epoch": 0.14,
"learning_rate": 9.53072463768116e-06,
"loss": 0.4494,
"step": 2125
},
{
"epoch": 0.14,
"learning_rate": 9.523478260869566e-06,
"loss": 0.5226,
"step": 2150
},
{
"epoch": 0.14,
"learning_rate": 9.516231884057972e-06,
"loss": 0.469,
"step": 2175
},
{
"epoch": 0.14,
"learning_rate": 9.508985507246377e-06,
"loss": 0.5067,
"step": 2200
},
{
"epoch": 0.14,
"learning_rate": 9.501739130434784e-06,
"loss": 0.5879,
"step": 2225
},
{
"epoch": 0.15,
"learning_rate": 9.494492753623189e-06,
"loss": 0.8063,
"step": 2250
},
{
"epoch": 0.15,
"learning_rate": 9.487246376811596e-06,
"loss": 0.5067,
"step": 2275
},
{
"epoch": 0.15,
"learning_rate": 9.48e-06,
"loss": 0.5124,
"step": 2300
},
{
"epoch": 0.15,
"learning_rate": 9.472753623188406e-06,
"loss": 0.4894,
"step": 2325
},
{
"epoch": 0.15,
"learning_rate": 9.465507246376812e-06,
"loss": 0.504,
"step": 2350
},
{
"epoch": 0.15,
"learning_rate": 9.458260869565217e-06,
"loss": 0.545,
"step": 2375
},
{
"epoch": 0.16,
"learning_rate": 9.451014492753624e-06,
"loss": 0.4962,
"step": 2400
},
{
"epoch": 0.16,
"learning_rate": 9.44376811594203e-06,
"loss": 0.4774,
"step": 2425
},
{
"epoch": 0.16,
"learning_rate": 9.436521739130436e-06,
"loss": 0.5429,
"step": 2450
},
{
"epoch": 0.16,
"learning_rate": 9.42927536231884e-06,
"loss": 0.445,
"step": 2475
},
{
"epoch": 0.16,
"learning_rate": 9.422028985507246e-06,
"loss": 0.4111,
"step": 2500
},
{
"epoch": 0.16,
"learning_rate": 9.414782608695653e-06,
"loss": 0.5188,
"step": 2525
},
{
"epoch": 0.17,
"learning_rate": 9.40753623188406e-06,
"loss": 0.4584,
"step": 2550
},
{
"epoch": 0.17,
"learning_rate": 9.400289855072464e-06,
"loss": 0.5017,
"step": 2575
},
{
"epoch": 0.17,
"learning_rate": 9.393043478260871e-06,
"loss": 0.593,
"step": 2600
},
{
"epoch": 0.17,
"learning_rate": 9.385797101449276e-06,
"loss": 0.5195,
"step": 2625
},
{
"epoch": 0.17,
"learning_rate": 9.378550724637681e-06,
"loss": 0.5083,
"step": 2650
},
{
"epoch": 0.17,
"learning_rate": 9.371304347826088e-06,
"loss": 0.5534,
"step": 2675
},
{
"epoch": 0.17,
"learning_rate": 9.364057971014493e-06,
"loss": 0.4893,
"step": 2700
},
{
"epoch": 0.18,
"learning_rate": 9.3568115942029e-06,
"loss": 0.4512,
"step": 2725
},
{
"epoch": 0.18,
"learning_rate": 9.349565217391306e-06,
"loss": 0.5876,
"step": 2750
},
{
"epoch": 0.18,
"learning_rate": 9.342318840579711e-06,
"loss": 0.4597,
"step": 2775
},
{
"epoch": 0.18,
"learning_rate": 9.335072463768116e-06,
"loss": 0.3634,
"step": 2800
},
{
"epoch": 0.18,
"learning_rate": 9.327826086956523e-06,
"loss": 0.4483,
"step": 2825
},
{
"epoch": 0.18,
"learning_rate": 9.320579710144928e-06,
"loss": 0.5484,
"step": 2850
},
{
"epoch": 0.19,
"learning_rate": 9.313333333333335e-06,
"loss": 0.4852,
"step": 2875
},
{
"epoch": 0.19,
"learning_rate": 9.306086956521741e-06,
"loss": 0.5576,
"step": 2900
},
{
"epoch": 0.19,
"learning_rate": 9.298840579710146e-06,
"loss": 0.5107,
"step": 2925
},
{
"epoch": 0.19,
"learning_rate": 9.291594202898551e-06,
"loss": 0.5286,
"step": 2950
},
{
"epoch": 0.19,
"learning_rate": 9.284347826086956e-06,
"loss": 0.5618,
"step": 2975
},
{
"epoch": 0.19,
"learning_rate": 9.277101449275363e-06,
"loss": 0.4094,
"step": 3000
},
{
"epoch": 0.19,
"eval_cer": 9.153180185941267,
"eval_loss": 0.49246901273727417,
"eval_runtime": 3242.5657,
"eval_samples_per_second": 0.765,
"eval_steps_per_second": 0.383,
"eval_wer": 24.835525061940157,
"step": 3000
},
{
"epoch": 0.2,
"learning_rate": 9.26985507246377e-06,
"loss": 0.5152,
"step": 3025
},
{
"epoch": 0.2,
"learning_rate": 9.262608695652175e-06,
"loss": 0.5572,
"step": 3050
},
{
"epoch": 0.2,
"learning_rate": 9.255362318840581e-06,
"loss": 0.4801,
"step": 3075
},
{
"epoch": 0.2,
"learning_rate": 9.248115942028986e-06,
"loss": 0.4005,
"step": 3100
},
{
"epoch": 0.2,
"learning_rate": 9.240869565217391e-06,
"loss": 0.4693,
"step": 3125
},
{
"epoch": 0.2,
"learning_rate": 9.233623188405798e-06,
"loss": 0.4487,
"step": 3150
},
{
"epoch": 0.21,
"learning_rate": 9.226376811594203e-06,
"loss": 0.4477,
"step": 3175
},
{
"epoch": 0.21,
"learning_rate": 9.21913043478261e-06,
"loss": 0.4,
"step": 3200
},
{
"epoch": 0.21,
"learning_rate": 9.211884057971015e-06,
"loss": 0.4358,
"step": 3225
},
{
"epoch": 0.21,
"learning_rate": 9.204637681159421e-06,
"loss": 0.4952,
"step": 3250
},
{
"epoch": 0.21,
"learning_rate": 9.197391304347826e-06,
"loss": 0.4526,
"step": 3275
},
{
"epoch": 0.21,
"learning_rate": 9.190144927536233e-06,
"loss": 0.3588,
"step": 3300
},
{
"epoch": 0.22,
"learning_rate": 9.182898550724638e-06,
"loss": 0.5127,
"step": 3325
},
{
"epoch": 0.22,
"learning_rate": 9.175652173913045e-06,
"loss": 0.6166,
"step": 3350
},
{
"epoch": 0.22,
"learning_rate": 9.16840579710145e-06,
"loss": 0.5032,
"step": 3375
},
{
"epoch": 0.22,
"learning_rate": 9.161159420289855e-06,
"loss": 0.5632,
"step": 3400
},
{
"epoch": 0.22,
"learning_rate": 9.153913043478262e-06,
"loss": 0.5268,
"step": 3425
},
{
"epoch": 0.22,
"learning_rate": 9.146666666666667e-06,
"loss": 0.4672,
"step": 3450
},
{
"epoch": 0.23,
"learning_rate": 9.139420289855073e-06,
"loss": 0.4342,
"step": 3475
},
{
"epoch": 0.23,
"learning_rate": 9.13217391304348e-06,
"loss": 0.4504,
"step": 3500
},
{
"epoch": 0.23,
"learning_rate": 9.124927536231885e-06,
"loss": 0.4076,
"step": 3525
},
{
"epoch": 0.23,
"learning_rate": 9.11768115942029e-06,
"loss": 0.5036,
"step": 3550
},
{
"epoch": 0.23,
"learning_rate": 9.110434782608695e-06,
"loss": 0.3835,
"step": 3575
},
{
"epoch": 0.23,
"learning_rate": 9.103188405797102e-06,
"loss": 0.3652,
"step": 3600
},
{
"epoch": 0.23,
"learning_rate": 9.095942028985508e-06,
"loss": 0.4231,
"step": 3625
},
{
"epoch": 0.24,
"learning_rate": 9.088695652173913e-06,
"loss": 0.4644,
"step": 3650
},
{
"epoch": 0.24,
"learning_rate": 9.08144927536232e-06,
"loss": 0.5602,
"step": 3675
},
{
"epoch": 0.24,
"learning_rate": 9.074202898550725e-06,
"loss": 0.4637,
"step": 3700
},
{
"epoch": 0.24,
"learning_rate": 9.06695652173913e-06,
"loss": 0.4324,
"step": 3725
},
{
"epoch": 0.24,
"learning_rate": 9.059710144927537e-06,
"loss": 0.446,
"step": 3750
},
{
"epoch": 0.24,
"learning_rate": 9.052463768115944e-06,
"loss": 0.5127,
"step": 3775
},
{
"epoch": 0.25,
"learning_rate": 9.045217391304349e-06,
"loss": 0.4453,
"step": 3800
},
{
"epoch": 0.25,
"learning_rate": 9.037971014492755e-06,
"loss": 0.4382,
"step": 3825
},
{
"epoch": 0.25,
"learning_rate": 9.03072463768116e-06,
"loss": 0.5816,
"step": 3850
},
{
"epoch": 0.25,
"learning_rate": 9.023478260869565e-06,
"loss": 0.397,
"step": 3875
},
{
"epoch": 0.25,
"learning_rate": 9.016231884057972e-06,
"loss": 0.4512,
"step": 3900
},
{
"epoch": 0.25,
"learning_rate": 9.008985507246377e-06,
"loss": 0.4541,
"step": 3925
},
{
"epoch": 0.26,
"learning_rate": 9.001739130434784e-06,
"loss": 0.3829,
"step": 3950
},
{
"epoch": 0.26,
"learning_rate": 8.99449275362319e-06,
"loss": 0.5275,
"step": 3975
},
{
"epoch": 0.26,
"learning_rate": 8.987246376811595e-06,
"loss": 0.4792,
"step": 4000
},
{
"epoch": 0.26,
"eval_cer": 8.841433420237099,
"eval_loss": 0.47019296884536743,
"eval_runtime": 3179.8405,
"eval_samples_per_second": 0.781,
"eval_steps_per_second": 0.39,
"eval_wer": 24.110539355822375,
"step": 4000
},
{
"epoch": 0.26,
"learning_rate": 8.98e-06,
"loss": 0.4638,
"step": 4025
},
{
"epoch": 0.26,
"learning_rate": 8.972753623188405e-06,
"loss": 0.5326,
"step": 4050
},
{
"epoch": 0.26,
"learning_rate": 8.965507246376812e-06,
"loss": 0.4799,
"step": 4075
},
{
"epoch": 0.27,
"learning_rate": 8.958260869565219e-06,
"loss": 0.4798,
"step": 4100
},
{
"epoch": 0.27,
"learning_rate": 8.951014492753624e-06,
"loss": 0.4938,
"step": 4125
},
{
"epoch": 0.27,
"learning_rate": 8.94376811594203e-06,
"loss": 0.4882,
"step": 4150
},
{
"epoch": 0.27,
"learning_rate": 8.936521739130436e-06,
"loss": 0.4136,
"step": 4175
},
{
"epoch": 0.27,
"learning_rate": 8.92927536231884e-06,
"loss": 0.5116,
"step": 4200
},
{
"epoch": 0.27,
"learning_rate": 8.922028985507247e-06,
"loss": 0.5381,
"step": 4225
},
{
"epoch": 0.28,
"learning_rate": 8.914782608695652e-06,
"loss": 0.3999,
"step": 4250
},
{
"epoch": 0.28,
"learning_rate": 8.907536231884059e-06,
"loss": 0.3925,
"step": 4275
},
{
"epoch": 0.28,
"learning_rate": 8.900289855072464e-06,
"loss": 0.469,
"step": 4300
},
{
"epoch": 0.28,
"learning_rate": 8.89304347826087e-06,
"loss": 0.4854,
"step": 4325
},
{
"epoch": 0.28,
"learning_rate": 8.885797101449276e-06,
"loss": 0.5086,
"step": 4350
},
{
"epoch": 0.28,
"learning_rate": 8.878550724637682e-06,
"loss": 0.4679,
"step": 4375
},
{
"epoch": 0.29,
"learning_rate": 8.871594202898552e-06,
"loss": 0.5175,
"step": 4400
},
{
"epoch": 0.29,
"learning_rate": 8.864347826086957e-06,
"loss": 0.4921,
"step": 4425
},
{
"epoch": 0.29,
"learning_rate": 8.857101449275362e-06,
"loss": 0.4375,
"step": 4450
},
{
"epoch": 0.29,
"learning_rate": 8.849855072463769e-06,
"loss": 0.6226,
"step": 4475
},
{
"epoch": 0.29,
"learning_rate": 8.842608695652175e-06,
"loss": 0.4383,
"step": 4500
},
{
"epoch": 0.29,
"learning_rate": 8.83536231884058e-06,
"loss": 0.4799,
"step": 4525
},
{
"epoch": 0.29,
"learning_rate": 8.828115942028987e-06,
"loss": 0.4063,
"step": 4550
},
{
"epoch": 0.3,
"learning_rate": 8.820869565217392e-06,
"loss": 0.4039,
"step": 4575
},
{
"epoch": 0.3,
"learning_rate": 8.813623188405797e-06,
"loss": 0.3688,
"step": 4600
},
{
"epoch": 0.3,
"learning_rate": 8.806376811594204e-06,
"loss": 0.4714,
"step": 4625
},
{
"epoch": 0.3,
"learning_rate": 8.799130434782609e-06,
"loss": 0.426,
"step": 4650
},
{
"epoch": 0.3,
"learning_rate": 8.791884057971015e-06,
"loss": 0.4623,
"step": 4675
},
{
"epoch": 0.3,
"learning_rate": 8.784637681159422e-06,
"loss": 0.4223,
"step": 4700
},
{
"epoch": 0.31,
"learning_rate": 8.777391304347827e-06,
"loss": 0.504,
"step": 4725
},
{
"epoch": 0.31,
"learning_rate": 8.770144927536232e-06,
"loss": 0.4396,
"step": 4750
},
{
"epoch": 0.31,
"learning_rate": 8.762898550724639e-06,
"loss": 0.4665,
"step": 4775
},
{
"epoch": 0.31,
"learning_rate": 8.755652173913044e-06,
"loss": 0.4356,
"step": 4800
},
{
"epoch": 0.31,
"learning_rate": 8.74840579710145e-06,
"loss": 0.4058,
"step": 4825
},
{
"epoch": 0.31,
"learning_rate": 8.741159420289856e-06,
"loss": 0.4825,
"step": 4850
},
{
"epoch": 0.32,
"learning_rate": 8.733913043478262e-06,
"loss": 0.5461,
"step": 4875
},
{
"epoch": 0.32,
"learning_rate": 8.726666666666667e-06,
"loss": 0.4718,
"step": 4900
},
{
"epoch": 0.32,
"learning_rate": 8.719420289855072e-06,
"loss": 0.5011,
"step": 4925
},
{
"epoch": 0.32,
"learning_rate": 8.712173913043479e-06,
"loss": 0.4281,
"step": 4950
},
{
"epoch": 0.32,
"learning_rate": 8.704927536231886e-06,
"loss": 0.5207,
"step": 4975
},
{
"epoch": 0.32,
"learning_rate": 8.69768115942029e-06,
"loss": 0.3444,
"step": 5000
},
{
"epoch": 0.32,
"eval_cer": 8.853116237886763,
"eval_loss": 0.45443984866142273,
"eval_runtime": 3270.5063,
"eval_samples_per_second": 0.759,
"eval_steps_per_second": 0.379,
"eval_wer": 23.901658090337335,
"step": 5000
},
{
"epoch": 0.33,
"learning_rate": 8.690434782608697e-06,
"loss": 0.4848,
"step": 5025
},
{
"epoch": 0.33,
"learning_rate": 8.683188405797102e-06,
"loss": 0.4012,
"step": 5050
},
{
"epoch": 0.33,
"learning_rate": 8.675942028985507e-06,
"loss": 0.3266,
"step": 5075
},
{
"epoch": 0.33,
"learning_rate": 8.668695652173914e-06,
"loss": 0.4751,
"step": 5100
},
{
"epoch": 0.33,
"learning_rate": 8.661449275362319e-06,
"loss": 0.5552,
"step": 5125
},
{
"epoch": 0.33,
"learning_rate": 8.654202898550726e-06,
"loss": 0.4079,
"step": 5150
},
{
"epoch": 0.34,
"learning_rate": 8.64695652173913e-06,
"loss": 0.4326,
"step": 5175
},
{
"epoch": 0.34,
"learning_rate": 8.639710144927538e-06,
"loss": 0.4591,
"step": 5200
},
{
"epoch": 0.34,
"learning_rate": 8.632463768115943e-06,
"loss": 0.3962,
"step": 5225
},
{
"epoch": 0.34,
"learning_rate": 8.625217391304348e-06,
"loss": 0.4825,
"step": 5250
},
{
"epoch": 0.34,
"learning_rate": 8.617971014492754e-06,
"loss": 0.4377,
"step": 5275
},
{
"epoch": 0.34,
"learning_rate": 8.610724637681161e-06,
"loss": 0.437,
"step": 5300
},
{
"epoch": 0.34,
"learning_rate": 8.603478260869566e-06,
"loss": 0.3836,
"step": 5325
},
{
"epoch": 0.35,
"learning_rate": 8.596231884057971e-06,
"loss": 0.4649,
"step": 5350
},
{
"epoch": 0.35,
"learning_rate": 8.588985507246378e-06,
"loss": 0.4631,
"step": 5375
},
{
"epoch": 0.35,
"learning_rate": 8.581739130434783e-06,
"loss": 0.5619,
"step": 5400
},
{
"epoch": 0.35,
"learning_rate": 8.57449275362319e-06,
"loss": 0.5031,
"step": 5425
},
{
"epoch": 0.35,
"learning_rate": 8.567246376811596e-06,
"loss": 0.3797,
"step": 5450
},
{
"epoch": 0.35,
"learning_rate": 8.560000000000001e-06,
"loss": 0.4993,
"step": 5475
},
{
"epoch": 0.36,
"learning_rate": 8.552753623188406e-06,
"loss": 0.4146,
"step": 5500
},
{
"epoch": 0.36,
"learning_rate": 8.545507246376811e-06,
"loss": 0.4524,
"step": 5525
},
{
"epoch": 0.36,
"learning_rate": 8.538260869565218e-06,
"loss": 0.4812,
"step": 5550
},
{
"epoch": 0.36,
"learning_rate": 8.531014492753624e-06,
"loss": 0.3781,
"step": 5575
},
{
"epoch": 0.36,
"learning_rate": 8.52376811594203e-06,
"loss": 0.4343,
"step": 5600
},
{
"epoch": 0.36,
"learning_rate": 8.516521739130436e-06,
"loss": 0.4226,
"step": 5625
},
{
"epoch": 0.37,
"learning_rate": 8.509275362318841e-06,
"loss": 0.4341,
"step": 5650
},
{
"epoch": 0.37,
"learning_rate": 8.502028985507246e-06,
"loss": 0.4008,
"step": 5675
},
{
"epoch": 0.37,
"learning_rate": 8.494782608695653e-06,
"loss": 0.4199,
"step": 5700
},
{
"epoch": 0.37,
"learning_rate": 8.487536231884058e-06,
"loss": 0.4822,
"step": 5725
},
{
"epoch": 0.37,
"learning_rate": 8.480289855072465e-06,
"loss": 0.3857,
"step": 5750
},
{
"epoch": 0.37,
"learning_rate": 8.473043478260871e-06,
"loss": 0.5646,
"step": 5775
},
{
"epoch": 0.38,
"learning_rate": 8.465797101449276e-06,
"loss": 0.3835,
"step": 5800
},
{
"epoch": 0.38,
"learning_rate": 8.458550724637681e-06,
"loss": 0.4856,
"step": 5825
},
{
"epoch": 0.38,
"learning_rate": 8.451304347826088e-06,
"loss": 0.4807,
"step": 5850
},
{
"epoch": 0.38,
"learning_rate": 8.444057971014493e-06,
"loss": 0.5281,
"step": 5875
},
{
"epoch": 0.38,
"learning_rate": 8.4368115942029e-06,
"loss": 0.4234,
"step": 5900
},
{
"epoch": 0.38,
"learning_rate": 8.429565217391305e-06,
"loss": 0.6375,
"step": 5925
},
{
"epoch": 0.39,
"learning_rate": 8.422318840579711e-06,
"loss": 0.4303,
"step": 5950
},
{
"epoch": 0.39,
"learning_rate": 8.415072463768116e-06,
"loss": 0.4196,
"step": 5975
},
{
"epoch": 0.39,
"learning_rate": 8.407826086956521e-06,
"loss": 0.3943,
"step": 6000
},
{
"epoch": 0.39,
"eval_cer": 8.360224310098873,
"eval_loss": 0.44455686211586,
"eval_runtime": 3263.9495,
"eval_samples_per_second": 0.76,
"eval_steps_per_second": 0.38,
"eval_wer": 22.735277301315037,
"step": 6000
},
{
"epoch": 0.39,
"learning_rate": 8.400579710144928e-06,
"loss": 0.4164,
"step": 6025
},
{
"epoch": 0.39,
"learning_rate": 8.393333333333335e-06,
"loss": 0.4818,
"step": 6050
},
{
"epoch": 0.39,
"learning_rate": 8.38608695652174e-06,
"loss": 0.5536,
"step": 6075
},
{
"epoch": 0.4,
"learning_rate": 8.378840579710147e-06,
"loss": 0.4731,
"step": 6100
},
{
"epoch": 0.4,
"learning_rate": 8.371594202898552e-06,
"loss": 0.4081,
"step": 6125
},
{
"epoch": 0.4,
"learning_rate": 8.364347826086957e-06,
"loss": 0.3741,
"step": 6150
},
{
"epoch": 0.4,
"learning_rate": 8.357101449275363e-06,
"loss": 0.4173,
"step": 6175
},
{
"epoch": 0.4,
"learning_rate": 8.349855072463768e-06,
"loss": 0.4954,
"step": 6200
},
{
"epoch": 0.4,
"learning_rate": 8.342608695652175e-06,
"loss": 0.461,
"step": 6225
},
{
"epoch": 0.4,
"learning_rate": 8.33536231884058e-06,
"loss": 0.4501,
"step": 6250
},
{
"epoch": 0.41,
"learning_rate": 8.328115942028987e-06,
"loss": 0.3652,
"step": 6275
},
{
"epoch": 0.41,
"learning_rate": 8.320869565217392e-06,
"loss": 0.4046,
"step": 6300
},
{
"epoch": 0.41,
"learning_rate": 8.313623188405798e-06,
"loss": 0.4184,
"step": 6325
},
{
"epoch": 0.41,
"learning_rate": 8.306376811594203e-06,
"loss": 0.4287,
"step": 6350
},
{
"epoch": 0.41,
"learning_rate": 8.29913043478261e-06,
"loss": 0.3938,
"step": 6375
},
{
"epoch": 0.41,
"learning_rate": 8.291884057971015e-06,
"loss": 0.4758,
"step": 6400
},
{
"epoch": 0.42,
"learning_rate": 8.28463768115942e-06,
"loss": 0.4716,
"step": 6425
},
{
"epoch": 0.42,
"learning_rate": 8.277391304347827e-06,
"loss": 0.3819,
"step": 6450
},
{
"epoch": 0.42,
"learning_rate": 8.270144927536232e-06,
"loss": 0.3889,
"step": 6475
},
{
"epoch": 0.42,
"learning_rate": 8.262898550724639e-06,
"loss": 0.4659,
"step": 6500
},
{
"epoch": 0.42,
"learning_rate": 8.255652173913045e-06,
"loss": 0.3274,
"step": 6525
},
{
"epoch": 0.42,
"learning_rate": 8.24840579710145e-06,
"loss": 0.4144,
"step": 6550
},
{
"epoch": 0.43,
"learning_rate": 8.241159420289855e-06,
"loss": 0.3875,
"step": 6575
},
{
"epoch": 0.43,
"learning_rate": 8.23391304347826e-06,
"loss": 0.452,
"step": 6600
},
{
"epoch": 0.43,
"learning_rate": 8.226666666666667e-06,
"loss": 0.4747,
"step": 6625
},
{
"epoch": 0.43,
"learning_rate": 8.219420289855074e-06,
"loss": 0.4448,
"step": 6650
},
{
"epoch": 0.43,
"learning_rate": 8.212173913043479e-06,
"loss": 0.5215,
"step": 6675
},
{
"epoch": 0.43,
"learning_rate": 8.204927536231885e-06,
"loss": 0.4261,
"step": 6700
},
{
"epoch": 0.44,
"learning_rate": 8.19768115942029e-06,
"loss": 0.4482,
"step": 6725
},
{
"epoch": 0.44,
"learning_rate": 8.190434782608695e-06,
"loss": 0.39,
"step": 6750
},
{
"epoch": 0.44,
"learning_rate": 8.183188405797102e-06,
"loss": 0.6096,
"step": 6775
},
{
"epoch": 0.44,
"learning_rate": 8.175942028985507e-06,
"loss": 0.3912,
"step": 6800
},
{
"epoch": 0.44,
"learning_rate": 8.168695652173914e-06,
"loss": 0.3141,
"step": 6825
},
{
"epoch": 0.44,
"learning_rate": 8.16144927536232e-06,
"loss": 0.3593,
"step": 6850
},
{
"epoch": 0.45,
"learning_rate": 8.154202898550725e-06,
"loss": 0.4331,
"step": 6875
},
{
"epoch": 0.45,
"learning_rate": 8.14695652173913e-06,
"loss": 0.4574,
"step": 6900
},
{
"epoch": 0.45,
"learning_rate": 8.139710144927537e-06,
"loss": 0.3546,
"step": 6925
},
{
"epoch": 0.45,
"learning_rate": 8.132463768115942e-06,
"loss": 0.3894,
"step": 6950
},
{
"epoch": 0.45,
"learning_rate": 8.125217391304349e-06,
"loss": 0.393,
"step": 6975
},
{
"epoch": 0.45,
"learning_rate": 8.117971014492756e-06,
"loss": 0.4925,
"step": 7000
},
{
"epoch": 0.45,
"eval_cer": 8.3723990358601,
"eval_loss": 0.4348393380641937,
"eval_runtime": 3254.2457,
"eval_samples_per_second": 0.763,
"eval_steps_per_second": 0.381,
"eval_wer": 22.178768820278254,
"step": 7000
},
{
"epoch": 0.46,
"learning_rate": 8.11072463768116e-06,
"loss": 0.3986,
"step": 7025
},
{
"epoch": 0.46,
"learning_rate": 8.103478260869566e-06,
"loss": 0.3943,
"step": 7050
},
{
"epoch": 0.46,
"learning_rate": 8.09623188405797e-06,
"loss": 0.4803,
"step": 7075
},
{
"epoch": 0.46,
"learning_rate": 8.088985507246377e-06,
"loss": 0.4128,
"step": 7100
},
{
"epoch": 0.46,
"learning_rate": 8.081739130434784e-06,
"loss": 0.5511,
"step": 7125
},
{
"epoch": 0.46,
"learning_rate": 8.074492753623189e-06,
"loss": 0.4377,
"step": 7150
},
{
"epoch": 0.46,
"learning_rate": 8.067246376811596e-06,
"loss": 0.453,
"step": 7175
},
{
"epoch": 0.47,
"learning_rate": 8.06e-06,
"loss": 0.4019,
"step": 7200
},
{
"epoch": 0.47,
"learning_rate": 8.052753623188406e-06,
"loss": 0.4934,
"step": 7225
},
{
"epoch": 0.47,
"learning_rate": 8.045507246376812e-06,
"loss": 0.3873,
"step": 7250
},
{
"epoch": 0.47,
"learning_rate": 8.038260869565217e-06,
"loss": 0.389,
"step": 7275
},
{
"epoch": 0.47,
"learning_rate": 8.031014492753624e-06,
"loss": 0.4086,
"step": 7300
},
{
"epoch": 0.47,
"learning_rate": 8.02376811594203e-06,
"loss": 0.3844,
"step": 7325
},
{
"epoch": 0.48,
"learning_rate": 8.016521739130436e-06,
"loss": 0.4577,
"step": 7350
},
{
"epoch": 0.48,
"learning_rate": 8.009275362318841e-06,
"loss": 0.383,
"step": 7375
},
{
"epoch": 0.48,
"learning_rate": 8.002028985507248e-06,
"loss": 0.5191,
"step": 7400
},
{
"epoch": 0.48,
"learning_rate": 7.994782608695653e-06,
"loss": 0.3293,
"step": 7425
},
{
"epoch": 0.48,
"learning_rate": 7.98753623188406e-06,
"loss": 0.4246,
"step": 7450
},
{
"epoch": 0.48,
"learning_rate": 7.980289855072464e-06,
"loss": 0.3811,
"step": 7475
},
{
"epoch": 0.49,
"learning_rate": 7.97304347826087e-06,
"loss": 0.3891,
"step": 7500
},
{
"epoch": 0.49,
"learning_rate": 7.965797101449276e-06,
"loss": 0.4367,
"step": 7525
},
{
"epoch": 0.49,
"learning_rate": 7.958550724637681e-06,
"loss": 0.4793,
"step": 7550
},
{
"epoch": 0.49,
"learning_rate": 7.951304347826088e-06,
"loss": 0.3993,
"step": 7575
},
{
"epoch": 0.49,
"learning_rate": 7.944347826086957e-06,
"loss": 0.3095,
"step": 7600
},
{
"epoch": 0.49,
"learning_rate": 7.937101449275362e-06,
"loss": 0.4002,
"step": 7625
},
{
"epoch": 0.5,
"learning_rate": 7.929855072463769e-06,
"loss": 0.4037,
"step": 7650
},
{
"epoch": 0.5,
"learning_rate": 7.922608695652174e-06,
"loss": 0.3694,
"step": 7675
},
{
"epoch": 0.5,
"learning_rate": 7.91536231884058e-06,
"loss": 0.3969,
"step": 7700
},
{
"epoch": 0.5,
"learning_rate": 7.908115942028987e-06,
"loss": 0.4404,
"step": 7725
},
{
"epoch": 0.5,
"learning_rate": 7.900869565217392e-06,
"loss": 0.4489,
"step": 7750
},
{
"epoch": 0.5,
"learning_rate": 7.893623188405797e-06,
"loss": 0.3542,
"step": 7775
},
{
"epoch": 0.51,
"learning_rate": 7.886376811594204e-06,
"loss": 0.4793,
"step": 7800
},
{
"epoch": 0.51,
"learning_rate": 7.879130434782609e-06,
"loss": 0.3876,
"step": 7825
},
{
"epoch": 0.51,
"learning_rate": 7.871884057971016e-06,
"loss": 0.3983,
"step": 7850
},
{
"epoch": 0.51,
"learning_rate": 7.86463768115942e-06,
"loss": 0.5017,
"step": 7875
},
{
"epoch": 0.51,
"learning_rate": 7.857391304347827e-06,
"loss": 0.3704,
"step": 7900
},
{
"epoch": 0.51,
"learning_rate": 7.850144927536232e-06,
"loss": 0.4443,
"step": 7925
},
{
"epoch": 0.51,
"learning_rate": 7.842898550724637e-06,
"loss": 0.3535,
"step": 7950
},
{
"epoch": 0.52,
"learning_rate": 7.835652173913044e-06,
"loss": 0.4255,
"step": 7975
},
{
"epoch": 0.52,
"learning_rate": 7.828405797101451e-06,
"loss": 0.4455,
"step": 8000
},
{
"epoch": 0.52,
"eval_cer": 8.29885877318117,
"eval_loss": 0.42695876955986023,
"eval_runtime": 3202.8428,
"eval_samples_per_second": 0.775,
"eval_steps_per_second": 0.387,
"eval_wer": 21.754907566228322,
"step": 8000
},
{
"epoch": 0.52,
"learning_rate": 7.821159420289856e-06,
"loss": 0.5201,
"step": 8025
},
{
"epoch": 0.52,
"learning_rate": 7.813913043478263e-06,
"loss": 0.4287,
"step": 8050
},
{
"epoch": 0.52,
"learning_rate": 7.806666666666668e-06,
"loss": 0.3597,
"step": 8075
},
{
"epoch": 0.52,
"learning_rate": 7.799420289855073e-06,
"loss": 0.2911,
"step": 8100
},
{
"epoch": 0.53,
"learning_rate": 7.79217391304348e-06,
"loss": 0.4192,
"step": 8125
},
{
"epoch": 0.53,
"learning_rate": 7.784927536231884e-06,
"loss": 0.328,
"step": 8150
},
{
"epoch": 0.53,
"learning_rate": 7.777681159420291e-06,
"loss": 0.4364,
"step": 8175
},
{
"epoch": 0.53,
"learning_rate": 7.770434782608696e-06,
"loss": 0.2877,
"step": 8200
},
{
"epoch": 0.53,
"learning_rate": 7.763188405797101e-06,
"loss": 0.3641,
"step": 8225
},
{
"epoch": 0.53,
"learning_rate": 7.755942028985508e-06,
"loss": 0.3338,
"step": 8250
},
{
"epoch": 0.54,
"learning_rate": 7.748695652173913e-06,
"loss": 0.3425,
"step": 8275
},
{
"epoch": 0.54,
"learning_rate": 7.74144927536232e-06,
"loss": 0.3633,
"step": 8300
},
{
"epoch": 0.54,
"learning_rate": 7.734202898550726e-06,
"loss": 0.4027,
"step": 8325
},
{
"epoch": 0.54,
"learning_rate": 7.726956521739131e-06,
"loss": 0.4075,
"step": 8350
},
{
"epoch": 0.54,
"learning_rate": 7.719710144927536e-06,
"loss": 0.4272,
"step": 8375
},
{
"epoch": 0.54,
"learning_rate": 7.712463768115943e-06,
"loss": 0.4463,
"step": 8400
},
{
"epoch": 0.55,
"learning_rate": 7.705217391304348e-06,
"loss": 0.4225,
"step": 8425
},
{
"epoch": 0.55,
"learning_rate": 7.697971014492755e-06,
"loss": 0.4155,
"step": 8450
},
{
"epoch": 0.55,
"learning_rate": 7.69072463768116e-06,
"loss": 0.3319,
"step": 8475
},
{
"epoch": 0.55,
"learning_rate": 7.683478260869566e-06,
"loss": 0.3675,
"step": 8500
},
{
"epoch": 0.55,
"learning_rate": 7.676231884057971e-06,
"loss": 0.4573,
"step": 8525
},
{
"epoch": 0.55,
"learning_rate": 7.668985507246376e-06,
"loss": 0.3742,
"step": 8550
},
{
"epoch": 0.56,
"learning_rate": 7.661739130434783e-06,
"loss": 0.4487,
"step": 8575
},
{
"epoch": 0.56,
"learning_rate": 7.65449275362319e-06,
"loss": 0.3993,
"step": 8600
},
{
"epoch": 0.56,
"learning_rate": 7.647246376811595e-06,
"loss": 0.3999,
"step": 8625
},
{
"epoch": 0.56,
"learning_rate": 7.640000000000001e-06,
"loss": 0.4322,
"step": 8650
},
{
"epoch": 0.56,
"learning_rate": 7.632753623188406e-06,
"loss": 0.2906,
"step": 8675
},
{
"epoch": 0.56,
"learning_rate": 7.625507246376812e-06,
"loss": 0.41,
"step": 8700
},
{
"epoch": 0.57,
"learning_rate": 7.618260869565218e-06,
"loss": 0.2934,
"step": 8725
},
{
"epoch": 0.57,
"learning_rate": 7.611014492753623e-06,
"loss": 0.3668,
"step": 8750
},
{
"epoch": 0.57,
"learning_rate": 7.60376811594203e-06,
"loss": 0.3826,
"step": 8775
},
{
"epoch": 0.57,
"learning_rate": 7.596521739130436e-06,
"loss": 0.4043,
"step": 8800
},
{
"epoch": 0.57,
"learning_rate": 7.589275362318841e-06,
"loss": 0.6248,
"step": 8825
},
{
"epoch": 0.57,
"learning_rate": 7.582028985507247e-06,
"loss": 0.4668,
"step": 8850
},
{
"epoch": 0.57,
"learning_rate": 7.574782608695653e-06,
"loss": 0.4407,
"step": 8875
},
{
"epoch": 0.58,
"learning_rate": 7.567536231884058e-06,
"loss": 0.3811,
"step": 8900
},
{
"epoch": 0.58,
"learning_rate": 7.560289855072465e-06,
"loss": 0.4717,
"step": 8925
},
{
"epoch": 0.58,
"learning_rate": 7.55304347826087e-06,
"loss": 0.3531,
"step": 8950
},
{
"epoch": 0.58,
"learning_rate": 7.545797101449276e-06,
"loss": 0.4022,
"step": 8975
},
{
"epoch": 0.58,
"learning_rate": 7.5385507246376825e-06,
"loss": 0.3987,
"step": 9000
},
{
"epoch": 0.58,
"eval_cer": 7.9417334841851535,
"eval_loss": 0.41387349367141724,
"eval_runtime": 3295.4388,
"eval_samples_per_second": 0.753,
"eval_steps_per_second": 0.377,
"eval_wer": 20.842386125404992,
"step": 9000
},
{
"epoch": 0.58,
"learning_rate": 7.5313043478260875e-06,
"loss": 0.2728,
"step": 9025
},
{
"epoch": 0.59,
"learning_rate": 7.524057971014493e-06,
"loss": 0.5125,
"step": 9050
},
{
"epoch": 0.59,
"learning_rate": 7.516811594202899e-06,
"loss": 0.3452,
"step": 9075
},
{
"epoch": 0.59,
"learning_rate": 7.509565217391305e-06,
"loss": 0.3387,
"step": 9100
},
{
"epoch": 0.59,
"learning_rate": 7.502318840579711e-06,
"loss": 0.5818,
"step": 9125
},
{
"epoch": 0.59,
"learning_rate": 7.495072463768116e-06,
"loss": 0.3494,
"step": 9150
},
{
"epoch": 0.59,
"learning_rate": 7.487826086956523e-06,
"loss": 0.2902,
"step": 9175
},
{
"epoch": 0.6,
"learning_rate": 7.4805797101449285e-06,
"loss": 0.3691,
"step": 9200
},
{
"epoch": 0.6,
"learning_rate": 7.4733333333333335e-06,
"loss": 0.3344,
"step": 9225
},
{
"epoch": 0.6,
"learning_rate": 7.466086956521739e-06,
"loss": 0.3612,
"step": 9250
},
{
"epoch": 0.6,
"learning_rate": 7.458840579710146e-06,
"loss": 0.4311,
"step": 9275
},
{
"epoch": 0.6,
"learning_rate": 7.451594202898551e-06,
"loss": 0.4298,
"step": 9300
},
{
"epoch": 0.6,
"learning_rate": 7.444347826086957e-06,
"loss": 0.3657,
"step": 9325
},
{
"epoch": 0.61,
"learning_rate": 7.437101449275363e-06,
"loss": 0.4382,
"step": 9350
},
{
"epoch": 0.61,
"learning_rate": 7.429855072463769e-06,
"loss": 0.3775,
"step": 9375
},
{
"epoch": 0.61,
"learning_rate": 7.4226086956521745e-06,
"loss": 0.3566,
"step": 9400
},
{
"epoch": 0.61,
"learning_rate": 7.4153623188405795e-06,
"loss": 0.3423,
"step": 9425
},
{
"epoch": 0.61,
"learning_rate": 7.408115942028986e-06,
"loss": 0.4855,
"step": 9450
},
{
"epoch": 0.61,
"learning_rate": 7.400869565217392e-06,
"loss": 0.3648,
"step": 9475
},
{
"epoch": 0.62,
"learning_rate": 7.393623188405797e-06,
"loss": 0.3294,
"step": 9500
},
{
"epoch": 0.62,
"learning_rate": 7.386376811594204e-06,
"loss": 0.3991,
"step": 9525
},
{
"epoch": 0.62,
"learning_rate": 7.37913043478261e-06,
"loss": 0.347,
"step": 9550
},
{
"epoch": 0.62,
"learning_rate": 7.371884057971015e-06,
"loss": 0.4011,
"step": 9575
},
{
"epoch": 0.62,
"learning_rate": 7.364637681159421e-06,
"loss": 0.3433,
"step": 9600
},
{
"epoch": 0.62,
"learning_rate": 7.357391304347826e-06,
"loss": 0.4642,
"step": 9625
},
{
"epoch": 0.63,
"learning_rate": 7.350144927536232e-06,
"loss": 0.3897,
"step": 9650
},
{
"epoch": 0.63,
"learning_rate": 7.342898550724639e-06,
"loss": 0.4562,
"step": 9675
},
{
"epoch": 0.63,
"learning_rate": 7.335652173913044e-06,
"loss": 0.4942,
"step": 9700
},
{
"epoch": 0.63,
"learning_rate": 7.32840579710145e-06,
"loss": 0.3497,
"step": 9725
},
{
"epoch": 0.63,
"learning_rate": 7.3211594202898564e-06,
"loss": 0.3713,
"step": 9750
},
{
"epoch": 0.63,
"learning_rate": 7.3139130434782614e-06,
"loss": 0.3558,
"step": 9775
},
{
"epoch": 0.63,
"learning_rate": 7.306666666666667e-06,
"loss": 0.4417,
"step": 9800
},
{
"epoch": 0.64,
"learning_rate": 7.299420289855072e-06,
"loss": 0.4752,
"step": 9825
},
{
"epoch": 0.64,
"learning_rate": 7.292173913043479e-06,
"loss": 0.3515,
"step": 9850
},
{
"epoch": 0.64,
"learning_rate": 7.284927536231885e-06,
"loss": 0.4731,
"step": 9875
},
{
"epoch": 0.64,
"learning_rate": 7.27768115942029e-06,
"loss": 0.3111,
"step": 9900
},
{
"epoch": 0.64,
"learning_rate": 7.2704347826086966e-06,
"loss": 0.3776,
"step": 9925
},
{
"epoch": 0.64,
"learning_rate": 7.263188405797102e-06,
"loss": 0.4209,
"step": 9950
},
{
"epoch": 0.65,
"learning_rate": 7.2559420289855074e-06,
"loss": 0.3707,
"step": 9975
},
{
"epoch": 0.65,
"learning_rate": 7.248695652173914e-06,
"loss": 0.3373,
"step": 10000
},
{
"epoch": 0.65,
"eval_cer": 7.887131683801465,
"eval_loss": 0.4116414785385132,
"eval_runtime": 3350.806,
"eval_samples_per_second": 0.741,
"eval_steps_per_second": 0.37,
"eval_wer": 21.214408233276156,
"step": 10000
},
{
"epoch": 0.65,
"learning_rate": 7.241449275362319e-06,
"loss": 0.3843,
"step": 10025
},
{
"epoch": 0.65,
"learning_rate": 7.234202898550725e-06,
"loss": 0.3891,
"step": 10050
},
{
"epoch": 0.65,
"learning_rate": 7.226956521739132e-06,
"loss": 0.4058,
"step": 10075
},
{
"epoch": 0.65,
"learning_rate": 7.219710144927537e-06,
"loss": 0.3908,
"step": 10100
},
{
"epoch": 0.66,
"learning_rate": 7.2124637681159426e-06,
"loss": 0.384,
"step": 10125
},
{
"epoch": 0.66,
"learning_rate": 7.205217391304348e-06,
"loss": 0.4804,
"step": 10150
},
{
"epoch": 0.66,
"learning_rate": 7.197971014492754e-06,
"loss": 0.2675,
"step": 10175
},
{
"epoch": 0.66,
"learning_rate": 7.19072463768116e-06,
"loss": 0.4003,
"step": 10200
},
{
"epoch": 0.66,
"learning_rate": 7.183478260869566e-06,
"loss": 0.4716,
"step": 10225
},
{
"epoch": 0.66,
"learning_rate": 7.176231884057972e-06,
"loss": 0.3955,
"step": 10250
},
{
"epoch": 0.67,
"learning_rate": 7.168985507246378e-06,
"loss": 0.4133,
"step": 10275
},
{
"epoch": 0.67,
"learning_rate": 7.161739130434783e-06,
"loss": 0.454,
"step": 10300
},
{
"epoch": 0.67,
"learning_rate": 7.1544927536231885e-06,
"loss": 0.4465,
"step": 10325
},
{
"epoch": 0.67,
"learning_rate": 7.147246376811595e-06,
"loss": 0.3997,
"step": 10350
},
{
"epoch": 0.67,
"learning_rate": 7.14e-06,
"loss": 0.43,
"step": 10375
},
{
"epoch": 0.67,
"learning_rate": 7.132753623188406e-06,
"loss": 0.373,
"step": 10400
},
{
"epoch": 0.68,
"learning_rate": 7.125507246376813e-06,
"loss": 0.4268,
"step": 10425
},
{
"epoch": 0.68,
"learning_rate": 7.118260869565218e-06,
"loss": 0.331,
"step": 10450
},
{
"epoch": 0.68,
"learning_rate": 7.111014492753624e-06,
"loss": 0.4018,
"step": 10475
},
{
"epoch": 0.68,
"learning_rate": 7.103768115942029e-06,
"loss": 0.3489,
"step": 10500
},
{
"epoch": 0.68,
"learning_rate": 7.096521739130435e-06,
"loss": 0.3914,
"step": 10525
},
{
"epoch": 0.68,
"learning_rate": 7.089275362318841e-06,
"loss": 0.3368,
"step": 10550
},
{
"epoch": 0.68,
"learning_rate": 7.082028985507246e-06,
"loss": 0.3999,
"step": 10575
},
{
"epoch": 0.69,
"learning_rate": 7.074782608695653e-06,
"loss": 0.334,
"step": 10600
},
{
"epoch": 0.69,
"learning_rate": 7.067536231884059e-06,
"loss": 0.4635,
"step": 10625
},
{
"epoch": 0.69,
"learning_rate": 7.060289855072464e-06,
"loss": 0.475,
"step": 10650
},
{
"epoch": 0.69,
"learning_rate": 7.0530434782608705e-06,
"loss": 0.3621,
"step": 10675
},
{
"epoch": 0.69,
"learning_rate": 7.0457971014492755e-06,
"loss": 0.4164,
"step": 10700
},
{
"epoch": 0.69,
"learning_rate": 7.038550724637681e-06,
"loss": 0.3648,
"step": 10725
},
{
"epoch": 0.7,
"learning_rate": 7.031304347826088e-06,
"loss": 0.4358,
"step": 10750
},
{
"epoch": 0.7,
"learning_rate": 7.024057971014493e-06,
"loss": 0.3316,
"step": 10775
},
{
"epoch": 0.7,
"learning_rate": 7.016811594202899e-06,
"loss": 0.4052,
"step": 10800
},
{
"epoch": 0.7,
"learning_rate": 7.009565217391306e-06,
"loss": 0.4474,
"step": 10825
},
{
"epoch": 0.7,
"learning_rate": 7.002318840579711e-06,
"loss": 0.339,
"step": 10850
},
{
"epoch": 0.7,
"learning_rate": 6.9950724637681165e-06,
"loss": 0.3653,
"step": 10875
},
{
"epoch": 0.71,
"learning_rate": 6.9878260869565215e-06,
"loss": 0.3337,
"step": 10900
},
{
"epoch": 0.71,
"learning_rate": 6.980579710144928e-06,
"loss": 0.3516,
"step": 10925
},
{
"epoch": 0.71,
"learning_rate": 6.973333333333334e-06,
"loss": 0.3092,
"step": 10950
},
{
"epoch": 0.71,
"learning_rate": 6.966086956521739e-06,
"loss": 0.4312,
"step": 10975
},
{
"epoch": 0.71,
"learning_rate": 6.958840579710146e-06,
"loss": 0.3808,
"step": 11000
},
{
"epoch": 0.71,
"eval_cer": 7.6264203846721434,
"eval_loss": 0.4016057252883911,
"eval_runtime": 3251.7215,
"eval_samples_per_second": 0.763,
"eval_steps_per_second": 0.382,
"eval_wer": 20.509243377167905,
"step": 11000
},
{
"epoch": 0.71,
"learning_rate": 6.951594202898552e-06,
"loss": 0.6109,
"step": 11025
},
{
"epoch": 0.72,
"learning_rate": 6.944347826086957e-06,
"loss": 0.4322,
"step": 11050
},
{
"epoch": 0.72,
"learning_rate": 6.937101449275363e-06,
"loss": 0.318,
"step": 11075
},
{
"epoch": 0.72,
"learning_rate": 6.929855072463769e-06,
"loss": 0.3855,
"step": 11100
},
{
"epoch": 0.72,
"learning_rate": 6.922608695652174e-06,
"loss": 0.3817,
"step": 11125
},
{
"epoch": 0.72,
"learning_rate": 6.915362318840581e-06,
"loss": 0.384,
"step": 11150
},
{
"epoch": 0.72,
"learning_rate": 6.908115942028986e-06,
"loss": 0.3451,
"step": 11175
},
{
"epoch": 0.73,
"learning_rate": 6.900869565217392e-06,
"loss": 0.3518,
"step": 11200
},
{
"epoch": 0.73,
"learning_rate": 6.8936231884057984e-06,
"loss": 0.4567,
"step": 11225
},
{
"epoch": 0.73,
"learning_rate": 6.886666666666667e-06,
"loss": 0.3848,
"step": 11250
},
{
"epoch": 0.73,
"learning_rate": 6.879420289855073e-06,
"loss": 0.4563,
"step": 11275
},
{
"epoch": 0.73,
"learning_rate": 6.872173913043478e-06,
"loss": 0.3633,
"step": 11300
},
{
"epoch": 0.73,
"learning_rate": 6.864927536231885e-06,
"loss": 0.425,
"step": 11325
},
{
"epoch": 0.74,
"learning_rate": 6.8576811594202905e-06,
"loss": 0.3508,
"step": 11350
},
{
"epoch": 0.74,
"learning_rate": 6.8504347826086955e-06,
"loss": 0.3351,
"step": 11375
},
{
"epoch": 0.74,
"learning_rate": 6.843188405797102e-06,
"loss": 0.4659,
"step": 11400
},
{
"epoch": 0.74,
"learning_rate": 6.835942028985508e-06,
"loss": 0.346,
"step": 11425
},
{
"epoch": 0.74,
"learning_rate": 6.828695652173913e-06,
"loss": 0.3896,
"step": 11450
},
{
"epoch": 0.74,
"learning_rate": 6.82144927536232e-06,
"loss": 0.4153,
"step": 11475
},
{
"epoch": 0.74,
"learning_rate": 6.814202898550725e-06,
"loss": 0.3759,
"step": 11500
},
{
"epoch": 0.75,
"learning_rate": 6.806956521739131e-06,
"loss": 0.3328,
"step": 11525
},
{
"epoch": 0.75,
"learning_rate": 6.799710144927537e-06,
"loss": 0.5639,
"step": 11550
},
{
"epoch": 0.75,
"learning_rate": 6.792463768115942e-06,
"loss": 0.3775,
"step": 11575
},
{
"epoch": 0.75,
"learning_rate": 6.785217391304348e-06,
"loss": 0.4081,
"step": 11600
},
{
"epoch": 0.75,
"learning_rate": 6.777971014492755e-06,
"loss": 0.4266,
"step": 11625
},
{
"epoch": 0.75,
"learning_rate": 6.77072463768116e-06,
"loss": 0.3683,
"step": 11650
},
{
"epoch": 0.76,
"learning_rate": 6.763478260869566e-06,
"loss": 0.4148,
"step": 11675
},
{
"epoch": 0.76,
"learning_rate": 6.756231884057971e-06,
"loss": 0.3413,
"step": 11700
},
{
"epoch": 0.76,
"learning_rate": 6.7489855072463775e-06,
"loss": 0.3954,
"step": 11725
},
{
"epoch": 0.76,
"learning_rate": 6.741739130434783e-06,
"loss": 0.3807,
"step": 11750
},
{
"epoch": 0.76,
"learning_rate": 6.734492753623188e-06,
"loss": 0.3475,
"step": 11775
},
{
"epoch": 0.76,
"learning_rate": 6.727246376811595e-06,
"loss": 0.3428,
"step": 11800
},
{
"epoch": 0.77,
"learning_rate": 6.720000000000001e-06,
"loss": 0.3614,
"step": 11825
},
{
"epoch": 0.77,
"learning_rate": 6.712753623188406e-06,
"loss": 0.3261,
"step": 11850
},
{
"epoch": 0.77,
"learning_rate": 6.705507246376813e-06,
"loss": 0.463,
"step": 11875
},
{
"epoch": 0.77,
"learning_rate": 6.6982608695652184e-06,
"loss": 0.3045,
"step": 11900
},
{
"epoch": 0.77,
"learning_rate": 6.6910144927536235e-06,
"loss": 0.3677,
"step": 11925
},
{
"epoch": 0.77,
"learning_rate": 6.68376811594203e-06,
"loss": 0.3405,
"step": 11950
},
{
"epoch": 0.78,
"learning_rate": 6.676521739130435e-06,
"loss": 0.3467,
"step": 11975
},
{
"epoch": 0.78,
"learning_rate": 6.669275362318841e-06,
"loss": 0.4214,
"step": 12000
},
{
"epoch": 0.78,
"eval_cer": 7.4152688277829695,
"eval_loss": 0.39488446712493896,
"eval_runtime": 3259.8037,
"eval_samples_per_second": 0.761,
"eval_steps_per_second": 0.381,
"eval_wer": 20.093767867352774,
"step": 12000
},
{
"epoch": 0.78,
"learning_rate": 6.662028985507248e-06,
"loss": 0.3608,
"step": 12025
},
{
"epoch": 0.78,
"learning_rate": 6.654782608695653e-06,
"loss": 0.3147,
"step": 12050
},
{
"epoch": 0.78,
"learning_rate": 6.647536231884059e-06,
"loss": 0.2764,
"step": 12075
},
{
"epoch": 0.78,
"learning_rate": 6.6402898550724644e-06,
"loss": 0.3447,
"step": 12100
},
{
"epoch": 0.79,
"learning_rate": 6.63304347826087e-06,
"loss": 0.3727,
"step": 12125
},
{
"epoch": 0.79,
"learning_rate": 6.625797101449276e-06,
"loss": 0.4042,
"step": 12150
},
{
"epoch": 0.79,
"learning_rate": 6.618550724637681e-06,
"loss": 0.3758,
"step": 12175
},
{
"epoch": 0.79,
"learning_rate": 6.611304347826088e-06,
"loss": 0.3582,
"step": 12200
},
{
"epoch": 0.79,
"learning_rate": 6.604057971014494e-06,
"loss": 0.3571,
"step": 12225
},
{
"epoch": 0.79,
"learning_rate": 6.596811594202899e-06,
"loss": 0.3676,
"step": 12250
},
{
"epoch": 0.8,
"learning_rate": 6.5895652173913046e-06,
"loss": 0.3224,
"step": 12275
},
{
"epoch": 0.8,
"learning_rate": 6.582318840579711e-06,
"loss": 0.3025,
"step": 12300
},
{
"epoch": 0.8,
"learning_rate": 6.575072463768116e-06,
"loss": 0.3686,
"step": 12325
},
{
"epoch": 0.8,
"learning_rate": 6.567826086956522e-06,
"loss": 0.3866,
"step": 12350
},
{
"epoch": 0.8,
"learning_rate": 6.560579710144928e-06,
"loss": 0.3662,
"step": 12375
},
{
"epoch": 0.8,
"learning_rate": 6.553333333333334e-06,
"loss": 0.3507,
"step": 12400
},
{
"epoch": 0.8,
"learning_rate": 6.54608695652174e-06,
"loss": 0.3165,
"step": 12425
},
{
"epoch": 0.81,
"learning_rate": 6.538840579710145e-06,
"loss": 0.3616,
"step": 12450
},
{
"epoch": 0.81,
"learning_rate": 6.531594202898551e-06,
"loss": 0.3466,
"step": 12475
},
{
"epoch": 0.81,
"learning_rate": 6.524347826086957e-06,
"loss": 0.5202,
"step": 12500
},
{
"epoch": 0.81,
"learning_rate": 6.517101449275362e-06,
"loss": 0.3789,
"step": 12525
},
{
"epoch": 0.81,
"learning_rate": 6.509855072463769e-06,
"loss": 0.5112,
"step": 12550
},
{
"epoch": 0.81,
"learning_rate": 6.502608695652174e-06,
"loss": 0.353,
"step": 12575
},
{
"epoch": 0.82,
"learning_rate": 6.49536231884058e-06,
"loss": 0.3469,
"step": 12600
},
{
"epoch": 0.82,
"learning_rate": 6.4881159420289865e-06,
"loss": 0.4366,
"step": 12625
},
{
"epoch": 0.82,
"learning_rate": 6.4808695652173915e-06,
"loss": 0.309,
"step": 12650
},
{
"epoch": 0.82,
"learning_rate": 6.473623188405797e-06,
"loss": 0.4358,
"step": 12675
},
{
"epoch": 0.82,
"learning_rate": 6.466376811594204e-06,
"loss": 0.3286,
"step": 12700
},
{
"epoch": 0.82,
"learning_rate": 6.459130434782609e-06,
"loss": 0.2837,
"step": 12725
},
{
"epoch": 0.83,
"learning_rate": 6.451884057971015e-06,
"loss": 0.3613,
"step": 12750
},
{
"epoch": 0.83,
"learning_rate": 6.444637681159422e-06,
"loss": 0.2637,
"step": 12775
},
{
"epoch": 0.83,
"learning_rate": 6.437391304347827e-06,
"loss": 0.3415,
"step": 12800
},
{
"epoch": 0.83,
"learning_rate": 6.4301449275362325e-06,
"loss": 0.371,
"step": 12825
},
{
"epoch": 0.83,
"learning_rate": 6.4228985507246375e-06,
"loss": 0.286,
"step": 12850
},
{
"epoch": 0.83,
"learning_rate": 6.415652173913044e-06,
"loss": 0.3646,
"step": 12875
},
{
"epoch": 0.84,
"learning_rate": 6.40840579710145e-06,
"loss": 0.4352,
"step": 12900
},
{
"epoch": 0.84,
"learning_rate": 6.401159420289855e-06,
"loss": 0.2876,
"step": 12925
},
{
"epoch": 0.84,
"learning_rate": 6.393913043478262e-06,
"loss": 0.3672,
"step": 12950
},
{
"epoch": 0.84,
"learning_rate": 6.386666666666668e-06,
"loss": 0.2878,
"step": 12975
},
{
"epoch": 0.84,
"learning_rate": 6.379420289855073e-06,
"loss": 0.3029,
"step": 13000
},
{
"epoch": 0.84,
"eval_cer": 7.358084509813567,
"eval_loss": 0.3902455270290375,
"eval_runtime": 3231.646,
"eval_samples_per_second": 0.768,
"eval_steps_per_second": 0.384,
"eval_wer": 19.7347055460263,
"step": 13000
},
{
"epoch": 1.55,
"learning_rate": 6.372173913043479e-06,
"loss": 0.3232,
"step": 13025
},
{
"epoch": 1.55,
"learning_rate": 6.364927536231884e-06,
"loss": 0.3888,
"step": 13050
},
{
"epoch": 1.55,
"learning_rate": 6.35768115942029e-06,
"loss": 0.3928,
"step": 13075
},
{
"epoch": 1.55,
"learning_rate": 6.350434782608697e-06,
"loss": 0.3615,
"step": 13100
},
{
"epoch": 1.56,
"learning_rate": 6.343188405797102e-06,
"loss": 0.4292,
"step": 13125
},
{
"epoch": 1.56,
"learning_rate": 6.335942028985508e-06,
"loss": 0.3445,
"step": 13150
},
{
"epoch": 1.56,
"learning_rate": 6.328695652173914e-06,
"loss": 0.3983,
"step": 13175
},
{
"epoch": 1.57,
"learning_rate": 6.3214492753623195e-06,
"loss": 0.3746,
"step": 13200
},
{
"epoch": 1.57,
"learning_rate": 6.314202898550725e-06,
"loss": 0.3714,
"step": 13225
},
{
"epoch": 1.57,
"learning_rate": 6.30695652173913e-06,
"loss": 0.369,
"step": 13250
},
{
"epoch": 1.58,
"learning_rate": 6.299710144927537e-06,
"loss": 0.3991,
"step": 13275
},
{
"epoch": 1.58,
"learning_rate": 6.292463768115943e-06,
"loss": 0.4264,
"step": 13300
},
{
"epoch": 1.58,
"learning_rate": 6.285217391304348e-06,
"loss": 0.2885,
"step": 13325
},
{
"epoch": 1.58,
"learning_rate": 6.277971014492754e-06,
"loss": 0.3356,
"step": 13350
},
{
"epoch": 1.59,
"learning_rate": 6.2707246376811605e-06,
"loss": 0.3758,
"step": 13375
},
{
"epoch": 1.59,
"learning_rate": 6.2634782608695655e-06,
"loss": 0.3424,
"step": 13400
},
{
"epoch": 1.59,
"learning_rate": 6.256231884057971e-06,
"loss": 0.3376,
"step": 13425
},
{
"epoch": 1.6,
"learning_rate": 6.248985507246378e-06,
"loss": 0.3928,
"step": 13450
},
{
"epoch": 1.6,
"learning_rate": 6.241739130434783e-06,
"loss": 0.3247,
"step": 13475
},
{
"epoch": 1.6,
"learning_rate": 6.234492753623189e-06,
"loss": 0.3002,
"step": 13500
},
{
"epoch": 1.6,
"learning_rate": 6.227246376811594e-06,
"loss": 0.2954,
"step": 13525
},
{
"epoch": 1.61,
"learning_rate": 6.220000000000001e-06,
"loss": 0.3292,
"step": 13550
},
{
"epoch": 1.61,
"learning_rate": 6.213043478260871e-06,
"loss": 0.3325,
"step": 13575
},
{
"epoch": 1.61,
"learning_rate": 6.205797101449276e-06,
"loss": 0.3929,
"step": 13600
},
{
"epoch": 1.62,
"learning_rate": 6.198550724637682e-06,
"loss": 0.3311,
"step": 13625
},
{
"epoch": 1.62,
"learning_rate": 6.191304347826087e-06,
"loss": 0.2803,
"step": 13650
},
{
"epoch": 1.62,
"learning_rate": 6.1840579710144935e-06,
"loss": 0.3777,
"step": 13675
},
{
"epoch": 1.63,
"learning_rate": 6.176811594202899e-06,
"loss": 0.387,
"step": 13700
},
{
"epoch": 1.63,
"learning_rate": 6.169565217391304e-06,
"loss": 0.3304,
"step": 13725
},
{
"epoch": 1.63,
"learning_rate": 6.162318840579711e-06,
"loss": 0.4854,
"step": 13750
},
{
"epoch": 1.63,
"learning_rate": 6.155072463768117e-06,
"loss": 0.3572,
"step": 13775
},
{
"epoch": 1.64,
"learning_rate": 6.147826086956522e-06,
"loss": 0.3484,
"step": 13800
},
{
"epoch": 1.64,
"learning_rate": 6.140579710144929e-06,
"loss": 0.3671,
"step": 13825
},
{
"epoch": 1.64,
"learning_rate": 6.133333333333334e-06,
"loss": 0.376,
"step": 13850
},
{
"epoch": 1.65,
"learning_rate": 6.1260869565217395e-06,
"loss": 0.3435,
"step": 13875
},
{
"epoch": 1.65,
"learning_rate": 6.118840579710146e-06,
"loss": 0.4171,
"step": 13900
},
{
"epoch": 1.65,
"learning_rate": 6.111594202898551e-06,
"loss": 0.3793,
"step": 13925
},
{
"epoch": 1.66,
"learning_rate": 6.104347826086957e-06,
"loss": 0.4026,
"step": 13950
},
{
"epoch": 1.66,
"learning_rate": 6.097101449275363e-06,
"loss": 0.3086,
"step": 13975
},
{
"epoch": 1.66,
"learning_rate": 6.089855072463769e-06,
"loss": 0.3549,
"step": 14000
},
{
"epoch": 1.66,
"eval_cer": 7.119509075704658,
"eval_loss": 0.39083221554756165,
"eval_runtime": 3180.5722,
"eval_samples_per_second": 0.78,
"eval_steps_per_second": 0.39,
"eval_wer": 19.411473222793976,
"step": 14000
},
{
"epoch": 1.66,
"learning_rate": 6.082608695652175e-06,
"loss": 0.3889,
"step": 14025
},
{
"epoch": 1.67,
"learning_rate": 6.07536231884058e-06,
"loss": 0.3197,
"step": 14050
},
{
"epoch": 1.67,
"learning_rate": 6.068115942028986e-06,
"loss": 0.3279,
"step": 14075
},
{
"epoch": 1.67,
"learning_rate": 6.060869565217392e-06,
"loss": 0.4178,
"step": 14100
},
{
"epoch": 1.68,
"learning_rate": 6.053623188405797e-06,
"loss": 0.3872,
"step": 14125
},
{
"epoch": 1.68,
"learning_rate": 6.046376811594203e-06,
"loss": 0.3375,
"step": 14150
},
{
"epoch": 1.68,
"learning_rate": 6.03913043478261e-06,
"loss": 0.4023,
"step": 14175
},
{
"epoch": 1.69,
"learning_rate": 6.031884057971015e-06,
"loss": 0.4128,
"step": 14200
},
{
"epoch": 1.69,
"learning_rate": 6.024637681159421e-06,
"loss": 0.3603,
"step": 14225
},
{
"epoch": 1.69,
"learning_rate": 6.0173913043478264e-06,
"loss": 0.3824,
"step": 14250
},
{
"epoch": 1.69,
"learning_rate": 6.010144927536232e-06,
"loss": 0.4071,
"step": 14275
},
{
"epoch": 1.7,
"learning_rate": 6.002898550724638e-06,
"loss": 0.2672,
"step": 14300
},
{
"epoch": 1.7,
"learning_rate": 5.995652173913043e-06,
"loss": 0.327,
"step": 14325
},
{
"epoch": 1.7,
"learning_rate": 5.98840579710145e-06,
"loss": 0.3569,
"step": 14350
},
{
"epoch": 1.71,
"learning_rate": 5.981159420289856e-06,
"loss": 0.3308,
"step": 14375
},
{
"epoch": 1.71,
"learning_rate": 5.973913043478261e-06,
"loss": 0.3802,
"step": 14400
},
{
"epoch": 1.71,
"learning_rate": 5.966666666666667e-06,
"loss": 0.4012,
"step": 14425
},
{
"epoch": 1.71,
"learning_rate": 5.959420289855073e-06,
"loss": 0.3191,
"step": 14450
},
{
"epoch": 1.72,
"learning_rate": 5.952173913043478e-06,
"loss": 0.2991,
"step": 14475
},
{
"epoch": 1.72,
"learning_rate": 5.944927536231885e-06,
"loss": 0.3889,
"step": 14500
},
{
"epoch": 1.72,
"learning_rate": 5.93768115942029e-06,
"loss": 0.3315,
"step": 14525
},
{
"epoch": 1.73,
"learning_rate": 5.930434782608696e-06,
"loss": 0.3925,
"step": 14550
},
{
"epoch": 1.73,
"learning_rate": 5.9231884057971025e-06,
"loss": 0.3661,
"step": 14575
},
{
"epoch": 1.73,
"learning_rate": 5.9159420289855076e-06,
"loss": 0.4426,
"step": 14600
},
{
"epoch": 1.74,
"learning_rate": 5.908695652173913e-06,
"loss": 0.4046,
"step": 14625
},
{
"epoch": 1.74,
"learning_rate": 5.90144927536232e-06,
"loss": 0.3361,
"step": 14650
},
{
"epoch": 1.74,
"learning_rate": 5.894202898550725e-06,
"loss": 0.4759,
"step": 14675
},
{
"epoch": 1.74,
"learning_rate": 5.886956521739131e-06,
"loss": 0.4326,
"step": 14700
},
{
"epoch": 1.75,
"learning_rate": 5.879710144927536e-06,
"loss": 0.2716,
"step": 14725
},
{
"epoch": 1.75,
"learning_rate": 5.872463768115943e-06,
"loss": 0.3416,
"step": 14750
},
{
"epoch": 1.75,
"learning_rate": 5.8652173913043485e-06,
"loss": 0.3715,
"step": 14775
},
{
"epoch": 1.76,
"learning_rate": 5.8579710144927535e-06,
"loss": 0.3737,
"step": 14800
},
{
"epoch": 1.76,
"learning_rate": 5.85072463768116e-06,
"loss": 0.309,
"step": 14825
},
{
"epoch": 1.76,
"learning_rate": 5.843478260869566e-06,
"loss": 0.3327,
"step": 14850
},
{
"epoch": 1.77,
"learning_rate": 5.836231884057971e-06,
"loss": 0.401,
"step": 14875
},
{
"epoch": 1.77,
"learning_rate": 5.828985507246378e-06,
"loss": 0.2827,
"step": 14900
},
{
"epoch": 1.77,
"learning_rate": 5.821739130434783e-06,
"loss": 0.3644,
"step": 14925
},
{
"epoch": 1.77,
"learning_rate": 5.814492753623189e-06,
"loss": 0.3638,
"step": 14950
},
{
"epoch": 1.78,
"learning_rate": 5.807246376811595e-06,
"loss": 0.4652,
"step": 14975
},
{
"epoch": 1.78,
"learning_rate": 5.8e-06,
"loss": 0.3385,
"step": 15000
},
{
"epoch": 1.78,
"eval_cer": 7.779157853313001,
"eval_loss": 0.39061304926872253,
"eval_runtime": 3221.9453,
"eval_samples_per_second": 0.77,
"eval_steps_per_second": 0.385,
"eval_wer": 20.20506956356013,
"step": 15000
},
{
"epoch": 1.78,
"learning_rate": 5.792753623188406e-06,
"loss": 0.4065,
"step": 15025
},
{
"epoch": 1.79,
"learning_rate": 5.785507246376812e-06,
"loss": 0.4354,
"step": 15050
},
{
"epoch": 1.79,
"learning_rate": 5.778260869565218e-06,
"loss": 0.3932,
"step": 15075
},
{
"epoch": 1.79,
"learning_rate": 5.771014492753624e-06,
"loss": 0.3212,
"step": 15100
},
{
"epoch": 1.79,
"learning_rate": 5.76376811594203e-06,
"loss": 0.4244,
"step": 15125
},
{
"epoch": 1.8,
"learning_rate": 5.7565217391304355e-06,
"loss": 0.306,
"step": 15150
},
{
"epoch": 1.8,
"learning_rate": 5.749275362318841e-06,
"loss": 0.3492,
"step": 15175
},
{
"epoch": 1.8,
"learning_rate": 5.742028985507246e-06,
"loss": 0.3573,
"step": 15200
},
{
"epoch": 1.81,
"learning_rate": 5.734782608695652e-06,
"loss": 0.3975,
"step": 15225
},
{
"epoch": 1.81,
"learning_rate": 5.727536231884059e-06,
"loss": 0.3276,
"step": 15250
},
{
"epoch": 1.81,
"learning_rate": 5.720289855072464e-06,
"loss": 0.3638,
"step": 15275
},
{
"epoch": 1.82,
"learning_rate": 5.71304347826087e-06,
"loss": 0.3312,
"step": 15300
},
{
"epoch": 1.82,
"learning_rate": 5.7057971014492765e-06,
"loss": 0.3026,
"step": 15325
},
{
"epoch": 1.82,
"learning_rate": 5.6985507246376815e-06,
"loss": 0.3493,
"step": 15350
},
{
"epoch": 1.82,
"learning_rate": 5.691304347826087e-06,
"loss": 0.309,
"step": 15375
},
{
"epoch": 1.83,
"learning_rate": 5.684057971014492e-06,
"loss": 0.2761,
"step": 15400
},
{
"epoch": 1.83,
"learning_rate": 5.676811594202899e-06,
"loss": 0.3507,
"step": 15425
},
{
"epoch": 1.83,
"learning_rate": 5.669565217391305e-06,
"loss": 0.3359,
"step": 15450
},
{
"epoch": 1.84,
"learning_rate": 5.66231884057971e-06,
"loss": 0.3132,
"step": 15475
},
{
"epoch": 1.84,
"learning_rate": 5.655072463768117e-06,
"loss": 0.2976,
"step": 15500
},
{
"epoch": 1.84,
"learning_rate": 5.6478260869565225e-06,
"loss": 0.3893,
"step": 15525
},
{
"epoch": 1.85,
"learning_rate": 5.6405797101449275e-06,
"loss": 0.3417,
"step": 15550
},
{
"epoch": 1.85,
"learning_rate": 5.633333333333334e-06,
"loss": 0.3462,
"step": 15575
},
{
"epoch": 1.85,
"learning_rate": 5.626086956521739e-06,
"loss": 0.3885,
"step": 15600
},
{
"epoch": 1.85,
"learning_rate": 5.618840579710145e-06,
"loss": 0.3844,
"step": 15625
},
{
"epoch": 1.86,
"learning_rate": 5.611594202898552e-06,
"loss": 0.3112,
"step": 15650
},
{
"epoch": 1.86,
"learning_rate": 5.604347826086957e-06,
"loss": 0.3266,
"step": 15675
},
{
"epoch": 1.86,
"learning_rate": 5.597101449275363e-06,
"loss": 0.3538,
"step": 15700
},
{
"epoch": 1.87,
"learning_rate": 5.589855072463769e-06,
"loss": 0.351,
"step": 15725
},
{
"epoch": 1.87,
"learning_rate": 5.582608695652174e-06,
"loss": 0.3373,
"step": 15750
},
{
"epoch": 1.87,
"learning_rate": 5.57536231884058e-06,
"loss": 0.4156,
"step": 15775
},
{
"epoch": 1.87,
"learning_rate": 5.568115942028985e-06,
"loss": 0.4124,
"step": 15800
},
{
"epoch": 1.88,
"learning_rate": 5.560869565217392e-06,
"loss": 0.3716,
"step": 15825
},
{
"epoch": 1.88,
"learning_rate": 5.553623188405798e-06,
"loss": 0.5276,
"step": 15850
},
{
"epoch": 1.88,
"learning_rate": 5.546376811594203e-06,
"loss": 0.3412,
"step": 15875
},
{
"epoch": 1.89,
"learning_rate": 5.5391304347826094e-06,
"loss": 0.3293,
"step": 15900
},
{
"epoch": 1.89,
"learning_rate": 5.531884057971015e-06,
"loss": 0.3759,
"step": 15925
},
{
"epoch": 1.89,
"learning_rate": 5.52463768115942e-06,
"loss": 0.3926,
"step": 15950
},
{
"epoch": 1.9,
"learning_rate": 5.517391304347827e-06,
"loss": 0.3686,
"step": 15975
},
{
"epoch": 1.9,
"learning_rate": 5.510144927536233e-06,
"loss": 0.3282,
"step": 16000
},
{
"epoch": 1.9,
"eval_cer": 7.108072212110778,
"eval_loss": 0.39232152700424194,
"eval_runtime": 3154.8615,
"eval_samples_per_second": 0.787,
"eval_steps_per_second": 0.393,
"eval_wer": 19.265103868877453,
"step": 16000
},
{
"epoch": 1.9,
"learning_rate": 5.502898550724638e-06,
"loss": 0.3279,
"step": 16025
},
{
"epoch": 1.9,
"learning_rate": 5.4956521739130446e-06,
"loss": 0.4442,
"step": 16050
},
{
"epoch": 1.91,
"learning_rate": 5.4884057971014496e-06,
"loss": 0.4354,
"step": 16075
},
{
"epoch": 1.91,
"learning_rate": 5.481159420289855e-06,
"loss": 0.362,
"step": 16100
},
{
"epoch": 1.91,
"learning_rate": 5.473913043478261e-06,
"loss": 0.3849,
"step": 16125
},
{
"epoch": 1.92,
"learning_rate": 5.466666666666667e-06,
"loss": 0.3956,
"step": 16150
},
{
"epoch": 1.92,
"learning_rate": 5.459420289855073e-06,
"loss": 0.2881,
"step": 16175
},
{
"epoch": 1.92,
"learning_rate": 5.452173913043479e-06,
"loss": 0.3321,
"step": 16200
},
{
"epoch": 1.93,
"learning_rate": 5.444927536231885e-06,
"loss": 0.3512,
"step": 16225
},
{
"epoch": 1.93,
"learning_rate": 5.4376811594202905e-06,
"loss": 0.3227,
"step": 16250
},
{
"epoch": 1.93,
"learning_rate": 5.4304347826086955e-06,
"loss": 0.3204,
"step": 16275
},
{
"epoch": 1.93,
"learning_rate": 5.423188405797101e-06,
"loss": 0.2884,
"step": 16300
},
{
"epoch": 1.94,
"learning_rate": 5.415942028985508e-06,
"loss": 0.3259,
"step": 16325
},
{
"epoch": 1.94,
"learning_rate": 5.408695652173913e-06,
"loss": 0.3611,
"step": 16350
},
{
"epoch": 1.94,
"learning_rate": 5.401449275362319e-06,
"loss": 0.3598,
"step": 16375
},
{
"epoch": 1.95,
"learning_rate": 5.394202898550726e-06,
"loss": 0.3911,
"step": 16400
},
{
"epoch": 1.95,
"learning_rate": 5.386956521739131e-06,
"loss": 0.4117,
"step": 16425
},
{
"epoch": 1.95,
"learning_rate": 5.3797101449275365e-06,
"loss": 0.4095,
"step": 16450
},
{
"epoch": 1.96,
"learning_rate": 5.3724637681159415e-06,
"loss": 0.3033,
"step": 16475
},
{
"epoch": 1.96,
"learning_rate": 5.365217391304348e-06,
"loss": 0.3534,
"step": 16500
},
{
"epoch": 1.96,
"learning_rate": 5.357971014492754e-06,
"loss": 0.2906,
"step": 16525
},
{
"epoch": 1.96,
"learning_rate": 5.350724637681159e-06,
"loss": 0.2948,
"step": 16550
},
{
"epoch": 1.97,
"learning_rate": 5.343478260869566e-06,
"loss": 0.2731,
"step": 16575
},
{
"epoch": 1.97,
"learning_rate": 5.336231884057972e-06,
"loss": 0.3218,
"step": 16600
},
{
"epoch": 1.97,
"learning_rate": 5.328985507246377e-06,
"loss": 0.328,
"step": 16625
},
{
"epoch": 1.98,
"learning_rate": 5.321739130434783e-06,
"loss": 0.274,
"step": 16650
},
{
"epoch": 1.98,
"learning_rate": 5.314492753623189e-06,
"loss": 0.2936,
"step": 16675
},
{
"epoch": 1.98,
"learning_rate": 5.307246376811594e-06,
"loss": 0.3601,
"step": 16700
},
{
"epoch": 1.98,
"learning_rate": 5.3002898550724646e-06,
"loss": 0.4228,
"step": 16725
},
{
"epoch": 1.99,
"learning_rate": 5.2930434782608696e-06,
"loss": 0.3024,
"step": 16750
},
{
"epoch": 1.99,
"learning_rate": 5.285797101449276e-06,
"loss": 0.3463,
"step": 16775
},
{
"epoch": 1.99,
"learning_rate": 5.278550724637682e-06,
"loss": 0.3282,
"step": 16800
},
{
"epoch": 2.0,
"learning_rate": 5.271304347826087e-06,
"loss": 0.3138,
"step": 16825
},
{
"epoch": 2.0,
"learning_rate": 5.264057971014494e-06,
"loss": 0.3608,
"step": 16850
},
{
"epoch": 2.0,
"learning_rate": 5.256811594202899e-06,
"loss": 0.2716,
"step": 16875
},
{
"epoch": 2.01,
"learning_rate": 5.249565217391305e-06,
"loss": 0.4661,
"step": 16900
},
{
"epoch": 2.01,
"learning_rate": 5.242318840579711e-06,
"loss": 0.2482,
"step": 16925
},
{
"epoch": 2.01,
"learning_rate": 5.235072463768116e-06,
"loss": 0.34,
"step": 16950
},
{
"epoch": 2.01,
"learning_rate": 5.227826086956522e-06,
"loss": 0.3228,
"step": 16975
},
{
"epoch": 2.02,
"learning_rate": 5.220579710144928e-06,
"loss": 0.3196,
"step": 17000
},
{
"epoch": 2.02,
"eval_cer": 7.224900388607408,
"eval_loss": 0.39229413866996765,
"eval_runtime": 3162.0207,
"eval_samples_per_second": 0.785,
"eval_steps_per_second": 0.392,
"eval_wer": 19.335239184295787,
"step": 17000
},
{
"epoch": 2.02,
"learning_rate": 5.213333333333334e-06,
"loss": 0.2583,
"step": 17025
},
{
"epoch": 2.02,
"learning_rate": 5.20608695652174e-06,
"loss": 0.248,
"step": 17050
},
{
"epoch": 2.03,
"learning_rate": 5.198840579710145e-06,
"loss": 0.2901,
"step": 17075
},
{
"epoch": 2.03,
"learning_rate": 5.191594202898551e-06,
"loss": 0.2492,
"step": 17100
},
{
"epoch": 2.03,
"learning_rate": 5.184347826086957e-06,
"loss": 0.3115,
"step": 17125
},
{
"epoch": 2.04,
"learning_rate": 5.177101449275362e-06,
"loss": 0.3328,
"step": 17150
},
{
"epoch": 2.04,
"learning_rate": 5.169855072463768e-06,
"loss": 0.2782,
"step": 17175
},
{
"epoch": 2.04,
"learning_rate": 5.162608695652175e-06,
"loss": 0.2778,
"step": 17200
},
{
"epoch": 2.04,
"learning_rate": 5.15536231884058e-06,
"loss": 0.2721,
"step": 17225
},
{
"epoch": 2.05,
"learning_rate": 5.148115942028986e-06,
"loss": 0.361,
"step": 17250
},
{
"epoch": 2.05,
"learning_rate": 5.140869565217391e-06,
"loss": 0.3612,
"step": 17275
},
{
"epoch": 2.05,
"learning_rate": 5.1336231884057975e-06,
"loss": 0.2824,
"step": 17300
},
{
"epoch": 2.06,
"learning_rate": 5.126376811594203e-06,
"loss": 0.2909,
"step": 17325
},
{
"epoch": 2.06,
"learning_rate": 5.119130434782608e-06,
"loss": 0.2773,
"step": 17350
},
{
"epoch": 2.06,
"learning_rate": 5.111884057971015e-06,
"loss": 0.3971,
"step": 17375
},
{
"epoch": 2.06,
"learning_rate": 5.104637681159421e-06,
"loss": 0.2334,
"step": 17400
},
{
"epoch": 2.07,
"learning_rate": 5.097391304347826e-06,
"loss": 0.3899,
"step": 17425
},
{
"epoch": 2.07,
"learning_rate": 5.090144927536233e-06,
"loss": 0.321,
"step": 17450
},
{
"epoch": 2.07,
"learning_rate": 5.082898550724638e-06,
"loss": 0.2295,
"step": 17475
},
{
"epoch": 2.08,
"learning_rate": 5.0756521739130435e-06,
"loss": 0.278,
"step": 17500
},
{
"epoch": 2.08,
"learning_rate": 5.06840579710145e-06,
"loss": 0.2696,
"step": 17525
},
{
"epoch": 2.08,
"learning_rate": 5.061159420289855e-06,
"loss": 0.2604,
"step": 17550
},
{
"epoch": 2.09,
"learning_rate": 5.053913043478261e-06,
"loss": 0.3015,
"step": 17575
},
{
"epoch": 2.09,
"learning_rate": 5.046666666666668e-06,
"loss": 0.1998,
"step": 17600
},
{
"epoch": 2.09,
"learning_rate": 5.039420289855073e-06,
"loss": 0.3426,
"step": 17625
},
{
"epoch": 2.09,
"learning_rate": 5.032173913043479e-06,
"loss": 0.3037,
"step": 17650
},
{
"epoch": 2.1,
"learning_rate": 5.024927536231885e-06,
"loss": 0.3063,
"step": 17675
},
{
"epoch": 2.1,
"learning_rate": 5.01768115942029e-06,
"loss": 0.2932,
"step": 17700
},
{
"epoch": 2.1,
"learning_rate": 5.010434782608696e-06,
"loss": 0.3028,
"step": 17725
},
{
"epoch": 2.11,
"learning_rate": 5.003188405797101e-06,
"loss": 0.2644,
"step": 17750
},
{
"epoch": 2.11,
"learning_rate": 4.995942028985508e-06,
"loss": 0.2902,
"step": 17775
},
{
"epoch": 2.11,
"learning_rate": 4.988695652173913e-06,
"loss": 0.2816,
"step": 17800
},
{
"epoch": 2.12,
"learning_rate": 4.98144927536232e-06,
"loss": 0.3323,
"step": 17825
},
{
"epoch": 2.12,
"learning_rate": 4.9742028985507255e-06,
"loss": 0.2923,
"step": 17850
},
{
"epoch": 2.12,
"learning_rate": 4.9669565217391305e-06,
"loss": 0.3281,
"step": 17875
},
{
"epoch": 2.12,
"learning_rate": 4.959710144927536e-06,
"loss": 0.3877,
"step": 17900
},
{
"epoch": 2.13,
"learning_rate": 4.952463768115943e-06,
"loss": 0.372,
"step": 17925
},
{
"epoch": 2.13,
"learning_rate": 4.945217391304348e-06,
"loss": 0.2854,
"step": 17950
},
{
"epoch": 2.13,
"learning_rate": 4.937971014492754e-06,
"loss": 0.3001,
"step": 17975
},
{
"epoch": 2.14,
"learning_rate": 4.93072463768116e-06,
"loss": 0.3251,
"step": 18000
},
{
"epoch": 2.14,
"eval_cer": 7.176078508534606,
"eval_loss": 0.39806175231933594,
"eval_runtime": 3134.0346,
"eval_samples_per_second": 0.792,
"eval_steps_per_second": 0.396,
"eval_wer": 19.483133218982278,
"step": 18000
},
{
"epoch": 2.14,
"learning_rate": 4.923478260869566e-06,
"loss": 0.3021,
"step": 18025
},
{
"epoch": 2.14,
"learning_rate": 4.9162318840579714e-06,
"loss": 0.2846,
"step": 18050
},
{
"epoch": 2.14,
"learning_rate": 4.908985507246377e-06,
"loss": 0.284,
"step": 18075
},
{
"epoch": 2.15,
"learning_rate": 4.901739130434783e-06,
"loss": 0.2423,
"step": 18100
},
{
"epoch": 2.15,
"learning_rate": 4.894492753623189e-06,
"loss": 0.2551,
"step": 18125
},
{
"epoch": 2.15,
"learning_rate": 4.887246376811595e-06,
"loss": 0.4317,
"step": 18150
},
{
"epoch": 2.16,
"learning_rate": 4.880000000000001e-06,
"loss": 0.4729,
"step": 18175
},
{
"epoch": 2.16,
"learning_rate": 4.872753623188406e-06,
"loss": 0.2887,
"step": 18200
},
{
"epoch": 2.16,
"learning_rate": 4.865507246376812e-06,
"loss": 0.4263,
"step": 18225
},
{
"epoch": 2.17,
"learning_rate": 4.8582608695652174e-06,
"loss": 0.3566,
"step": 18250
},
{
"epoch": 2.17,
"learning_rate": 4.851014492753623e-06,
"loss": 0.3274,
"step": 18275
},
{
"epoch": 2.17,
"learning_rate": 4.843768115942029e-06,
"loss": 0.2818,
"step": 18300
},
{
"epoch": 2.17,
"learning_rate": 4.836521739130435e-06,
"loss": 0.29,
"step": 18325
},
{
"epoch": 2.18,
"learning_rate": 4.829275362318841e-06,
"loss": 0.3009,
"step": 18350
},
{
"epoch": 2.18,
"learning_rate": 4.822028985507247e-06,
"loss": 0.3663,
"step": 18375
},
{
"epoch": 2.18,
"learning_rate": 4.8147826086956526e-06,
"loss": 0.2181,
"step": 18400
},
{
"epoch": 2.19,
"learning_rate": 4.807536231884058e-06,
"loss": 0.4402,
"step": 18425
},
{
"epoch": 2.19,
"learning_rate": 4.800289855072464e-06,
"loss": 0.3224,
"step": 18450
},
{
"epoch": 2.19,
"learning_rate": 4.79304347826087e-06,
"loss": 0.4503,
"step": 18475
},
{
"epoch": 2.2,
"learning_rate": 4.785797101449276e-06,
"loss": 0.3597,
"step": 18500
},
{
"epoch": 2.2,
"learning_rate": 4.778550724637682e-06,
"loss": 0.3584,
"step": 18525
},
{
"epoch": 2.2,
"learning_rate": 4.771304347826088e-06,
"loss": 0.3391,
"step": 18550
},
{
"epoch": 2.2,
"learning_rate": 4.764057971014493e-06,
"loss": 0.3192,
"step": 18575
},
{
"epoch": 2.21,
"learning_rate": 4.756811594202899e-06,
"loss": 0.3671,
"step": 18600
},
{
"epoch": 2.21,
"learning_rate": 4.749565217391305e-06,
"loss": 0.3506,
"step": 18625
},
{
"epoch": 2.21,
"learning_rate": 4.74231884057971e-06,
"loss": 0.3515,
"step": 18650
},
{
"epoch": 2.22,
"learning_rate": 4.735072463768116e-06,
"loss": 0.2615,
"step": 18675
},
{
"epoch": 2.22,
"learning_rate": 4.727826086956522e-06,
"loss": 0.2509,
"step": 18700
},
{
"epoch": 2.22,
"learning_rate": 4.720579710144928e-06,
"loss": 0.3,
"step": 18725
},
{
"epoch": 2.22,
"learning_rate": 4.713333333333334e-06,
"loss": 0.302,
"step": 18750
},
{
"epoch": 2.23,
"learning_rate": 4.7060869565217395e-06,
"loss": 0.2971,
"step": 18775
},
{
"epoch": 2.23,
"learning_rate": 4.698840579710145e-06,
"loss": 0.4138,
"step": 18800
},
{
"epoch": 2.23,
"learning_rate": 4.691594202898551e-06,
"loss": 0.296,
"step": 18825
},
{
"epoch": 2.24,
"learning_rate": 4.684347826086957e-06,
"loss": 0.2533,
"step": 18850
},
{
"epoch": 2.24,
"learning_rate": 4.677101449275362e-06,
"loss": 0.2477,
"step": 18875
},
{
"epoch": 2.24,
"learning_rate": 4.669855072463769e-06,
"loss": 0.2952,
"step": 18900
},
{
"epoch": 2.25,
"learning_rate": 4.662608695652175e-06,
"loss": 0.2471,
"step": 18925
},
{
"epoch": 2.25,
"learning_rate": 4.65536231884058e-06,
"loss": 0.2664,
"step": 18950
},
{
"epoch": 2.25,
"learning_rate": 4.6481159420289855e-06,
"loss": 0.2127,
"step": 18975
},
{
"epoch": 2.25,
"learning_rate": 4.640869565217392e-06,
"loss": 0.4162,
"step": 19000
},
{
"epoch": 2.25,
"eval_cer": 7.059004377982194,
"eval_loss": 0.39584028720855713,
"eval_runtime": 3153.6429,
"eval_samples_per_second": 0.787,
"eval_steps_per_second": 0.394,
"eval_wer": 19.057747284162378,
"step": 19000
},
{
"epoch": 2.26,
"learning_rate": 4.633623188405797e-06,
"loss": 0.286,
"step": 19025
},
{
"epoch": 2.26,
"learning_rate": 4.626376811594203e-06,
"loss": 0.2912,
"step": 19050
},
{
"epoch": 2.26,
"learning_rate": 4.619130434782609e-06,
"loss": 0.2905,
"step": 19075
},
{
"epoch": 2.27,
"learning_rate": 4.611884057971015e-06,
"loss": 0.333,
"step": 19100
},
{
"epoch": 2.27,
"learning_rate": 4.604637681159421e-06,
"loss": 0.2647,
"step": 19125
},
{
"epoch": 2.27,
"learning_rate": 4.5973913043478265e-06,
"loss": 0.2746,
"step": 19150
},
{
"epoch": 2.28,
"learning_rate": 4.590144927536232e-06,
"loss": 0.3317,
"step": 19175
},
{
"epoch": 2.28,
"learning_rate": 4.582898550724638e-06,
"loss": 0.2549,
"step": 19200
},
{
"epoch": 2.28,
"learning_rate": 4.575652173913044e-06,
"loss": 0.312,
"step": 19225
},
{
"epoch": 2.28,
"learning_rate": 4.56840579710145e-06,
"loss": 0.3177,
"step": 19250
},
{
"epoch": 2.29,
"learning_rate": 4.561159420289856e-06,
"loss": 0.3063,
"step": 19275
},
{
"epoch": 2.29,
"learning_rate": 4.553913043478262e-06,
"loss": 0.3964,
"step": 19300
},
{
"epoch": 2.29,
"learning_rate": 4.546666666666667e-06,
"loss": 0.3377,
"step": 19325
},
{
"epoch": 2.3,
"learning_rate": 4.5394202898550725e-06,
"loss": 0.2753,
"step": 19350
},
{
"epoch": 2.3,
"learning_rate": 4.532173913043479e-06,
"loss": 0.2735,
"step": 19375
},
{
"epoch": 2.3,
"learning_rate": 4.524927536231884e-06,
"loss": 0.292,
"step": 19400
},
{
"epoch": 2.31,
"learning_rate": 4.51768115942029e-06,
"loss": 0.2894,
"step": 19425
},
{
"epoch": 2.31,
"learning_rate": 4.510434782608696e-06,
"loss": 0.367,
"step": 19450
},
{
"epoch": 2.31,
"learning_rate": 4.503188405797102e-06,
"loss": 0.2483,
"step": 19475
},
{
"epoch": 2.31,
"learning_rate": 4.495942028985508e-06,
"loss": 0.4151,
"step": 19500
},
{
"epoch": 2.32,
"learning_rate": 4.4886956521739134e-06,
"loss": 0.269,
"step": 19525
},
{
"epoch": 2.32,
"learning_rate": 4.481449275362319e-06,
"loss": 0.3127,
"step": 19550
},
{
"epoch": 2.32,
"learning_rate": 4.474202898550725e-06,
"loss": 0.2615,
"step": 19575
},
{
"epoch": 2.33,
"learning_rate": 4.466956521739131e-06,
"loss": 0.2606,
"step": 19600
},
{
"epoch": 2.33,
"learning_rate": 4.459710144927537e-06,
"loss": 0.2855,
"step": 19625
},
{
"epoch": 2.33,
"learning_rate": 4.452463768115942e-06,
"loss": 0.2419,
"step": 19650
},
{
"epoch": 2.33,
"learning_rate": 4.4452173913043486e-06,
"loss": 0.3292,
"step": 19675
},
{
"epoch": 2.34,
"learning_rate": 4.4379710144927544e-06,
"loss": 0.2821,
"step": 19700
},
{
"epoch": 2.34,
"learning_rate": 4.4307246376811594e-06,
"loss": 0.3189,
"step": 19725
},
{
"epoch": 2.34,
"learning_rate": 4.423478260869565e-06,
"loss": 0.286,
"step": 19750
},
{
"epoch": 2.35,
"learning_rate": 4.416231884057971e-06,
"loss": 0.2853,
"step": 19775
},
{
"epoch": 2.35,
"learning_rate": 4.408985507246377e-06,
"loss": 0.2835,
"step": 19800
},
{
"epoch": 2.35,
"learning_rate": 4.401739130434783e-06,
"loss": 0.2626,
"step": 19825
},
{
"epoch": 2.36,
"learning_rate": 4.394492753623189e-06,
"loss": 0.3301,
"step": 19850
},
{
"epoch": 2.36,
"learning_rate": 4.3872463768115946e-06,
"loss": 0.3094,
"step": 19875
},
{
"epoch": 2.36,
"learning_rate": 4.380289855072464e-06,
"loss": 0.2322,
"step": 19900
},
{
"epoch": 2.36,
"learning_rate": 4.37304347826087e-06,
"loss": 0.3167,
"step": 19925
},
{
"epoch": 2.37,
"learning_rate": 4.365797101449276e-06,
"loss": 0.3029,
"step": 19950
},
{
"epoch": 2.37,
"learning_rate": 4.358550724637682e-06,
"loss": 0.2892,
"step": 19975
},
{
"epoch": 2.37,
"learning_rate": 4.3513043478260875e-06,
"loss": 0.2851,
"step": 20000
},
{
"epoch": 2.37,
"eval_cer": 7.0167002803876235,
"eval_loss": 0.39532455801963806,
"eval_runtime": 3151.9912,
"eval_samples_per_second": 0.787,
"eval_steps_per_second": 0.394,
"eval_wer": 19.209453020773775,
"step": 20000
},
{
"epoch": 2.38,
"learning_rate": 4.344057971014493e-06,
"loss": 0.2749,
"step": 20025
},
{
"epoch": 2.38,
"learning_rate": 4.336811594202899e-06,
"loss": 0.3344,
"step": 20050
},
{
"epoch": 2.38,
"learning_rate": 4.329565217391305e-06,
"loss": 0.2773,
"step": 20075
},
{
"epoch": 2.39,
"learning_rate": 4.322318840579711e-06,
"loss": 0.2361,
"step": 20100
},
{
"epoch": 2.39,
"learning_rate": 4.315072463768116e-06,
"loss": 0.2254,
"step": 20125
},
{
"epoch": 2.39,
"learning_rate": 4.307826086956522e-06,
"loss": 0.2396,
"step": 20150
},
{
"epoch": 2.39,
"learning_rate": 4.3005797101449284e-06,
"loss": 0.2621,
"step": 20175
},
{
"epoch": 2.4,
"learning_rate": 4.2933333333333334e-06,
"loss": 0.31,
"step": 20200
},
{
"epoch": 2.4,
"learning_rate": 4.286086956521739e-06,
"loss": 0.3039,
"step": 20225
},
{
"epoch": 2.4,
"learning_rate": 4.278840579710145e-06,
"loss": 0.2772,
"step": 20250
},
{
"epoch": 2.41,
"learning_rate": 4.271594202898551e-06,
"loss": 0.2535,
"step": 20275
},
{
"epoch": 2.41,
"learning_rate": 4.264347826086957e-06,
"loss": 0.2903,
"step": 20300
},
{
"epoch": 2.41,
"learning_rate": 4.257101449275363e-06,
"loss": 0.3347,
"step": 20325
},
{
"epoch": 2.41,
"learning_rate": 4.2498550724637686e-06,
"loss": 0.3133,
"step": 20350
},
{
"epoch": 2.42,
"learning_rate": 4.2426086956521744e-06,
"loss": 0.2631,
"step": 20375
},
{
"epoch": 2.42,
"learning_rate": 4.23536231884058e-06,
"loss": 0.2973,
"step": 20400
},
{
"epoch": 2.42,
"learning_rate": 4.228115942028986e-06,
"loss": 0.2731,
"step": 20425
},
{
"epoch": 2.43,
"learning_rate": 4.220869565217391e-06,
"loss": 0.3088,
"step": 20450
},
{
"epoch": 2.43,
"learning_rate": 4.213623188405798e-06,
"loss": 0.3291,
"step": 20475
},
{
"epoch": 2.43,
"learning_rate": 4.206376811594204e-06,
"loss": 0.2447,
"step": 20500
},
{
"epoch": 2.44,
"learning_rate": 4.199130434782609e-06,
"loss": 0.3862,
"step": 20525
},
{
"epoch": 2.44,
"learning_rate": 4.1918840579710146e-06,
"loss": 0.3494,
"step": 20550
},
{
"epoch": 2.44,
"learning_rate": 4.18463768115942e-06,
"loss": 0.314,
"step": 20575
},
{
"epoch": 2.44,
"learning_rate": 4.177391304347826e-06,
"loss": 0.3158,
"step": 20600
},
{
"epoch": 2.45,
"learning_rate": 4.170144927536232e-06,
"loss": 0.2839,
"step": 20625
},
{
"epoch": 2.45,
"learning_rate": 4.162898550724638e-06,
"loss": 0.2518,
"step": 20650
},
{
"epoch": 2.45,
"learning_rate": 4.155652173913044e-06,
"loss": 0.3692,
"step": 20675
},
{
"epoch": 2.46,
"learning_rate": 4.14840579710145e-06,
"loss": 0.2712,
"step": 20700
},
{
"epoch": 2.46,
"learning_rate": 4.1411594202898555e-06,
"loss": 0.2804,
"step": 20725
},
{
"epoch": 2.46,
"learning_rate": 4.1339130434782605e-06,
"loss": 0.3514,
"step": 20750
},
{
"epoch": 2.47,
"learning_rate": 4.126666666666667e-06,
"loss": 0.2892,
"step": 20775
},
{
"epoch": 2.47,
"learning_rate": 4.119420289855073e-06,
"loss": 0.2898,
"step": 20800
},
{
"epoch": 2.47,
"learning_rate": 4.112173913043478e-06,
"loss": 0.3071,
"step": 20825
},
{
"epoch": 2.47,
"learning_rate": 4.104927536231885e-06,
"loss": 0.2719,
"step": 20850
},
{
"epoch": 2.48,
"learning_rate": 4.097681159420291e-06,
"loss": 0.3628,
"step": 20875
},
{
"epoch": 2.48,
"learning_rate": 4.090434782608696e-06,
"loss": 0.3201,
"step": 20900
},
{
"epoch": 2.48,
"learning_rate": 4.0831884057971015e-06,
"loss": 0.3166,
"step": 20925
},
{
"epoch": 2.49,
"learning_rate": 4.075942028985508e-06,
"loss": 0.3418,
"step": 20950
},
{
"epoch": 2.49,
"learning_rate": 4.068695652173913e-06,
"loss": 0.288,
"step": 20975
},
{
"epoch": 2.49,
"learning_rate": 4.061449275362319e-06,
"loss": 0.2982,
"step": 21000
},
{
"epoch": 2.49,
"eval_cer": 6.842564808893699,
"eval_loss": 0.39293238520622253,
"eval_runtime": 3128.5672,
"eval_samples_per_second": 0.793,
"eval_steps_per_second": 0.397,
"eval_wer": 18.80998665904326,
"step": 21000
},
{
"epoch": 2.49,
"learning_rate": 4.054202898550725e-06,
"loss": 0.2191,
"step": 21025
},
{
"epoch": 2.5,
"learning_rate": 4.046956521739131e-06,
"loss": 0.3047,
"step": 21050
},
{
"epoch": 2.5,
"learning_rate": 4.039710144927537e-06,
"loss": 0.2752,
"step": 21075
},
{
"epoch": 2.5,
"learning_rate": 4.0324637681159425e-06,
"loss": 0.2675,
"step": 21100
},
{
"epoch": 2.51,
"learning_rate": 4.025217391304348e-06,
"loss": 0.2971,
"step": 21125
},
{
"epoch": 2.51,
"learning_rate": 4.017971014492754e-06,
"loss": 0.3199,
"step": 21150
},
{
"epoch": 2.51,
"learning_rate": 4.01072463768116e-06,
"loss": 0.2402,
"step": 21175
},
{
"epoch": 2.52,
"learning_rate": 4.003478260869565e-06,
"loss": 0.2752,
"step": 21200
},
{
"epoch": 2.52,
"learning_rate": 3.996231884057971e-06,
"loss": 0.3148,
"step": 21225
},
{
"epoch": 2.52,
"learning_rate": 3.988985507246378e-06,
"loss": 0.2471,
"step": 21250
},
{
"epoch": 2.52,
"learning_rate": 3.981739130434783e-06,
"loss": 0.2807,
"step": 21275
},
{
"epoch": 2.53,
"learning_rate": 3.9744927536231885e-06,
"loss": 0.2242,
"step": 21300
},
{
"epoch": 2.53,
"learning_rate": 3.967246376811594e-06,
"loss": 0.4252,
"step": 21325
},
{
"epoch": 2.53,
"learning_rate": 3.96e-06,
"loss": 0.2453,
"step": 21350
},
{
"epoch": 2.54,
"learning_rate": 3.952753623188406e-06,
"loss": 0.2282,
"step": 21375
},
{
"epoch": 2.54,
"learning_rate": 3.945507246376812e-06,
"loss": 0.353,
"step": 21400
},
{
"epoch": 2.54,
"learning_rate": 3.938260869565218e-06,
"loss": 0.3021,
"step": 21425
},
{
"epoch": 2.55,
"learning_rate": 3.931014492753624e-06,
"loss": 0.2803,
"step": 21450
},
{
"epoch": 2.55,
"learning_rate": 3.9237681159420295e-06,
"loss": 0.2523,
"step": 21475
},
{
"epoch": 2.55,
"learning_rate": 3.916521739130435e-06,
"loss": 0.2748,
"step": 21500
},
{
"epoch": 2.55,
"learning_rate": 3.90927536231884e-06,
"loss": 0.3106,
"step": 21525
},
{
"epoch": 2.56,
"learning_rate": 3.902028985507247e-06,
"loss": 0.3489,
"step": 21550
},
{
"epoch": 2.56,
"learning_rate": 3.894782608695653e-06,
"loss": 0.3188,
"step": 21575
},
{
"epoch": 2.56,
"learning_rate": 3.887536231884058e-06,
"loss": 0.3188,
"step": 21600
},
{
"epoch": 2.57,
"learning_rate": 3.880289855072465e-06,
"loss": 0.3178,
"step": 21625
},
{
"epoch": 2.57,
"learning_rate": 3.87304347826087e-06,
"loss": 0.2279,
"step": 21650
},
{
"epoch": 2.57,
"learning_rate": 3.8657971014492755e-06,
"loss": 0.2803,
"step": 21675
},
{
"epoch": 2.58,
"learning_rate": 3.858550724637681e-06,
"loss": 0.21,
"step": 21700
},
{
"epoch": 2.58,
"learning_rate": 3.851304347826087e-06,
"loss": 0.2753,
"step": 21725
},
{
"epoch": 2.58,
"learning_rate": 3.844057971014493e-06,
"loss": 0.4256,
"step": 21750
},
{
"epoch": 2.58,
"learning_rate": 3.836811594202899e-06,
"loss": 0.2934,
"step": 21775
},
{
"epoch": 2.59,
"learning_rate": 3.829565217391305e-06,
"loss": 0.3364,
"step": 21800
},
{
"epoch": 2.59,
"learning_rate": 3.822318840579711e-06,
"loss": 0.3053,
"step": 21825
},
{
"epoch": 2.59,
"learning_rate": 3.8150724637681164e-06,
"loss": 0.3143,
"step": 21850
},
{
"epoch": 2.6,
"learning_rate": 3.807826086956522e-06,
"loss": 0.2758,
"step": 21875
},
{
"epoch": 2.6,
"learning_rate": 3.8005797101449277e-06,
"loss": 0.2616,
"step": 21900
},
{
"epoch": 2.6,
"learning_rate": 3.793333333333334e-06,
"loss": 0.2949,
"step": 21925
},
{
"epoch": 2.6,
"learning_rate": 3.7860869565217394e-06,
"loss": 0.358,
"step": 21950
},
{
"epoch": 2.61,
"learning_rate": 3.7788405797101453e-06,
"loss": 0.2856,
"step": 21975
},
{
"epoch": 2.61,
"learning_rate": 3.7715942028985507e-06,
"loss": 0.3642,
"step": 22000
},
{
"epoch": 2.61,
"eval_cer": 6.886713561906636,
"eval_loss": 0.3953614830970764,
"eval_runtime": 3140.8887,
"eval_samples_per_second": 0.79,
"eval_steps_per_second": 0.395,
"eval_wer": 18.69716028206594,
"step": 22000
},
{
"epoch": 2.61,
"learning_rate": 3.764347826086957e-06,
"loss": 0.283,
"step": 22025
},
{
"epoch": 2.62,
"learning_rate": 3.757101449275363e-06,
"loss": 0.3267,
"step": 22050
},
{
"epoch": 2.62,
"learning_rate": 3.7498550724637683e-06,
"loss": 0.3271,
"step": 22075
},
{
"epoch": 2.62,
"learning_rate": 3.742608695652174e-06,
"loss": 0.3372,
"step": 22100
},
{
"epoch": 2.63,
"learning_rate": 3.7353623188405804e-06,
"loss": 0.2551,
"step": 22125
},
{
"epoch": 2.63,
"learning_rate": 3.728115942028986e-06,
"loss": 0.3063,
"step": 22150
},
{
"epoch": 2.63,
"learning_rate": 3.7208695652173917e-06,
"loss": 0.2902,
"step": 22175
},
{
"epoch": 2.63,
"learning_rate": 3.713623188405797e-06,
"loss": 0.255,
"step": 22200
},
{
"epoch": 2.64,
"learning_rate": 3.7063768115942034e-06,
"loss": 0.3041,
"step": 22225
},
{
"epoch": 2.64,
"learning_rate": 3.699130434782609e-06,
"loss": 0.3338,
"step": 22250
},
{
"epoch": 2.64,
"learning_rate": 3.6918840579710147e-06,
"loss": 0.2509,
"step": 22275
},
{
"epoch": 2.65,
"learning_rate": 3.68463768115942e-06,
"loss": 0.2996,
"step": 22300
},
{
"epoch": 2.65,
"learning_rate": 3.6773913043478264e-06,
"loss": 0.3299,
"step": 22325
},
{
"epoch": 2.65,
"learning_rate": 3.6701449275362323e-06,
"loss": 0.234,
"step": 22350
},
{
"epoch": 2.66,
"learning_rate": 3.6628985507246377e-06,
"loss": 0.304,
"step": 22375
},
{
"epoch": 2.66,
"learning_rate": 3.6556521739130435e-06,
"loss": 0.3406,
"step": 22400
},
{
"epoch": 2.66,
"learning_rate": 3.64840579710145e-06,
"loss": 0.2437,
"step": 22425
},
{
"epoch": 2.66,
"learning_rate": 3.6411594202898552e-06,
"loss": 0.4036,
"step": 22450
},
{
"epoch": 2.67,
"learning_rate": 3.633913043478261e-06,
"loss": 0.431,
"step": 22475
},
{
"epoch": 2.67,
"learning_rate": 3.6266666666666674e-06,
"loss": 0.2864,
"step": 22500
},
{
"epoch": 2.67,
"learning_rate": 3.619420289855073e-06,
"loss": 0.2791,
"step": 22525
},
{
"epoch": 2.68,
"learning_rate": 3.6121739130434787e-06,
"loss": 0.2975,
"step": 22550
},
{
"epoch": 2.68,
"learning_rate": 3.604927536231884e-06,
"loss": 0.3252,
"step": 22575
},
{
"epoch": 2.68,
"learning_rate": 3.5976811594202904e-06,
"loss": 0.2389,
"step": 22600
},
{
"epoch": 2.68,
"learning_rate": 3.5904347826086962e-06,
"loss": 0.3063,
"step": 22625
},
{
"epoch": 2.69,
"learning_rate": 3.5831884057971017e-06,
"loss": 0.2614,
"step": 22650
},
{
"epoch": 2.69,
"learning_rate": 3.5759420289855075e-06,
"loss": 0.2833,
"step": 22675
},
{
"epoch": 2.69,
"learning_rate": 3.5686956521739134e-06,
"loss": 0.3931,
"step": 22700
},
{
"epoch": 2.7,
"learning_rate": 3.5614492753623192e-06,
"loss": 0.2804,
"step": 22725
},
{
"epoch": 2.7,
"learning_rate": 3.554202898550725e-06,
"loss": 0.2688,
"step": 22750
},
{
"epoch": 2.7,
"learning_rate": 3.5469565217391305e-06,
"loss": 0.2059,
"step": 22775
},
{
"epoch": 2.71,
"learning_rate": 3.5397101449275368e-06,
"loss": 0.3133,
"step": 22800
},
{
"epoch": 2.71,
"learning_rate": 3.5324637681159422e-06,
"loss": 0.2725,
"step": 22825
},
{
"epoch": 2.71,
"learning_rate": 3.525217391304348e-06,
"loss": 0.2712,
"step": 22850
},
{
"epoch": 2.71,
"learning_rate": 3.5179710144927535e-06,
"loss": 0.264,
"step": 22875
},
{
"epoch": 2.72,
"learning_rate": 3.5107246376811598e-06,
"loss": 0.2404,
"step": 22900
},
{
"epoch": 2.72,
"learning_rate": 3.5034782608695656e-06,
"loss": 0.3211,
"step": 22925
},
{
"epoch": 2.72,
"learning_rate": 3.496231884057971e-06,
"loss": 0.2726,
"step": 22950
},
{
"epoch": 2.73,
"learning_rate": 3.488985507246377e-06,
"loss": 0.399,
"step": 22975
},
{
"epoch": 2.73,
"learning_rate": 3.481739130434783e-06,
"loss": 0.2297,
"step": 23000
},
{
"epoch": 2.73,
"eval_cer": 6.938363913620936,
"eval_loss": 0.3916235566139221,
"eval_runtime": 3180.568,
"eval_samples_per_second": 0.78,
"eval_steps_per_second": 0.39,
"eval_wer": 18.73299028016009,
"step": 23000
},
{
"epoch": 2.73,
"learning_rate": 3.4744927536231886e-06,
"loss": 0.3484,
"step": 23025
},
{
"epoch": 2.74,
"learning_rate": 3.4672463768115945e-06,
"loss": 0.2585,
"step": 23050
},
{
"epoch": 2.74,
"learning_rate": 3.46e-06,
"loss": 0.2843,
"step": 23075
},
{
"epoch": 2.74,
"learning_rate": 3.452753623188406e-06,
"loss": 0.3526,
"step": 23100
},
{
"epoch": 2.74,
"learning_rate": 3.445507246376812e-06,
"loss": 0.3063,
"step": 23125
},
{
"epoch": 2.75,
"learning_rate": 3.4382608695652175e-06,
"loss": 0.3701,
"step": 23150
},
{
"epoch": 2.75,
"learning_rate": 3.4310144927536233e-06,
"loss": 0.2438,
"step": 23175
},
{
"epoch": 2.75,
"learning_rate": 3.4237681159420296e-06,
"loss": 0.3001,
"step": 23200
},
{
"epoch": 2.76,
"learning_rate": 3.416521739130435e-06,
"loss": 0.3103,
"step": 23225
},
{
"epoch": 2.76,
"learning_rate": 3.409275362318841e-06,
"loss": 0.2769,
"step": 23250
},
{
"epoch": 2.76,
"learning_rate": 3.4020289855072467e-06,
"loss": 0.4483,
"step": 23275
},
{
"epoch": 2.76,
"learning_rate": 3.3947826086956526e-06,
"loss": 0.2777,
"step": 23300
},
{
"epoch": 2.77,
"learning_rate": 3.387536231884058e-06,
"loss": 0.2413,
"step": 23325
},
{
"epoch": 2.77,
"learning_rate": 3.380289855072464e-06,
"loss": 0.2911,
"step": 23350
},
{
"epoch": 2.77,
"learning_rate": 3.37304347826087e-06,
"loss": 0.3544,
"step": 23375
},
{
"epoch": 2.78,
"learning_rate": 3.3657971014492756e-06,
"loss": 0.349,
"step": 23400
},
{
"epoch": 2.78,
"learning_rate": 3.3585507246376814e-06,
"loss": 0.3243,
"step": 23425
},
{
"epoch": 2.78,
"learning_rate": 3.351304347826087e-06,
"loss": 0.2601,
"step": 23450
},
{
"epoch": 2.79,
"learning_rate": 3.344057971014493e-06,
"loss": 0.268,
"step": 23475
},
{
"epoch": 2.79,
"learning_rate": 3.336811594202899e-06,
"loss": 0.294,
"step": 23500
},
{
"epoch": 2.79,
"learning_rate": 3.3295652173913044e-06,
"loss": 0.3095,
"step": 23525
},
{
"epoch": 2.79,
"learning_rate": 3.3223188405797103e-06,
"loss": 0.2588,
"step": 23550
},
{
"epoch": 2.8,
"learning_rate": 3.3150724637681166e-06,
"loss": 0.4027,
"step": 23575
},
{
"epoch": 2.8,
"learning_rate": 3.307826086956522e-06,
"loss": 0.2887,
"step": 23600
},
{
"epoch": 2.8,
"learning_rate": 3.300579710144928e-06,
"loss": 0.2459,
"step": 23625
},
{
"epoch": 2.81,
"learning_rate": 3.2933333333333333e-06,
"loss": 0.2288,
"step": 23650
},
{
"epoch": 2.81,
"learning_rate": 3.2860869565217396e-06,
"loss": 0.2998,
"step": 23675
},
{
"epoch": 2.81,
"learning_rate": 3.2788405797101454e-06,
"loss": 0.3197,
"step": 23700
},
{
"epoch": 2.82,
"learning_rate": 3.271594202898551e-06,
"loss": 0.2931,
"step": 23725
},
{
"epoch": 2.82,
"learning_rate": 3.2643478260869567e-06,
"loss": 0.2451,
"step": 23750
},
{
"epoch": 2.82,
"learning_rate": 3.2571014492753626e-06,
"loss": 0.251,
"step": 23775
},
{
"epoch": 2.82,
"learning_rate": 3.2498550724637684e-06,
"loss": 0.291,
"step": 23800
},
{
"epoch": 2.83,
"learning_rate": 3.2426086956521743e-06,
"loss": 0.2916,
"step": 23825
},
{
"epoch": 2.83,
"learning_rate": 3.2353623188405797e-06,
"loss": 0.3365,
"step": 23850
},
{
"epoch": 2.83,
"learning_rate": 3.228115942028986e-06,
"loss": 0.2967,
"step": 23875
},
{
"epoch": 2.84,
"learning_rate": 3.2208695652173914e-06,
"loss": 0.2435,
"step": 23900
},
{
"epoch": 2.84,
"learning_rate": 3.2136231884057973e-06,
"loss": 0.3885,
"step": 23925
},
{
"epoch": 2.84,
"learning_rate": 3.2063768115942027e-06,
"loss": 0.2373,
"step": 23950
},
{
"epoch": 2.85,
"learning_rate": 3.199130434782609e-06,
"loss": 0.3457,
"step": 23975
},
{
"epoch": 2.85,
"learning_rate": 3.191884057971015e-06,
"loss": 0.2313,
"step": 24000
},
{
"epoch": 2.85,
"eval_cer": 6.778493777362389,
"eval_loss": 0.3930225968360901,
"eval_runtime": 3191.3103,
"eval_samples_per_second": 0.778,
"eval_steps_per_second": 0.389,
"eval_wer": 18.60339241471317,
"step": 24000
},
{
"epoch": 2.85,
"learning_rate": 3.1846376811594202e-06,
"loss": 0.2984,
"step": 24025
},
{
"epoch": 2.85,
"learning_rate": 3.1773913043478265e-06,
"loss": 0.2425,
"step": 24050
},
{
"epoch": 2.86,
"learning_rate": 3.1701449275362324e-06,
"loss": 0.3009,
"step": 24075
},
{
"epoch": 2.86,
"learning_rate": 3.162898550724638e-06,
"loss": 0.251,
"step": 24100
},
{
"epoch": 2.86,
"learning_rate": 3.1556521739130437e-06,
"loss": 0.2794,
"step": 24125
},
{
"epoch": 2.87,
"learning_rate": 3.14840579710145e-06,
"loss": 0.326,
"step": 24150
},
{
"epoch": 2.87,
"learning_rate": 3.1414492753623194e-06,
"loss": 0.2487,
"step": 24175
},
{
"epoch": 2.87,
"learning_rate": 3.134202898550725e-06,
"loss": 0.2793,
"step": 24200
},
{
"epoch": 2.87,
"learning_rate": 3.1269565217391307e-06,
"loss": 0.3093,
"step": 24225
},
{
"epoch": 2.88,
"learning_rate": 3.119710144927536e-06,
"loss": 0.2536,
"step": 24250
},
{
"epoch": 2.88,
"learning_rate": 3.1124637681159424e-06,
"loss": 0.3143,
"step": 24275
},
{
"epoch": 2.88,
"learning_rate": 3.1052173913043483e-06,
"loss": 0.2409,
"step": 24300
},
{
"epoch": 2.89,
"learning_rate": 3.0979710144927537e-06,
"loss": 0.3879,
"step": 24325
},
{
"epoch": 2.89,
"learning_rate": 3.0907246376811596e-06,
"loss": 0.3521,
"step": 24350
},
{
"epoch": 2.89,
"learning_rate": 3.083478260869566e-06,
"loss": 0.2628,
"step": 24375
},
{
"epoch": 2.9,
"learning_rate": 3.0762318840579713e-06,
"loss": 0.2127,
"step": 24400
},
{
"epoch": 2.9,
"learning_rate": 3.068985507246377e-06,
"loss": 0.3071,
"step": 24425
},
{
"epoch": 2.9,
"learning_rate": 3.0617391304347826e-06,
"loss": 0.2488,
"step": 24450
},
{
"epoch": 2.9,
"learning_rate": 3.054492753623189e-06,
"loss": 0.2462,
"step": 24475
},
{
"epoch": 2.91,
"learning_rate": 3.0472463768115947e-06,
"loss": 0.2651,
"step": 24500
},
{
"epoch": 2.91,
"learning_rate": 3.04e-06,
"loss": 0.2555,
"step": 24525
},
{
"epoch": 2.91,
"learning_rate": 3.032753623188406e-06,
"loss": 0.2511,
"step": 24550
},
{
"epoch": 2.92,
"learning_rate": 3.025507246376812e-06,
"loss": 0.2761,
"step": 24575
},
{
"epoch": 2.92,
"learning_rate": 3.0182608695652177e-06,
"loss": 0.3315,
"step": 24600
},
{
"epoch": 2.92,
"learning_rate": 3.0110144927536235e-06,
"loss": 0.4222,
"step": 24625
},
{
"epoch": 2.93,
"learning_rate": 3.003768115942029e-06,
"loss": 0.252,
"step": 24650
},
{
"epoch": 2.93,
"learning_rate": 2.9965217391304352e-06,
"loss": 0.3424,
"step": 24675
},
{
"epoch": 2.93,
"learning_rate": 2.9892753623188407e-06,
"loss": 0.3086,
"step": 24700
},
{
"epoch": 2.93,
"learning_rate": 2.9820289855072465e-06,
"loss": 0.3246,
"step": 24725
},
{
"epoch": 2.94,
"learning_rate": 2.974782608695652e-06,
"loss": 0.4331,
"step": 24750
},
{
"epoch": 2.94,
"learning_rate": 2.9675362318840582e-06,
"loss": 0.2933,
"step": 24775
},
{
"epoch": 2.94,
"learning_rate": 2.960289855072464e-06,
"loss": 0.3234,
"step": 24800
},
{
"epoch": 2.95,
"learning_rate": 2.9530434782608695e-06,
"loss": 0.2495,
"step": 24825
},
{
"epoch": 2.95,
"learning_rate": 2.9457971014492754e-06,
"loss": 0.2506,
"step": 24850
},
{
"epoch": 2.95,
"learning_rate": 2.9385507246376817e-06,
"loss": 0.2862,
"step": 24875
},
{
"epoch": 2.95,
"learning_rate": 2.931304347826087e-06,
"loss": 0.2804,
"step": 24900
},
{
"epoch": 2.96,
"learning_rate": 2.924057971014493e-06,
"loss": 0.2659,
"step": 24925
},
{
"epoch": 2.96,
"learning_rate": 2.9168115942028992e-06,
"loss": 0.2801,
"step": 24950
},
{
"epoch": 2.96,
"learning_rate": 2.9095652173913046e-06,
"loss": 0.3455,
"step": 24975
},
{
"epoch": 2.97,
"learning_rate": 2.902608695652174e-06,
"loss": 0.2833,
"step": 25000
},
{
"epoch": 2.97,
"eval_cer": 6.855231442766491,
"eval_loss": 0.39096301794052124,
"eval_runtime": 3187.6224,
"eval_samples_per_second": 0.779,
"eval_steps_per_second": 0.389,
"eval_wer": 18.598056032018295,
"step": 25000
},
{
"epoch": 2.97,
"learning_rate": 2.89536231884058e-06,
"loss": 0.2299,
"step": 25025
},
{
"epoch": 2.97,
"learning_rate": 2.8881159420289854e-06,
"loss": 0.2482,
"step": 25050
},
{
"epoch": 2.98,
"learning_rate": 2.8808695652173917e-06,
"loss": 0.3388,
"step": 25075
},
{
"epoch": 2.98,
"learning_rate": 2.8736231884057975e-06,
"loss": 0.4429,
"step": 25100
},
{
"epoch": 2.98,
"learning_rate": 2.866376811594203e-06,
"loss": 0.2245,
"step": 25125
},
{
"epoch": 2.98,
"learning_rate": 2.859130434782609e-06,
"loss": 0.2648,
"step": 25150
},
{
"epoch": 2.99,
"learning_rate": 2.851884057971015e-06,
"loss": 0.1995,
"step": 25175
},
{
"epoch": 2.99,
"learning_rate": 2.8446376811594205e-06,
"loss": 0.2652,
"step": 25200
},
{
"epoch": 2.99,
"learning_rate": 2.8373913043478264e-06,
"loss": 0.2587,
"step": 25225
},
{
"epoch": 3.0,
"learning_rate": 2.830144927536232e-06,
"loss": 0.2889,
"step": 25250
},
{
"epoch": 3.0,
"learning_rate": 2.822898550724638e-06,
"loss": 0.2257,
"step": 25275
},
{
"epoch": 3.0,
"learning_rate": 2.815652173913044e-06,
"loss": 0.1742,
"step": 25300
},
{
"epoch": 3.01,
"learning_rate": 2.8084057971014494e-06,
"loss": 0.1856,
"step": 25325
},
{
"epoch": 3.01,
"learning_rate": 2.8011594202898552e-06,
"loss": 0.1801,
"step": 25350
},
{
"epoch": 3.01,
"learning_rate": 2.7939130434782615e-06,
"loss": 0.2185,
"step": 25375
},
{
"epoch": 3.01,
"learning_rate": 2.786666666666667e-06,
"loss": 0.2565,
"step": 25400
},
{
"epoch": 3.02,
"learning_rate": 2.779420289855073e-06,
"loss": 0.2026,
"step": 25425
},
{
"epoch": 3.02,
"learning_rate": 2.7721739130434782e-06,
"loss": 0.2373,
"step": 25450
},
{
"epoch": 3.02,
"learning_rate": 2.7649275362318845e-06,
"loss": 0.2406,
"step": 25475
},
{
"epoch": 3.03,
"learning_rate": 2.75768115942029e-06,
"loss": 0.4514,
"step": 25500
},
{
"epoch": 3.03,
"learning_rate": 2.750434782608696e-06,
"loss": 0.1876,
"step": 25525
},
{
"epoch": 3.03,
"learning_rate": 2.7431884057971012e-06,
"loss": 0.2703,
"step": 25550
},
{
"epoch": 3.03,
"learning_rate": 2.7359420289855075e-06,
"loss": 0.1749,
"step": 25575
},
{
"epoch": 3.04,
"learning_rate": 2.7286956521739134e-06,
"loss": 0.2088,
"step": 25600
},
{
"epoch": 3.04,
"learning_rate": 2.721449275362319e-06,
"loss": 0.2087,
"step": 25625
},
{
"epoch": 3.04,
"learning_rate": 2.7142028985507246e-06,
"loss": 0.3172,
"step": 25650
},
{
"epoch": 3.05,
"learning_rate": 2.706956521739131e-06,
"loss": 0.1898,
"step": 25675
},
{
"epoch": 3.05,
"learning_rate": 2.6997101449275364e-06,
"loss": 0.1685,
"step": 25700
},
{
"epoch": 3.05,
"learning_rate": 2.692463768115942e-06,
"loss": 0.1918,
"step": 25725
},
{
"epoch": 3.06,
"learning_rate": 2.6852173913043476e-06,
"loss": 0.2734,
"step": 25750
},
{
"epoch": 3.06,
"learning_rate": 2.677971014492754e-06,
"loss": 0.1485,
"step": 25775
},
{
"epoch": 3.06,
"learning_rate": 2.6707246376811598e-06,
"loss": 0.1542,
"step": 25800
},
{
"epoch": 3.06,
"learning_rate": 2.663478260869565e-06,
"loss": 0.1694,
"step": 25825
},
{
"epoch": 3.07,
"learning_rate": 2.6562318840579715e-06,
"loss": 0.1685,
"step": 25850
},
{
"epoch": 3.07,
"learning_rate": 2.6489855072463773e-06,
"loss": 0.1719,
"step": 25875
},
{
"epoch": 3.07,
"learning_rate": 2.6417391304347828e-06,
"loss": 0.1573,
"step": 25900
},
{
"epoch": 3.08,
"learning_rate": 2.6344927536231886e-06,
"loss": 0.2429,
"step": 25925
},
{
"epoch": 3.08,
"learning_rate": 2.6272463768115945e-06,
"loss": 0.1751,
"step": 25950
},
{
"epoch": 3.08,
"learning_rate": 2.6202898550724644e-06,
"loss": 0.2976,
"step": 25975
},
{
"epoch": 3.09,
"learning_rate": 2.61304347826087e-06,
"loss": 0.2509,
"step": 26000
},
{
"epoch": 3.09,
"eval_cer": 6.816493678980766,
"eval_loss": 0.3948805630207062,
"eval_runtime": 3174.2689,
"eval_samples_per_second": 0.782,
"eval_steps_per_second": 0.391,
"eval_wer": 18.518010291595196,
"step": 26000
},
{
"epoch": 3.09,
"learning_rate": 2.6057971014492757e-06,
"loss": 0.377,
"step": 26025
},
{
"epoch": 3.09,
"learning_rate": 2.598550724637681e-06,
"loss": 0.1902,
"step": 26050
},
{
"epoch": 3.09,
"learning_rate": 2.5913043478260874e-06,
"loss": 0.2086,
"step": 26075
},
{
"epoch": 3.1,
"learning_rate": 2.5840579710144932e-06,
"loss": 0.269,
"step": 26100
},
{
"epoch": 3.1,
"learning_rate": 2.5768115942028987e-06,
"loss": 0.2287,
"step": 26125
},
{
"epoch": 3.1,
"learning_rate": 2.5695652173913045e-06,
"loss": 0.2673,
"step": 26150
},
{
"epoch": 3.11,
"learning_rate": 2.562318840579711e-06,
"loss": 0.1238,
"step": 26175
},
{
"epoch": 3.11,
"learning_rate": 2.5550724637681162e-06,
"loss": 0.2047,
"step": 26200
},
{
"epoch": 3.11,
"learning_rate": 2.547826086956522e-06,
"loss": 0.3,
"step": 26225
},
{
"epoch": 3.11,
"learning_rate": 2.5405797101449275e-06,
"loss": 0.201,
"step": 26250
},
{
"epoch": 3.12,
"learning_rate": 2.5333333333333338e-06,
"loss": 0.1864,
"step": 26275
},
{
"epoch": 3.12,
"learning_rate": 2.5260869565217392e-06,
"loss": 0.2565,
"step": 26300
},
{
"epoch": 3.12,
"learning_rate": 2.518840579710145e-06,
"loss": 0.189,
"step": 26325
},
{
"epoch": 3.13,
"learning_rate": 2.511594202898551e-06,
"loss": 0.2006,
"step": 26350
},
{
"epoch": 3.13,
"learning_rate": 2.5043478260869568e-06,
"loss": 0.1992,
"step": 26375
},
{
"epoch": 3.13,
"learning_rate": 2.4971014492753626e-06,
"loss": 0.1742,
"step": 26400
},
{
"epoch": 3.14,
"learning_rate": 2.489855072463768e-06,
"loss": 0.1909,
"step": 26425
},
{
"epoch": 3.14,
"learning_rate": 2.4826086956521743e-06,
"loss": 0.1935,
"step": 26450
},
{
"epoch": 3.14,
"learning_rate": 2.4753623188405798e-06,
"loss": 0.2335,
"step": 26475
},
{
"epoch": 3.14,
"learning_rate": 2.4681159420289856e-06,
"loss": 0.2635,
"step": 26500
},
{
"epoch": 3.15,
"learning_rate": 2.4608695652173915e-06,
"loss": 0.2079,
"step": 26525
},
{
"epoch": 3.15,
"learning_rate": 2.4536231884057973e-06,
"loss": 0.2006,
"step": 26550
},
{
"epoch": 3.15,
"learning_rate": 2.446376811594203e-06,
"loss": 0.244,
"step": 26575
},
{
"epoch": 3.16,
"learning_rate": 2.439130434782609e-06,
"loss": 0.32,
"step": 26600
},
{
"epoch": 3.16,
"learning_rate": 2.4318840579710145e-06,
"loss": 0.1757,
"step": 26625
},
{
"epoch": 3.16,
"learning_rate": 2.4246376811594203e-06,
"loss": 0.151,
"step": 26650
},
{
"epoch": 3.17,
"learning_rate": 2.417391304347826e-06,
"loss": 0.1985,
"step": 26675
},
{
"epoch": 3.17,
"learning_rate": 2.410144927536232e-06,
"loss": 0.2241,
"step": 26700
},
{
"epoch": 3.17,
"learning_rate": 2.402898550724638e-06,
"loss": 0.1411,
"step": 26725
},
{
"epoch": 3.17,
"learning_rate": 2.3956521739130437e-06,
"loss": 0.2348,
"step": 26750
},
{
"epoch": 3.18,
"learning_rate": 2.3884057971014496e-06,
"loss": 0.2529,
"step": 26775
},
{
"epoch": 3.18,
"learning_rate": 2.3811594202898555e-06,
"loss": 0.1819,
"step": 26800
},
{
"epoch": 3.18,
"learning_rate": 2.3739130434782613e-06,
"loss": 0.2473,
"step": 26825
},
{
"epoch": 3.19,
"learning_rate": 2.3666666666666667e-06,
"loss": 0.2902,
"step": 26850
},
{
"epoch": 3.19,
"learning_rate": 2.3594202898550726e-06,
"loss": 0.1368,
"step": 26875
},
{
"epoch": 3.19,
"learning_rate": 2.3521739130434784e-06,
"loss": 0.2857,
"step": 26900
},
{
"epoch": 3.2,
"learning_rate": 2.3449275362318843e-06,
"loss": 0.1613,
"step": 26925
},
{
"epoch": 3.2,
"learning_rate": 2.33768115942029e-06,
"loss": 0.2573,
"step": 26950
},
{
"epoch": 3.2,
"learning_rate": 2.330434782608696e-06,
"loss": 0.2029,
"step": 26975
},
{
"epoch": 3.2,
"learning_rate": 2.3231884057971014e-06,
"loss": 0.2085,
"step": 27000
},
{
"epoch": 3.2,
"eval_cer": 6.811328643809336,
"eval_loss": 0.3984606862068176,
"eval_runtime": 3176.0872,
"eval_samples_per_second": 0.781,
"eval_steps_per_second": 0.391,
"eval_wer": 18.613302839717935,
"step": 27000
},
{
"epoch": 3.21,
"learning_rate": 2.3159420289855077e-06,
"loss": 0.235,
"step": 27025
},
{
"epoch": 3.21,
"learning_rate": 2.308695652173913e-06,
"loss": 0.1992,
"step": 27050
},
{
"epoch": 3.21,
"learning_rate": 2.301449275362319e-06,
"loss": 0.2457,
"step": 27075
},
{
"epoch": 3.22,
"learning_rate": 2.294202898550725e-06,
"loss": 0.1871,
"step": 27100
},
{
"epoch": 3.22,
"learning_rate": 2.2869565217391307e-06,
"loss": 0.1464,
"step": 27125
},
{
"epoch": 3.22,
"learning_rate": 2.279710144927536e-06,
"loss": 0.2012,
"step": 27150
},
{
"epoch": 3.22,
"learning_rate": 2.2724637681159424e-06,
"loss": 0.1757,
"step": 27175
},
{
"epoch": 3.23,
"learning_rate": 2.265217391304348e-06,
"loss": 0.1795,
"step": 27200
},
{
"epoch": 3.23,
"learning_rate": 2.2579710144927537e-06,
"loss": 0.1706,
"step": 27225
},
{
"epoch": 3.23,
"learning_rate": 2.2507246376811596e-06,
"loss": 0.2044,
"step": 27250
},
{
"epoch": 3.24,
"learning_rate": 2.2434782608695654e-06,
"loss": 0.2155,
"step": 27275
},
{
"epoch": 3.24,
"learning_rate": 2.2362318840579713e-06,
"loss": 0.1811,
"step": 27300
},
{
"epoch": 3.24,
"learning_rate": 2.228985507246377e-06,
"loss": 0.2311,
"step": 27325
},
{
"epoch": 3.25,
"learning_rate": 2.2217391304347825e-06,
"loss": 0.3311,
"step": 27350
},
{
"epoch": 3.25,
"learning_rate": 2.2144927536231884e-06,
"loss": 0.1692,
"step": 27375
},
{
"epoch": 3.25,
"learning_rate": 2.2072463768115943e-06,
"loss": 0.2069,
"step": 27400
},
{
"epoch": 3.25,
"learning_rate": 2.2e-06,
"loss": 0.1755,
"step": 27425
},
{
"epoch": 3.26,
"learning_rate": 2.192753623188406e-06,
"loss": 0.2029,
"step": 27450
},
{
"epoch": 3.26,
"learning_rate": 2.185507246376812e-06,
"loss": 0.2542,
"step": 27475
},
{
"epoch": 3.26,
"learning_rate": 2.1782608695652177e-06,
"loss": 0.1882,
"step": 27500
},
{
"epoch": 3.27,
"learning_rate": 2.1710144927536235e-06,
"loss": 0.2374,
"step": 27525
},
{
"epoch": 3.27,
"learning_rate": 2.1637681159420294e-06,
"loss": 0.1967,
"step": 27550
},
{
"epoch": 3.27,
"learning_rate": 2.156521739130435e-06,
"loss": 0.1869,
"step": 27575
},
{
"epoch": 3.28,
"learning_rate": 2.1492753623188407e-06,
"loss": 0.2861,
"step": 27600
},
{
"epoch": 3.28,
"learning_rate": 2.1420289855072465e-06,
"loss": 0.2392,
"step": 27625
},
{
"epoch": 3.28,
"learning_rate": 2.1347826086956524e-06,
"loss": 0.18,
"step": 27650
},
{
"epoch": 3.28,
"learning_rate": 2.1275362318840582e-06,
"loss": 0.2496,
"step": 27675
},
{
"epoch": 3.29,
"learning_rate": 2.120289855072464e-06,
"loss": 0.1998,
"step": 27700
},
{
"epoch": 3.29,
"learning_rate": 2.1130434782608695e-06,
"loss": 0.259,
"step": 27725
},
{
"epoch": 3.29,
"learning_rate": 2.105797101449276e-06,
"loss": 0.3129,
"step": 27750
},
{
"epoch": 3.3,
"learning_rate": 2.0985507246376812e-06,
"loss": 0.1907,
"step": 27775
},
{
"epoch": 3.3,
"learning_rate": 2.091304347826087e-06,
"loss": 0.1343,
"step": 27800
},
{
"epoch": 3.3,
"learning_rate": 2.084057971014493e-06,
"loss": 0.1973,
"step": 27825
},
{
"epoch": 3.3,
"learning_rate": 2.0768115942028988e-06,
"loss": 0.1658,
"step": 27850
},
{
"epoch": 3.31,
"learning_rate": 2.0695652173913046e-06,
"loss": 0.1508,
"step": 27875
},
{
"epoch": 3.31,
"learning_rate": 2.0623188405797105e-06,
"loss": 0.1947,
"step": 27900
},
{
"epoch": 3.31,
"learning_rate": 2.055072463768116e-06,
"loss": 0.1812,
"step": 27925
},
{
"epoch": 3.32,
"learning_rate": 2.0478260869565218e-06,
"loss": 0.2154,
"step": 27950
},
{
"epoch": 3.32,
"learning_rate": 2.0405797101449276e-06,
"loss": 0.1456,
"step": 27975
},
{
"epoch": 3.32,
"learning_rate": 2.0333333333333335e-06,
"loss": 0.2055,
"step": 28000
},
{
"epoch": 3.32,
"eval_cer": 6.862364110384181,
"eval_loss": 0.39950060844421387,
"eval_runtime": 3191.9428,
"eval_samples_per_second": 0.778,
"eval_steps_per_second": 0.389,
"eval_wer": 18.76119687440442,
"step": 28000
},
{
"epoch": 3.33,
"learning_rate": 2.0260869565217393e-06,
"loss": 0.1855,
"step": 28025
},
{
"epoch": 3.33,
"learning_rate": 2.018840579710145e-06,
"loss": 0.2535,
"step": 28050
},
{
"epoch": 3.33,
"learning_rate": 2.0115942028985506e-06,
"loss": 0.2101,
"step": 28075
},
{
"epoch": 3.33,
"learning_rate": 2.004347826086957e-06,
"loss": 0.2977,
"step": 28100
},
{
"epoch": 3.34,
"learning_rate": 1.9971014492753623e-06,
"loss": 0.1915,
"step": 28125
},
{
"epoch": 3.34,
"learning_rate": 1.989855072463768e-06,
"loss": 0.1589,
"step": 28150
},
{
"epoch": 3.34,
"learning_rate": 1.982608695652174e-06,
"loss": 0.175,
"step": 28175
},
{
"epoch": 3.35,
"learning_rate": 1.97536231884058e-06,
"loss": 0.2892,
"step": 28200
},
{
"epoch": 3.35,
"learning_rate": 1.9681159420289853e-06,
"loss": 0.223,
"step": 28225
},
{
"epoch": 3.35,
"learning_rate": 1.9608695652173916e-06,
"loss": 0.1731,
"step": 28250
},
{
"epoch": 3.36,
"learning_rate": 1.9536231884057975e-06,
"loss": 0.2097,
"step": 28275
},
{
"epoch": 3.36,
"learning_rate": 1.946376811594203e-06,
"loss": 0.1909,
"step": 28300
},
{
"epoch": 3.36,
"learning_rate": 1.939130434782609e-06,
"loss": 0.2079,
"step": 28325
},
{
"epoch": 3.36,
"learning_rate": 1.9318840579710146e-06,
"loss": 0.1848,
"step": 28350
},
{
"epoch": 3.37,
"learning_rate": 1.9246376811594205e-06,
"loss": 0.1813,
"step": 28375
},
{
"epoch": 3.37,
"learning_rate": 1.9173913043478263e-06,
"loss": 0.1679,
"step": 28400
},
{
"epoch": 3.37,
"learning_rate": 1.910144927536232e-06,
"loss": 0.1787,
"step": 28425
},
{
"epoch": 3.38,
"learning_rate": 1.9028985507246378e-06,
"loss": 0.1718,
"step": 28450
},
{
"epoch": 3.38,
"learning_rate": 1.8956521739130437e-06,
"loss": 0.2553,
"step": 28475
},
{
"epoch": 3.38,
"learning_rate": 1.8884057971014493e-06,
"loss": 0.2249,
"step": 28500
},
{
"epoch": 3.38,
"learning_rate": 1.8811594202898554e-06,
"loss": 0.1657,
"step": 28525
},
{
"epoch": 3.39,
"learning_rate": 1.873913043478261e-06,
"loss": 0.1738,
"step": 28550
},
{
"epoch": 3.39,
"learning_rate": 1.8666666666666669e-06,
"loss": 0.1935,
"step": 28575
},
{
"epoch": 3.39,
"learning_rate": 1.8594202898550725e-06,
"loss": 0.2179,
"step": 28600
},
{
"epoch": 3.4,
"learning_rate": 1.8521739130434786e-06,
"loss": 0.2696,
"step": 28625
},
{
"epoch": 3.4,
"learning_rate": 1.8449275362318842e-06,
"loss": 0.1657,
"step": 28650
},
{
"epoch": 3.4,
"learning_rate": 1.83768115942029e-06,
"loss": 0.2302,
"step": 28675
},
{
"epoch": 3.41,
"learning_rate": 1.8304347826086957e-06,
"loss": 0.2888,
"step": 28700
},
{
"epoch": 3.41,
"learning_rate": 1.8231884057971016e-06,
"loss": 0.193,
"step": 28725
},
{
"epoch": 3.41,
"learning_rate": 1.8159420289855072e-06,
"loss": 0.2122,
"step": 28750
},
{
"epoch": 3.41,
"learning_rate": 1.8086956521739133e-06,
"loss": 0.1602,
"step": 28775
},
{
"epoch": 3.42,
"learning_rate": 1.801449275362319e-06,
"loss": 0.2419,
"step": 28800
},
{
"epoch": 3.42,
"learning_rate": 1.7942028985507248e-06,
"loss": 0.4138,
"step": 28825
},
{
"epoch": 3.42,
"learning_rate": 1.7869565217391304e-06,
"loss": 0.2473,
"step": 28850
},
{
"epoch": 3.43,
"learning_rate": 1.7797101449275365e-06,
"loss": 0.1792,
"step": 28875
},
{
"epoch": 3.43,
"learning_rate": 1.7724637681159421e-06,
"loss": 0.1822,
"step": 28900
},
{
"epoch": 3.43,
"learning_rate": 1.765217391304348e-06,
"loss": 0.1505,
"step": 28925
},
{
"epoch": 3.44,
"learning_rate": 1.7579710144927536e-06,
"loss": 0.1418,
"step": 28950
},
{
"epoch": 3.44,
"learning_rate": 1.7507246376811595e-06,
"loss": 0.1262,
"step": 28975
},
{
"epoch": 3.44,
"learning_rate": 1.7434782608695653e-06,
"loss": 0.175,
"step": 29000
},
{
"epoch": 3.44,
"eval_cer": 6.772713857051503,
"eval_loss": 0.40093937516212463,
"eval_runtime": 3157.1944,
"eval_samples_per_second": 0.786,
"eval_steps_per_second": 0.393,
"eval_wer": 18.48141795311607,
"step": 29000
},
{
"epoch": 3.44,
"learning_rate": 1.7362318840579712e-06,
"loss": 0.2065,
"step": 29025
},
{
"epoch": 3.45,
"learning_rate": 1.7289855072463768e-06,
"loss": 0.1723,
"step": 29050
},
{
"epoch": 3.45,
"learning_rate": 1.7217391304347827e-06,
"loss": 0.1419,
"step": 29075
},
{
"epoch": 3.45,
"learning_rate": 1.7144927536231887e-06,
"loss": 0.2607,
"step": 29100
},
{
"epoch": 3.46,
"learning_rate": 1.7072463768115944e-06,
"loss": 0.1884,
"step": 29125
},
{
"epoch": 3.46,
"learning_rate": 1.7000000000000002e-06,
"loss": 0.1824,
"step": 29150
},
{
"epoch": 3.46,
"learning_rate": 1.6927536231884059e-06,
"loss": 0.1657,
"step": 29175
},
{
"epoch": 3.47,
"learning_rate": 1.685507246376812e-06,
"loss": 0.248,
"step": 29200
},
{
"epoch": 3.47,
"learning_rate": 1.6782608695652176e-06,
"loss": 0.2124,
"step": 29225
},
{
"epoch": 3.47,
"learning_rate": 1.6710144927536234e-06,
"loss": 0.1964,
"step": 29250
},
{
"epoch": 3.47,
"learning_rate": 1.663768115942029e-06,
"loss": 0.3202,
"step": 29275
},
{
"epoch": 3.48,
"learning_rate": 1.656521739130435e-06,
"loss": 0.194,
"step": 29300
},
{
"epoch": 3.48,
"learning_rate": 1.6492753623188406e-06,
"loss": 0.2738,
"step": 29325
},
{
"epoch": 3.48,
"learning_rate": 1.6420289855072467e-06,
"loss": 0.1667,
"step": 29350
},
{
"epoch": 3.49,
"learning_rate": 1.6347826086956523e-06,
"loss": 0.2819,
"step": 29375
},
{
"epoch": 3.49,
"learning_rate": 1.6275362318840581e-06,
"loss": 0.1894,
"step": 29400
},
{
"epoch": 3.49,
"learning_rate": 1.6202898550724638e-06,
"loss": 0.1791,
"step": 29425
},
{
"epoch": 3.49,
"learning_rate": 1.6130434782608699e-06,
"loss": 0.1853,
"step": 29450
},
{
"epoch": 3.5,
"learning_rate": 1.6057971014492755e-06,
"loss": 0.2618,
"step": 29475
},
{
"epoch": 3.5,
"learning_rate": 1.5985507246376814e-06,
"loss": 0.2052,
"step": 29500
},
{
"epoch": 3.5,
"learning_rate": 1.591304347826087e-06,
"loss": 0.2185,
"step": 29525
},
{
"epoch": 3.51,
"learning_rate": 1.5840579710144928e-06,
"loss": 0.1305,
"step": 29550
},
{
"epoch": 3.51,
"learning_rate": 1.5768115942028985e-06,
"loss": 0.233,
"step": 29575
},
{
"epoch": 3.51,
"learning_rate": 1.5695652173913046e-06,
"loss": 0.2164,
"step": 29600
},
{
"epoch": 3.52,
"learning_rate": 1.5623188405797102e-06,
"loss": 0.1524,
"step": 29625
},
{
"epoch": 3.52,
"learning_rate": 1.555072463768116e-06,
"loss": 0.1961,
"step": 29650
},
{
"epoch": 3.52,
"learning_rate": 1.5478260869565217e-06,
"loss": 0.2242,
"step": 29675
},
{
"epoch": 3.52,
"learning_rate": 1.5405797101449278e-06,
"loss": 0.1997,
"step": 29700
},
{
"epoch": 3.53,
"learning_rate": 1.5333333333333334e-06,
"loss": 0.2001,
"step": 29725
},
{
"epoch": 3.53,
"learning_rate": 1.5260869565217393e-06,
"loss": 0.1888,
"step": 29750
},
{
"epoch": 3.53,
"learning_rate": 1.518840579710145e-06,
"loss": 0.2124,
"step": 29775
},
{
"epoch": 3.54,
"learning_rate": 1.5115942028985508e-06,
"loss": 0.2145,
"step": 29800
},
{
"epoch": 3.54,
"learning_rate": 1.5043478260869566e-06,
"loss": 0.2512,
"step": 29825
},
{
"epoch": 3.54,
"learning_rate": 1.4971014492753625e-06,
"loss": 0.1625,
"step": 29850
},
{
"epoch": 3.55,
"learning_rate": 1.4898550724637683e-06,
"loss": 0.1556,
"step": 29875
},
{
"epoch": 3.55,
"learning_rate": 1.482608695652174e-06,
"loss": 0.2134,
"step": 29900
},
{
"epoch": 3.55,
"learning_rate": 1.47536231884058e-06,
"loss": 0.1959,
"step": 29925
},
{
"epoch": 3.55,
"learning_rate": 1.4681159420289857e-06,
"loss": 0.197,
"step": 29950
},
{
"epoch": 3.56,
"learning_rate": 1.4608695652173915e-06,
"loss": 0.1825,
"step": 29975
},
{
"epoch": 3.56,
"learning_rate": 1.4536231884057972e-06,
"loss": 0.1701,
"step": 30000
},
{
"epoch": 3.56,
"eval_cer": 7.013625854690344,
"eval_loss": 0.3998452425003052,
"eval_runtime": 3192.2868,
"eval_samples_per_second": 0.777,
"eval_steps_per_second": 0.389,
"eval_wer": 18.834381551362682,
"step": 30000
},
{
"epoch": 32.74,
"learning_rate": 1.446376811594203e-06,
"loss": 1.1855,
"step": 30025
},
{
"epoch": 32.77,
"learning_rate": 1.4391304347826089e-06,
"loss": 1.0754,
"step": 30050
},
{
"epoch": 32.8,
"learning_rate": 1.4318840579710147e-06,
"loss": 0.9609,
"step": 30075
},
{
"epoch": 32.82,
"learning_rate": 1.4246376811594204e-06,
"loss": 0.9363,
"step": 30100
},
{
"epoch": 32.85,
"learning_rate": 1.4173913043478262e-06,
"loss": 0.9573,
"step": 30125
},
{
"epoch": 32.88,
"learning_rate": 1.4101449275362319e-06,
"loss": 0.945,
"step": 30150
},
{
"epoch": 32.91,
"learning_rate": 1.402898550724638e-06,
"loss": 0.8939,
"step": 30175
},
{
"epoch": 32.93,
"learning_rate": 1.3956521739130436e-06,
"loss": 0.9062,
"step": 30200
},
{
"epoch": 32.96,
"learning_rate": 1.3884057971014494e-06,
"loss": 0.9019,
"step": 30225
},
{
"epoch": 32.99,
"learning_rate": 1.381159420289855e-06,
"loss": 0.8691,
"step": 30250
},
{
"epoch": 33.02,
"learning_rate": 1.3739130434782611e-06,
"loss": 0.8198,
"step": 30275
},
{
"epoch": 33.04,
"learning_rate": 1.3666666666666668e-06,
"loss": 0.8642,
"step": 30300
},
{
"epoch": 33.07,
"learning_rate": 1.3594202898550726e-06,
"loss": 0.8705,
"step": 30325
},
{
"epoch": 33.1,
"learning_rate": 1.3521739130434783e-06,
"loss": 0.7469,
"step": 30350
},
{
"epoch": 33.12,
"learning_rate": 1.3449275362318841e-06,
"loss": 0.7704,
"step": 30375
},
{
"epoch": 33.15,
"learning_rate": 1.3376811594202898e-06,
"loss": 0.8126,
"step": 30400
},
{
"epoch": 33.18,
"learning_rate": 1.3304347826086958e-06,
"loss": 0.8152,
"step": 30425
},
{
"epoch": 33.21,
"learning_rate": 1.3231884057971015e-06,
"loss": 0.7214,
"step": 30450
},
{
"epoch": 33.23,
"learning_rate": 1.3159420289855073e-06,
"loss": 0.8131,
"step": 30475
},
{
"epoch": 33.26,
"learning_rate": 1.308695652173913e-06,
"loss": 0.7234,
"step": 30500
},
{
"epoch": 33.29,
"learning_rate": 1.301449275362319e-06,
"loss": 0.7552,
"step": 30525
},
{
"epoch": 33.32,
"learning_rate": 1.2942028985507247e-06,
"loss": 0.7036,
"step": 30550
},
{
"epoch": 33.34,
"learning_rate": 1.2869565217391305e-06,
"loss": 0.7777,
"step": 30575
},
{
"epoch": 33.37,
"learning_rate": 1.2797101449275362e-06,
"loss": 0.6986,
"step": 30600
},
{
"epoch": 33.4,
"learning_rate": 1.272463768115942e-06,
"loss": 0.7156,
"step": 30625
},
{
"epoch": 33.42,
"learning_rate": 1.265217391304348e-06,
"loss": 0.7919,
"step": 30650
},
{
"epoch": 33.45,
"learning_rate": 1.2579710144927537e-06,
"loss": 0.6559,
"step": 30675
},
{
"epoch": 33.48,
"learning_rate": 1.2507246376811596e-06,
"loss": 0.6646,
"step": 30700
},
{
"epoch": 33.51,
"learning_rate": 1.2434782608695652e-06,
"loss": 0.6952,
"step": 30725
},
{
"epoch": 33.53,
"learning_rate": 1.236231884057971e-06,
"loss": 0.7332,
"step": 30750
},
{
"epoch": 33.56,
"learning_rate": 1.228985507246377e-06,
"loss": 0.7673,
"step": 30775
},
{
"epoch": 33.59,
"learning_rate": 1.2217391304347826e-06,
"loss": 0.7079,
"step": 30800
},
{
"epoch": 33.62,
"learning_rate": 1.2144927536231884e-06,
"loss": 0.7293,
"step": 30825
},
{
"epoch": 33.64,
"learning_rate": 1.2072463768115943e-06,
"loss": 0.6716,
"step": 30850
},
{
"epoch": 33.67,
"learning_rate": 1.2000000000000002e-06,
"loss": 0.7037,
"step": 30875
},
{
"epoch": 33.7,
"learning_rate": 1.1927536231884058e-06,
"loss": 0.7235,
"step": 30900
},
{
"epoch": 33.72,
"learning_rate": 1.1855072463768117e-06,
"loss": 0.638,
"step": 30925
},
{
"epoch": 33.75,
"learning_rate": 1.1782608695652175e-06,
"loss": 0.7433,
"step": 30950
},
{
"epoch": 33.78,
"learning_rate": 1.1710144927536232e-06,
"loss": 0.7318,
"step": 30975
},
{
"epoch": 33.81,
"learning_rate": 1.163768115942029e-06,
"loss": 0.6832,
"step": 31000
},
{
"epoch": 33.81,
"eval_cer": 7.850853989513844,
"eval_loss": 0.542524516582489,
"eval_runtime": 3197.0599,
"eval_samples_per_second": 0.677,
"eval_steps_per_second": 0.17,
"eval_wer": 24.621636222704176,
"step": 31000
},
{
"epoch": 33.83,
"learning_rate": 1.1565217391304349e-06,
"loss": 0.673,
"step": 31025
},
{
"epoch": 33.86,
"learning_rate": 1.1492753623188407e-06,
"loss": 0.6608,
"step": 31050
},
{
"epoch": 33.89,
"learning_rate": 1.1420289855072466e-06,
"loss": 0.6553,
"step": 31075
},
{
"epoch": 33.91,
"learning_rate": 1.1347826086956524e-06,
"loss": 0.6837,
"step": 31100
},
{
"epoch": 33.94,
"learning_rate": 1.127536231884058e-06,
"loss": 0.6683,
"step": 31125
},
{
"epoch": 33.97,
"learning_rate": 1.120289855072464e-06,
"loss": 0.7043,
"step": 31150
},
{
"epoch": 34.0,
"learning_rate": 1.1130434782608698e-06,
"loss": 0.647,
"step": 31175
},
{
"epoch": 34.02,
"learning_rate": 1.1057971014492754e-06,
"loss": 0.691,
"step": 31200
},
{
"epoch": 34.05,
"learning_rate": 1.0985507246376813e-06,
"loss": 0.6857,
"step": 31225
},
{
"epoch": 34.08,
"learning_rate": 1.0913043478260871e-06,
"loss": 0.5965,
"step": 31250
},
{
"epoch": 34.11,
"learning_rate": 1.0840579710144928e-06,
"loss": 0.6514,
"step": 31275
},
{
"epoch": 34.13,
"learning_rate": 1.0768115942028986e-06,
"loss": 0.5753,
"step": 31300
},
{
"epoch": 34.16,
"learning_rate": 1.0695652173913045e-06,
"loss": 0.6485,
"step": 31325
},
{
"epoch": 34.19,
"learning_rate": 1.0623188405797103e-06,
"loss": 0.6007,
"step": 31350
},
{
"epoch": 34.21,
"learning_rate": 1.055072463768116e-06,
"loss": 0.5861,
"step": 31375
},
{
"epoch": 34.24,
"learning_rate": 1.0478260869565218e-06,
"loss": 0.6009,
"step": 31400
},
{
"epoch": 34.27,
"learning_rate": 1.0405797101449277e-06,
"loss": 0.5646,
"step": 31425
},
{
"epoch": 34.3,
"learning_rate": 1.0333333333333333e-06,
"loss": 0.5896,
"step": 31450
},
{
"epoch": 34.32,
"learning_rate": 1.0260869565217392e-06,
"loss": 0.6017,
"step": 31475
},
{
"epoch": 34.35,
"learning_rate": 1.018840579710145e-06,
"loss": 0.6172,
"step": 31500
},
{
"epoch": 34.38,
"learning_rate": 1.0115942028985509e-06,
"loss": 0.5782,
"step": 31525
},
{
"epoch": 34.41,
"learning_rate": 1.0043478260869565e-06,
"loss": 0.6157,
"step": 31550
},
{
"epoch": 34.43,
"learning_rate": 9.971014492753624e-07,
"loss": 0.6407,
"step": 31575
},
{
"epoch": 34.46,
"learning_rate": 9.898550724637682e-07,
"loss": 0.646,
"step": 31600
},
{
"epoch": 34.49,
"learning_rate": 9.826086956521739e-07,
"loss": 0.5987,
"step": 31625
},
{
"epoch": 34.51,
"learning_rate": 9.753623188405797e-07,
"loss": 0.5978,
"step": 31650
},
{
"epoch": 34.54,
"learning_rate": 9.681159420289856e-07,
"loss": 0.6151,
"step": 31675
},
{
"epoch": 34.57,
"learning_rate": 9.608695652173912e-07,
"loss": 0.6037,
"step": 31700
},
{
"epoch": 34.6,
"learning_rate": 9.536231884057971e-07,
"loss": 0.5898,
"step": 31725
},
{
"epoch": 34.62,
"learning_rate": 9.463768115942029e-07,
"loss": 0.5873,
"step": 31750
},
{
"epoch": 34.65,
"learning_rate": 9.391304347826087e-07,
"loss": 0.6409,
"step": 31775
},
{
"epoch": 34.68,
"learning_rate": 9.318840579710145e-07,
"loss": 0.6163,
"step": 31800
},
{
"epoch": 34.71,
"learning_rate": 9.246376811594204e-07,
"loss": 0.549,
"step": 31825
},
{
"epoch": 34.73,
"learning_rate": 9.173913043478262e-07,
"loss": 0.5967,
"step": 31850
},
{
"epoch": 34.76,
"learning_rate": 9.10144927536232e-07,
"loss": 0.5369,
"step": 31875
},
{
"epoch": 34.79,
"learning_rate": 9.028985507246379e-07,
"loss": 0.5848,
"step": 31900
},
{
"epoch": 34.81,
"learning_rate": 8.956521739130436e-07,
"loss": 0.569,
"step": 31925
},
{
"epoch": 34.84,
"learning_rate": 8.884057971014493e-07,
"loss": 0.5782,
"step": 31950
},
{
"epoch": 34.87,
"learning_rate": 8.811594202898552e-07,
"loss": 0.5425,
"step": 31975
},
{
"epoch": 34.9,
"learning_rate": 8.73913043478261e-07,
"loss": 0.5676,
"step": 32000
},
{
"epoch": 34.9,
"eval_cer": 7.377586234087609,
"eval_loss": 0.5141463875770569,
"eval_runtime": 3170.6638,
"eval_samples_per_second": 0.683,
"eval_steps_per_second": 0.171,
"eval_wer": 23.67895647544257,
"step": 32000
},
{
"epoch": 34.92,
"learning_rate": 8.666666666666668e-07,
"loss": 0.5505,
"step": 32025
},
{
"epoch": 34.95,
"learning_rate": 8.594202898550726e-07,
"loss": 0.5515,
"step": 32050
},
{
"epoch": 34.98,
"learning_rate": 8.521739130434783e-07,
"loss": 0.5501,
"step": 32075
},
{
"epoch": 35.01,
"learning_rate": 8.449275362318842e-07,
"loss": 0.5561,
"step": 32100
},
{
"epoch": 35.03,
"learning_rate": 8.376811594202899e-07,
"loss": 0.5846,
"step": 32125
},
{
"epoch": 35.06,
"learning_rate": 8.304347826086958e-07,
"loss": 0.5215,
"step": 32150
},
{
"epoch": 35.09,
"learning_rate": 8.231884057971015e-07,
"loss": 0.5006,
"step": 32175
},
{
"epoch": 35.11,
"learning_rate": 8.159420289855074e-07,
"loss": 0.5434,
"step": 32200
},
{
"epoch": 35.14,
"learning_rate": 8.086956521739131e-07,
"loss": 0.5447,
"step": 32225
},
{
"epoch": 35.17,
"learning_rate": 8.014492753623189e-07,
"loss": 0.5672,
"step": 32250
},
{
"epoch": 35.2,
"learning_rate": 7.942028985507247e-07,
"loss": 0.5617,
"step": 32275
},
{
"epoch": 35.22,
"learning_rate": 7.869565217391305e-07,
"loss": 0.5237,
"step": 32300
},
{
"epoch": 35.25,
"learning_rate": 7.797101449275363e-07,
"loss": 0.6142,
"step": 32325
},
{
"epoch": 35.28,
"learning_rate": 7.724637681159421e-07,
"loss": 0.5075,
"step": 32350
},
{
"epoch": 35.31,
"learning_rate": 7.652173913043478e-07,
"loss": 0.5431,
"step": 32375
},
{
"epoch": 35.33,
"learning_rate": 7.579710144927537e-07,
"loss": 0.4816,
"step": 32400
},
{
"epoch": 35.36,
"learning_rate": 7.507246376811594e-07,
"loss": 0.5244,
"step": 32425
},
{
"epoch": 35.39,
"learning_rate": 7.434782608695653e-07,
"loss": 0.5152,
"step": 32450
},
{
"epoch": 35.41,
"learning_rate": 7.36231884057971e-07,
"loss": 0.5653,
"step": 32475
},
{
"epoch": 35.44,
"learning_rate": 7.289855072463769e-07,
"loss": 0.4795,
"step": 32500
},
{
"epoch": 35.47,
"learning_rate": 7.217391304347826e-07,
"loss": 0.5132,
"step": 32525
},
{
"epoch": 35.5,
"learning_rate": 7.144927536231884e-07,
"loss": 0.5668,
"step": 32550
},
{
"epoch": 35.52,
"learning_rate": 7.072463768115942e-07,
"loss": 0.5509,
"step": 32575
},
{
"epoch": 35.55,
"learning_rate": 7.000000000000001e-07,
"loss": 0.532,
"step": 32600
},
{
"epoch": 35.58,
"learning_rate": 6.927536231884059e-07,
"loss": 0.5321,
"step": 32625
},
{
"epoch": 35.61,
"learning_rate": 6.855072463768117e-07,
"loss": 0.5079,
"step": 32650
},
{
"epoch": 35.63,
"learning_rate": 6.782608695652175e-07,
"loss": 0.5015,
"step": 32675
},
{
"epoch": 35.66,
"learning_rate": 6.710144927536233e-07,
"loss": 0.5693,
"step": 32700
},
{
"epoch": 35.69,
"learning_rate": 6.637681159420291e-07,
"loss": 0.5046,
"step": 32725
},
{
"epoch": 35.71,
"learning_rate": 6.565217391304349e-07,
"loss": 0.5433,
"step": 32750
},
{
"epoch": 35.74,
"learning_rate": 6.492753623188406e-07,
"loss": 0.5056,
"step": 32775
},
{
"epoch": 35.77,
"learning_rate": 6.420289855072465e-07,
"loss": 0.5413,
"step": 32800
},
{
"epoch": 35.8,
"learning_rate": 6.347826086956522e-07,
"loss": 0.5512,
"step": 32825
},
{
"epoch": 35.82,
"learning_rate": 6.275362318840581e-07,
"loss": 0.5224,
"step": 32850
},
{
"epoch": 35.85,
"learning_rate": 6.202898550724638e-07,
"loss": 0.4961,
"step": 32875
},
{
"epoch": 35.88,
"learning_rate": 6.130434782608696e-07,
"loss": 0.5242,
"step": 32900
},
{
"epoch": 35.91,
"learning_rate": 6.057971014492754e-07,
"loss": 0.471,
"step": 32925
},
{
"epoch": 35.93,
"learning_rate": 5.985507246376812e-07,
"loss": 0.547,
"step": 32950
},
{
"epoch": 35.96,
"learning_rate": 5.91304347826087e-07,
"loss": 0.5817,
"step": 32975
},
{
"epoch": 35.99,
"learning_rate": 5.840579710144928e-07,
"loss": 0.4863,
"step": 33000
},
{
"epoch": 35.99,
"eval_cer": 7.244107809276393,
"eval_loss": 0.5002937316894531,
"eval_runtime": 3172.2622,
"eval_samples_per_second": 0.683,
"eval_steps_per_second": 0.171,
"eval_wer": 23.0541571080715,
"step": 33000
},
{
"epoch": 36.01,
"learning_rate": 5.768115942028985e-07,
"loss": 0.4949,
"step": 33025
},
{
"epoch": 36.04,
"learning_rate": 5.695652173913044e-07,
"loss": 0.4664,
"step": 33050
},
{
"epoch": 36.07,
"learning_rate": 5.623188405797101e-07,
"loss": 0.4838,
"step": 33075
},
{
"epoch": 36.1,
"learning_rate": 5.55072463768116e-07,
"loss": 0.4896,
"step": 33100
},
{
"epoch": 36.12,
"learning_rate": 5.478260869565217e-07,
"loss": 0.5072,
"step": 33125
},
{
"epoch": 36.15,
"learning_rate": 5.405797101449276e-07,
"loss": 0.4928,
"step": 33150
},
{
"epoch": 36.18,
"learning_rate": 5.333333333333335e-07,
"loss": 0.5154,
"step": 33175
},
{
"epoch": 36.21,
"learning_rate": 5.260869565217392e-07,
"loss": 0.5093,
"step": 33200
},
{
"epoch": 36.23,
"learning_rate": 5.188405797101449e-07,
"loss": 0.4988,
"step": 33225
},
{
"epoch": 36.26,
"learning_rate": 5.115942028985508e-07,
"loss": 0.4689,
"step": 33250
},
{
"epoch": 36.29,
"learning_rate": 5.043478260869565e-07,
"loss": 0.5219,
"step": 33275
},
{
"epoch": 36.31,
"learning_rate": 4.971014492753624e-07,
"loss": 0.4721,
"step": 33300
},
{
"epoch": 36.34,
"learning_rate": 4.898550724637682e-07,
"loss": 0.5071,
"step": 33325
},
{
"epoch": 36.37,
"learning_rate": 4.82608695652174e-07,
"loss": 0.5119,
"step": 33350
},
{
"epoch": 36.4,
"learning_rate": 4.7536231884057975e-07,
"loss": 0.4618,
"step": 33375
},
{
"epoch": 36.42,
"learning_rate": 4.6811594202898556e-07,
"loss": 0.4778,
"step": 33400
},
{
"epoch": 36.45,
"learning_rate": 4.6086956521739136e-07,
"loss": 0.5451,
"step": 33425
},
{
"epoch": 36.48,
"learning_rate": 4.536231884057971e-07,
"loss": 0.4701,
"step": 33450
},
{
"epoch": 36.5,
"learning_rate": 4.463768115942029e-07,
"loss": 0.4444,
"step": 33475
},
{
"epoch": 36.53,
"learning_rate": 4.391304347826087e-07,
"loss": 0.4971,
"step": 33500
},
{
"epoch": 36.56,
"learning_rate": 4.318840579710145e-07,
"loss": 0.5379,
"step": 33525
},
{
"epoch": 36.59,
"learning_rate": 4.246376811594203e-07,
"loss": 0.4883,
"step": 33550
},
{
"epoch": 36.61,
"learning_rate": 4.1739130434782616e-07,
"loss": 0.5602,
"step": 33575
},
{
"epoch": 36.64,
"learning_rate": 4.1014492753623197e-07,
"loss": 0.4486,
"step": 33600
},
{
"epoch": 36.67,
"learning_rate": 4.028985507246377e-07,
"loss": 0.4654,
"step": 33625
},
{
"epoch": 36.7,
"learning_rate": 3.956521739130435e-07,
"loss": 0.4993,
"step": 33650
},
{
"epoch": 36.72,
"learning_rate": 3.884057971014493e-07,
"loss": 0.4552,
"step": 33675
},
{
"epoch": 36.75,
"learning_rate": 3.811594202898551e-07,
"loss": 0.5494,
"step": 33700
},
{
"epoch": 36.78,
"learning_rate": 3.739130434782609e-07,
"loss": 0.5392,
"step": 33725
},
{
"epoch": 36.8,
"learning_rate": 3.666666666666667e-07,
"loss": 0.4993,
"step": 33750
},
{
"epoch": 36.83,
"learning_rate": 3.5942028985507247e-07,
"loss": 0.4896,
"step": 33775
},
{
"epoch": 36.86,
"learning_rate": 3.5217391304347827e-07,
"loss": 0.4804,
"step": 33800
},
{
"epoch": 36.89,
"learning_rate": 3.4492753623188407e-07,
"loss": 0.5006,
"step": 33825
},
{
"epoch": 36.91,
"learning_rate": 3.3768115942028987e-07,
"loss": 0.4965,
"step": 33850
},
{
"epoch": 36.94,
"learning_rate": 3.304347826086957e-07,
"loss": 0.5459,
"step": 33875
},
{
"epoch": 36.97,
"learning_rate": 3.231884057971015e-07,
"loss": 0.4653,
"step": 33900
},
{
"epoch": 37.0,
"learning_rate": 3.159420289855072e-07,
"loss": 0.5432,
"step": 33925
},
{
"epoch": 37.02,
"learning_rate": 3.086956521739131e-07,
"loss": 0.5017,
"step": 33950
},
{
"epoch": 37.05,
"learning_rate": 3.014492753623189e-07,
"loss": 0.473,
"step": 33975
},
{
"epoch": 37.08,
"learning_rate": 2.942028985507247e-07,
"loss": 0.5007,
"step": 34000
},
{
"epoch": 37.08,
"eval_cer": 7.154500918291419,
"eval_loss": 0.4948059916496277,
"eval_runtime": 3148.2863,
"eval_samples_per_second": 0.688,
"eval_steps_per_second": 0.172,
"eval_wer": 22.92340335575199,
"step": 34000
},
{
"epoch": 37.1,
"learning_rate": 2.8695652173913043e-07,
"loss": 0.4543,
"step": 34025
},
{
"epoch": 37.13,
"learning_rate": 2.7971014492753623e-07,
"loss": 0.483,
"step": 34050
},
{
"epoch": 37.16,
"learning_rate": 2.724637681159421e-07,
"loss": 0.5062,
"step": 34075
},
{
"epoch": 37.19,
"learning_rate": 2.6521739130434783e-07,
"loss": 0.4614,
"step": 34100
},
{
"epoch": 37.21,
"learning_rate": 2.5797101449275363e-07,
"loss": 0.4805,
"step": 34125
},
{
"epoch": 37.24,
"learning_rate": 2.5072463768115944e-07,
"loss": 0.4723,
"step": 34150
},
{
"epoch": 37.27,
"learning_rate": 2.4347826086956524e-07,
"loss": 0.4788,
"step": 34175
},
{
"epoch": 37.3,
"learning_rate": 2.3623188405797104e-07,
"loss": 0.4736,
"step": 34200
},
{
"epoch": 37.32,
"learning_rate": 2.289855072463768e-07,
"loss": 0.4979,
"step": 34225
},
{
"epoch": 37.35,
"learning_rate": 2.2173913043478261e-07,
"loss": 0.4598,
"step": 34250
},
{
"epoch": 37.38,
"learning_rate": 2.1449275362318844e-07,
"loss": 0.4501,
"step": 34275
},
{
"epoch": 37.4,
"learning_rate": 2.0724637681159422e-07,
"loss": 0.4515,
"step": 34300
},
{
"epoch": 37.43,
"learning_rate": 2.0000000000000002e-07,
"loss": 0.4789,
"step": 34325
},
{
"epoch": 37.46,
"learning_rate": 1.9275362318840582e-07,
"loss": 0.4697,
"step": 34350
},
{
"epoch": 37.49,
"learning_rate": 1.855072463768116e-07,
"loss": 0.468,
"step": 34375
},
{
"epoch": 37.51,
"learning_rate": 1.782608695652174e-07,
"loss": 0.4904,
"step": 34400
},
{
"epoch": 37.54,
"learning_rate": 1.710144927536232e-07,
"loss": 0.4827,
"step": 34425
},
{
"epoch": 37.57,
"learning_rate": 1.6376811594202902e-07,
"loss": 0.4441,
"step": 34450
},
{
"epoch": 37.6,
"learning_rate": 1.565217391304348e-07,
"loss": 0.4665,
"step": 34475
},
{
"epoch": 37.62,
"learning_rate": 1.492753623188406e-07,
"loss": 0.4904,
"step": 34500
},
{
"epoch": 37.65,
"learning_rate": 1.420289855072464e-07,
"loss": 0.4366,
"step": 34525
},
{
"epoch": 37.68,
"learning_rate": 1.3478260869565218e-07,
"loss": 0.5191,
"step": 34550
},
{
"epoch": 37.7,
"learning_rate": 1.2753623188405798e-07,
"loss": 0.4901,
"step": 34575
},
{
"epoch": 37.73,
"learning_rate": 1.2028985507246378e-07,
"loss": 0.5176,
"step": 34600
},
{
"epoch": 37.76,
"learning_rate": 1.1304347826086958e-07,
"loss": 0.4337,
"step": 34625
},
{
"epoch": 37.79,
"learning_rate": 1.0579710144927537e-07,
"loss": 0.4485,
"step": 34650
},
{
"epoch": 37.81,
"learning_rate": 9.855072463768116e-08,
"loss": 0.5057,
"step": 34675
},
{
"epoch": 37.84,
"learning_rate": 9.130434782608697e-08,
"loss": 0.4539,
"step": 34700
},
{
"epoch": 37.87,
"learning_rate": 8.405797101449276e-08,
"loss": 0.4845,
"step": 34725
},
{
"epoch": 37.9,
"learning_rate": 7.681159420289856e-08,
"loss": 0.4679,
"step": 34750
},
{
"epoch": 37.92,
"learning_rate": 6.956521739130436e-08,
"loss": 0.5126,
"step": 34775
},
{
"epoch": 37.95,
"learning_rate": 6.231884057971015e-08,
"loss": 0.5234,
"step": 34800
},
{
"epoch": 37.98,
"learning_rate": 5.507246376811595e-08,
"loss": 0.4573,
"step": 34825
},
{
"epoch": 38.0,
"learning_rate": 4.782608695652174e-08,
"loss": 0.4481,
"step": 34850
},
{
"epoch": 38.03,
"learning_rate": 4.057971014492754e-08,
"loss": 0.4473,
"step": 34875
},
{
"epoch": 38.06,
"learning_rate": 3.333333333333334e-08,
"loss": 0.4978,
"step": 34900
},
{
"epoch": 38.09,
"learning_rate": 2.6086956521739135e-08,
"loss": 0.4456,
"step": 34925
},
{
"epoch": 38.11,
"learning_rate": 1.884057971014493e-08,
"loss": 0.47,
"step": 34950
},
{
"epoch": 38.14,
"learning_rate": 1.1594202898550725e-08,
"loss": 0.4272,
"step": 34975
},
{
"epoch": 38.17,
"learning_rate": 4.3478260869565225e-09,
"loss": 0.4519,
"step": 35000
},
{
"epoch": 38.17,
"eval_cer": 7.125683342150651,
"eval_loss": 0.49221470952033997,
"eval_runtime": 3147.7575,
"eval_samples_per_second": 0.688,
"eval_steps_per_second": 0.172,
"eval_wer": 22.824750824061823,
"step": 35000
},
{
"epoch": 38.2,
"learning_rate": 2.244943820224719e-06,
"loss": 0.5112,
"step": 35025
},
{
"epoch": 38.22,
"learning_rate": 2.2393258426966294e-06,
"loss": 0.4629,
"step": 35050
},
{
"epoch": 38.25,
"learning_rate": 2.2337078651685396e-06,
"loss": 0.4797,
"step": 35075
},
{
"epoch": 38.28,
"learning_rate": 2.22808988764045e-06,
"loss": 0.4799,
"step": 35100
},
{
"epoch": 38.3,
"learning_rate": 2.22247191011236e-06,
"loss": 0.4919,
"step": 35125
},
{
"epoch": 38.33,
"learning_rate": 2.21685393258427e-06,
"loss": 0.4669,
"step": 35150
},
{
"epoch": 38.36,
"learning_rate": 2.21123595505618e-06,
"loss": 0.4348,
"step": 35175
},
{
"epoch": 38.39,
"learning_rate": 2.20561797752809e-06,
"loss": 0.5559,
"step": 35200
},
{
"epoch": 38.41,
"learning_rate": 2.2e-06,
"loss": 0.4651,
"step": 35225
},
{
"epoch": 38.44,
"learning_rate": 2.1943820224719103e-06,
"loss": 0.4023,
"step": 35250
},
{
"epoch": 38.47,
"learning_rate": 2.1887640449438206e-06,
"loss": 0.4687,
"step": 35275
},
{
"epoch": 38.5,
"learning_rate": 2.183146067415731e-06,
"loss": 0.4999,
"step": 35300
},
{
"epoch": 38.52,
"learning_rate": 2.1775280898876406e-06,
"loss": 0.431,
"step": 35325
},
{
"epoch": 38.55,
"learning_rate": 2.171910112359551e-06,
"loss": 0.4887,
"step": 35350
},
{
"epoch": 38.58,
"learning_rate": 2.1662921348314606e-06,
"loss": 0.4401,
"step": 35375
},
{
"epoch": 38.6,
"learning_rate": 2.160674157303371e-06,
"loss": 0.4975,
"step": 35400
},
{
"epoch": 38.63,
"learning_rate": 2.155056179775281e-06,
"loss": 0.4447,
"step": 35425
},
{
"epoch": 38.66,
"learning_rate": 2.1494382022471913e-06,
"loss": 0.5491,
"step": 35450
},
{
"epoch": 38.69,
"learning_rate": 2.143820224719101e-06,
"loss": 0.4185,
"step": 35475
},
{
"epoch": 38.71,
"learning_rate": 2.1382022471910113e-06,
"loss": 0.4195,
"step": 35500
},
{
"epoch": 38.74,
"learning_rate": 2.1325842696629216e-06,
"loss": 0.5616,
"step": 35525
},
{
"epoch": 38.77,
"learning_rate": 2.126966292134832e-06,
"loss": 0.4316,
"step": 35550
},
{
"epoch": 38.79,
"learning_rate": 2.1213483146067416e-06,
"loss": 0.4601,
"step": 35575
},
{
"epoch": 38.82,
"learning_rate": 2.1159550561797753e-06,
"loss": 0.4268,
"step": 35600
},
{
"epoch": 38.85,
"learning_rate": 2.1103370786516855e-06,
"loss": 0.4646,
"step": 35625
},
{
"epoch": 38.88,
"learning_rate": 2.1047191011235957e-06,
"loss": 0.4052,
"step": 35650
},
{
"epoch": 38.9,
"learning_rate": 2.099101123595506e-06,
"loss": 0.4437,
"step": 35675
},
{
"epoch": 38.93,
"learning_rate": 2.0934831460674158e-06,
"loss": 0.4204,
"step": 35700
},
{
"epoch": 38.96,
"learning_rate": 2.087865168539326e-06,
"loss": 0.4344,
"step": 35725
},
{
"epoch": 38.99,
"learning_rate": 2.082247191011236e-06,
"loss": 0.5028,
"step": 35750
},
{
"epoch": 39.01,
"learning_rate": 2.076629213483146e-06,
"loss": 0.3716,
"step": 35775
},
{
"epoch": 39.04,
"learning_rate": 2.0710112359550563e-06,
"loss": 0.4251,
"step": 35800
},
{
"epoch": 39.07,
"learning_rate": 2.0653932584269665e-06,
"loss": 0.4155,
"step": 35825
},
{
"epoch": 39.09,
"learning_rate": 2.0597752808988767e-06,
"loss": 0.4249,
"step": 35850
},
{
"epoch": 39.12,
"learning_rate": 2.054157303370787e-06,
"loss": 0.3721,
"step": 35875
},
{
"epoch": 39.15,
"learning_rate": 2.0485393258426968e-06,
"loss": 0.4026,
"step": 35900
},
{
"epoch": 39.18,
"learning_rate": 2.042921348314607e-06,
"loss": 0.4425,
"step": 35925
},
{
"epoch": 39.2,
"learning_rate": 2.037303370786517e-06,
"loss": 0.399,
"step": 35950
},
{
"epoch": 39.23,
"learning_rate": 2.031685393258427e-06,
"loss": 0.4291,
"step": 35975
},
{
"epoch": 39.26,
"learning_rate": 2.0260674157303372e-06,
"loss": 0.3674,
"step": 36000
},
{
"epoch": 39.26,
"eval_cer": 7.010413037587582,
"eval_loss": 0.47536423802375793,
"eval_runtime": 3145.4396,
"eval_samples_per_second": 0.689,
"eval_steps_per_second": 0.172,
"eval_wer": 22.664244720915118,
"step": 36000
},
{
"epoch": 39.29,
"learning_rate": 2.0204494382022475e-06,
"loss": 0.3957,
"step": 36025
},
{
"epoch": 39.31,
"learning_rate": 2.0148314606741577e-06,
"loss": 0.3944,
"step": 36050
},
{
"epoch": 39.34,
"learning_rate": 2.0092134831460675e-06,
"loss": 0.4103,
"step": 36075
},
{
"epoch": 39.37,
"learning_rate": 2.0035955056179777e-06,
"loss": 0.3942,
"step": 36100
},
{
"epoch": 39.39,
"learning_rate": 1.997977528089888e-06,
"loss": 0.426,
"step": 36125
},
{
"epoch": 39.42,
"learning_rate": 1.9923595505617978e-06,
"loss": 0.3685,
"step": 36150
},
{
"epoch": 39.45,
"learning_rate": 1.986741573033708e-06,
"loss": 0.4251,
"step": 36175
},
{
"epoch": 39.48,
"learning_rate": 1.9811235955056182e-06,
"loss": 0.3852,
"step": 36200
},
{
"epoch": 39.5,
"learning_rate": 1.9755056179775285e-06,
"loss": 0.3743,
"step": 36225
},
{
"epoch": 39.53,
"learning_rate": 1.9698876404494383e-06,
"loss": 0.4061,
"step": 36250
},
{
"epoch": 39.56,
"learning_rate": 1.9642696629213485e-06,
"loss": 0.4062,
"step": 36275
},
{
"epoch": 39.59,
"learning_rate": 1.9586516853932587e-06,
"loss": 0.3523,
"step": 36300
},
{
"epoch": 39.61,
"learning_rate": 1.9530337078651685e-06,
"loss": 0.4023,
"step": 36325
},
{
"epoch": 39.64,
"learning_rate": 1.9474157303370787e-06,
"loss": 0.3799,
"step": 36350
},
{
"epoch": 39.67,
"learning_rate": 1.941797752808989e-06,
"loss": 0.3439,
"step": 36375
},
{
"epoch": 39.69,
"learning_rate": 1.9361797752808988e-06,
"loss": 0.4106,
"step": 36400
},
{
"epoch": 39.72,
"learning_rate": 1.930561797752809e-06,
"loss": 0.407,
"step": 36425
},
{
"epoch": 39.75,
"learning_rate": 1.9249438202247192e-06,
"loss": 0.3814,
"step": 36450
},
{
"epoch": 39.78,
"learning_rate": 1.9193258426966295e-06,
"loss": 0.3561,
"step": 36475
},
{
"epoch": 39.8,
"learning_rate": 1.9137078651685397e-06,
"loss": 0.3886,
"step": 36500
},
{
"epoch": 39.83,
"learning_rate": 1.9080898876404495e-06,
"loss": 0.3777,
"step": 36525
},
{
"epoch": 39.86,
"learning_rate": 1.9024719101123597e-06,
"loss": 0.39,
"step": 36550
},
{
"epoch": 39.89,
"learning_rate": 1.8968539325842697e-06,
"loss": 0.3945,
"step": 36575
},
{
"epoch": 39.91,
"learning_rate": 1.8912359550561798e-06,
"loss": 0.3531,
"step": 36600
},
{
"epoch": 39.94,
"learning_rate": 1.88561797752809e-06,
"loss": 0.4433,
"step": 36625
},
{
"epoch": 39.97,
"learning_rate": 1.8800000000000002e-06,
"loss": 0.4188,
"step": 36650
},
{
"epoch": 39.99,
"learning_rate": 1.8743820224719102e-06,
"loss": 0.3897,
"step": 36675
},
{
"epoch": 40.02,
"learning_rate": 1.8687640449438205e-06,
"loss": 0.3282,
"step": 36700
},
{
"epoch": 40.05,
"learning_rate": 1.8631460674157307e-06,
"loss": 0.341,
"step": 36725
},
{
"epoch": 40.08,
"learning_rate": 1.8575280898876405e-06,
"loss": 0.3239,
"step": 36750
},
{
"epoch": 40.1,
"learning_rate": 1.8519101123595507e-06,
"loss": 0.3518,
"step": 36775
},
{
"epoch": 40.13,
"learning_rate": 1.8462921348314607e-06,
"loss": 0.3387,
"step": 36800
},
{
"epoch": 40.16,
"learning_rate": 1.840674157303371e-06,
"loss": 0.3201,
"step": 36825
},
{
"epoch": 40.19,
"learning_rate": 1.8350561797752812e-06,
"loss": 0.3128,
"step": 36850
},
{
"epoch": 40.21,
"learning_rate": 1.8294382022471912e-06,
"loss": 0.3749,
"step": 36875
},
{
"epoch": 40.24,
"learning_rate": 1.8238202247191012e-06,
"loss": 0.3756,
"step": 36900
},
{
"epoch": 40.27,
"learning_rate": 1.8182022471910112e-06,
"loss": 0.3545,
"step": 36925
},
{
"epoch": 40.29,
"learning_rate": 1.8125842696629215e-06,
"loss": 0.3746,
"step": 36950
},
{
"epoch": 40.32,
"learning_rate": 1.8069662921348317e-06,
"loss": 0.3308,
"step": 36975
},
{
"epoch": 40.35,
"learning_rate": 1.8013483146067417e-06,
"loss": 0.3481,
"step": 37000
},
{
"epoch": 40.35,
"eval_cer": 7.031058465270519,
"eval_loss": 0.46790996193885803,
"eval_runtime": 3161.6657,
"eval_samples_per_second": 0.685,
"eval_steps_per_second": 0.171,
"eval_wer": 22.631360543685062,
"step": 37000
},
{
"epoch": 40.38,
"learning_rate": 1.795730337078652e-06,
"loss": 0.3225,
"step": 37025
},
{
"epoch": 40.4,
"learning_rate": 1.7901123595505622e-06,
"loss": 0.299,
"step": 37050
},
{
"epoch": 40.43,
"learning_rate": 1.784494382022472e-06,
"loss": 0.3152,
"step": 37075
},
{
"epoch": 40.46,
"learning_rate": 1.778876404494382e-06,
"loss": 0.3268,
"step": 37100
},
{
"epoch": 40.49,
"learning_rate": 1.7732584269662922e-06,
"loss": 0.3411,
"step": 37125
},
{
"epoch": 40.51,
"learning_rate": 1.7676404494382024e-06,
"loss": 0.3846,
"step": 37150
},
{
"epoch": 40.54,
"learning_rate": 1.7620224719101125e-06,
"loss": 0.3168,
"step": 37175
},
{
"epoch": 40.57,
"learning_rate": 1.7564044943820227e-06,
"loss": 0.3377,
"step": 37200
},
{
"epoch": 40.59,
"learning_rate": 1.750786516853933e-06,
"loss": 0.3618,
"step": 37225
},
{
"epoch": 40.62,
"learning_rate": 1.7451685393258427e-06,
"loss": 0.3215,
"step": 37250
},
{
"epoch": 40.65,
"learning_rate": 1.739550561797753e-06,
"loss": 0.3859,
"step": 37275
},
{
"epoch": 40.68,
"learning_rate": 1.733932584269663e-06,
"loss": 0.3484,
"step": 37300
},
{
"epoch": 40.7,
"learning_rate": 1.7283146067415732e-06,
"loss": 0.375,
"step": 37325
},
{
"epoch": 40.73,
"learning_rate": 1.7226966292134834e-06,
"loss": 0.327,
"step": 37350
},
{
"epoch": 40.76,
"learning_rate": 1.7170786516853934e-06,
"loss": 0.2798,
"step": 37375
},
{
"epoch": 40.79,
"learning_rate": 1.7114606741573035e-06,
"loss": 0.3273,
"step": 37400
},
{
"epoch": 40.81,
"learning_rate": 1.7058426966292135e-06,
"loss": 0.3762,
"step": 37425
},
{
"epoch": 40.84,
"learning_rate": 1.7002247191011237e-06,
"loss": 0.2886,
"step": 37450
},
{
"epoch": 40.87,
"learning_rate": 1.6948314606741576e-06,
"loss": 0.3368,
"step": 37475
},
{
"epoch": 40.89,
"learning_rate": 1.6892134831460674e-06,
"loss": 0.3812,
"step": 37500
},
{
"epoch": 40.92,
"learning_rate": 1.6835955056179776e-06,
"loss": 0.3301,
"step": 37525
},
{
"epoch": 40.95,
"learning_rate": 1.6779775280898876e-06,
"loss": 0.3193,
"step": 37550
},
{
"epoch": 40.98,
"learning_rate": 1.6723595505617979e-06,
"loss": 0.3263,
"step": 37575
},
{
"epoch": 41.0,
"learning_rate": 1.666741573033708e-06,
"loss": 0.3422,
"step": 37600
},
{
"epoch": 41.03,
"learning_rate": 1.6611235955056181e-06,
"loss": 0.3138,
"step": 37625
},
{
"epoch": 41.06,
"learning_rate": 1.6555056179775283e-06,
"loss": 0.2919,
"step": 37650
},
{
"epoch": 41.09,
"learning_rate": 1.6498876404494381e-06,
"loss": 0.2828,
"step": 37675
},
{
"epoch": 41.11,
"learning_rate": 1.6442696629213484e-06,
"loss": 0.2607,
"step": 37700
},
{
"epoch": 41.14,
"learning_rate": 1.6386516853932586e-06,
"loss": 0.2524,
"step": 37725
},
{
"epoch": 41.17,
"learning_rate": 1.6330337078651686e-06,
"loss": 0.3627,
"step": 37750
},
{
"epoch": 41.19,
"learning_rate": 1.6274157303370788e-06,
"loss": 0.2641,
"step": 37775
},
{
"epoch": 41.22,
"learning_rate": 1.621797752808989e-06,
"loss": 0.2859,
"step": 37800
},
{
"epoch": 41.25,
"learning_rate": 1.616179775280899e-06,
"loss": 0.277,
"step": 37825
},
{
"epoch": 41.28,
"learning_rate": 1.610561797752809e-06,
"loss": 0.2923,
"step": 37850
},
{
"epoch": 41.3,
"learning_rate": 1.6049438202247191e-06,
"loss": 0.3439,
"step": 37875
},
{
"epoch": 41.33,
"learning_rate": 1.5993258426966293e-06,
"loss": 0.2374,
"step": 37900
},
{
"epoch": 41.36,
"learning_rate": 1.5937078651685396e-06,
"loss": 0.3332,
"step": 37925
},
{
"epoch": 41.38,
"learning_rate": 1.5880898876404496e-06,
"loss": 0.2999,
"step": 37950
},
{
"epoch": 41.41,
"learning_rate": 1.5824719101123598e-06,
"loss": 0.3052,
"step": 37975
},
{
"epoch": 41.44,
"learning_rate": 1.5768539325842696e-06,
"loss": 0.2992,
"step": 38000
},
{
"epoch": 41.44,
"eval_cer": 6.946469560180704,
"eval_loss": 0.4622255265712738,
"eval_runtime": 3167.1342,
"eval_samples_per_second": 0.684,
"eval_steps_per_second": 0.171,
"eval_wer": 22.25945615834514,
"step": 38000
},
{
"epoch": 41.47,
"learning_rate": 1.5712359550561799e-06,
"loss": 0.2935,
"step": 38025
},
{
"epoch": 41.49,
"learning_rate": 1.5656179775280899e-06,
"loss": 0.3086,
"step": 38050
},
{
"epoch": 41.52,
"learning_rate": 1.56e-06,
"loss": 0.301,
"step": 38075
},
{
"epoch": 41.55,
"learning_rate": 1.5543820224719103e-06,
"loss": 0.2848,
"step": 38100
},
{
"epoch": 41.58,
"learning_rate": 1.5487640449438203e-06,
"loss": 0.2642,
"step": 38125
},
{
"epoch": 41.6,
"learning_rate": 1.5431460674157306e-06,
"loss": 0.3192,
"step": 38150
},
{
"epoch": 41.63,
"learning_rate": 1.5375280898876404e-06,
"loss": 0.2712,
"step": 38175
},
{
"epoch": 41.66,
"learning_rate": 1.5319101123595506e-06,
"loss": 0.2649,
"step": 38200
},
{
"epoch": 41.68,
"learning_rate": 1.5262921348314608e-06,
"loss": 0.2872,
"step": 38225
},
{
"epoch": 41.71,
"learning_rate": 1.5206741573033708e-06,
"loss": 0.3132,
"step": 38250
},
{
"epoch": 41.74,
"learning_rate": 1.515056179775281e-06,
"loss": 0.2831,
"step": 38275
},
{
"epoch": 41.77,
"learning_rate": 1.5094382022471913e-06,
"loss": 0.2998,
"step": 38300
},
{
"epoch": 41.79,
"learning_rate": 1.5038202247191013e-06,
"loss": 0.3153,
"step": 38325
},
{
"epoch": 41.82,
"learning_rate": 1.4982022471910113e-06,
"loss": 0.2693,
"step": 38350
},
{
"epoch": 41.85,
"learning_rate": 1.4925842696629214e-06,
"loss": 0.3361,
"step": 38375
},
{
"epoch": 41.88,
"learning_rate": 1.4869662921348316e-06,
"loss": 0.3173,
"step": 38400
},
{
"epoch": 41.9,
"learning_rate": 1.4813483146067418e-06,
"loss": 0.2723,
"step": 38425
},
{
"epoch": 41.93,
"learning_rate": 1.4757303370786518e-06,
"loss": 0.3004,
"step": 38450
},
{
"epoch": 41.96,
"learning_rate": 1.470112359550562e-06,
"loss": 0.3207,
"step": 38475
},
{
"epoch": 41.98,
"learning_rate": 1.4644943820224719e-06,
"loss": 0.2761,
"step": 38500
},
{
"epoch": 42.01,
"learning_rate": 1.458876404494382e-06,
"loss": 0.3081,
"step": 38525
},
{
"epoch": 42.04,
"learning_rate": 1.4532584269662923e-06,
"loss": 0.2535,
"step": 38550
},
{
"epoch": 42.07,
"learning_rate": 1.4476404494382023e-06,
"loss": 0.2461,
"step": 38575
},
{
"epoch": 42.09,
"learning_rate": 1.4420224719101126e-06,
"loss": 0.2822,
"step": 38600
},
{
"epoch": 42.12,
"learning_rate": 1.4364044943820226e-06,
"loss": 0.2379,
"step": 38625
},
{
"epoch": 42.15,
"learning_rate": 1.4307865168539328e-06,
"loss": 0.2468,
"step": 38650
},
{
"epoch": 42.18,
"learning_rate": 1.4251685393258426e-06,
"loss": 0.2701,
"step": 38675
},
{
"epoch": 42.2,
"learning_rate": 1.4195505617977528e-06,
"loss": 0.258,
"step": 38700
},
{
"epoch": 42.23,
"learning_rate": 1.413932584269663e-06,
"loss": 0.2449,
"step": 38725
},
{
"epoch": 42.26,
"learning_rate": 1.408314606741573e-06,
"loss": 0.2615,
"step": 38750
},
{
"epoch": 42.28,
"learning_rate": 1.4026966292134833e-06,
"loss": 0.2735,
"step": 38775
},
{
"epoch": 42.31,
"learning_rate": 1.3970786516853935e-06,
"loss": 0.2429,
"step": 38800
},
{
"epoch": 42.34,
"learning_rate": 1.3914606741573033e-06,
"loss": 0.2835,
"step": 38825
},
{
"epoch": 42.37,
"learning_rate": 1.3858426966292136e-06,
"loss": 0.2713,
"step": 38850
},
{
"epoch": 42.39,
"learning_rate": 1.3802247191011236e-06,
"loss": 0.2523,
"step": 38875
},
{
"epoch": 42.42,
"learning_rate": 1.3746067415730338e-06,
"loss": 0.3313,
"step": 38900
},
{
"epoch": 42.45,
"learning_rate": 1.368988764044944e-06,
"loss": 0.243,
"step": 38925
},
{
"epoch": 42.48,
"learning_rate": 1.363370786516854e-06,
"loss": 0.2526,
"step": 38950
},
{
"epoch": 42.5,
"learning_rate": 1.3577528089887643e-06,
"loss": 0.2498,
"step": 38975
},
{
"epoch": 42.53,
"learning_rate": 1.352134831460674e-06,
"loss": 0.2505,
"step": 39000
},
{
"epoch": 42.53,
"eval_cer": 6.9198025494235775,
"eval_loss": 0.4640973210334778,
"eval_runtime": 3164.4611,
"eval_samples_per_second": 0.684,
"eval_steps_per_second": 0.171,
"eval_wer": 22.19368780388503,
"step": 39000
},
{
"epoch": 42.56,
"learning_rate": 1.3465168539325843e-06,
"loss": 0.2524,
"step": 39025
},
{
"epoch": 42.58,
"learning_rate": 1.3408988764044945e-06,
"loss": 0.2544,
"step": 39050
},
{
"epoch": 42.61,
"learning_rate": 1.3352808988764046e-06,
"loss": 0.2662,
"step": 39075
},
{
"epoch": 42.64,
"learning_rate": 1.3296629213483148e-06,
"loss": 0.2585,
"step": 39100
},
{
"epoch": 42.67,
"learning_rate": 1.324044943820225e-06,
"loss": 0.2696,
"step": 39125
},
{
"epoch": 42.69,
"learning_rate": 1.318426966292135e-06,
"loss": 0.2485,
"step": 39150
},
{
"epoch": 42.72,
"learning_rate": 1.312808988764045e-06,
"loss": 0.2799,
"step": 39175
},
{
"epoch": 42.75,
"learning_rate": 1.307191011235955e-06,
"loss": 0.2432,
"step": 39200
},
{
"epoch": 42.78,
"learning_rate": 1.3015730337078653e-06,
"loss": 0.2511,
"step": 39225
},
{
"epoch": 42.8,
"learning_rate": 1.2959550561797753e-06,
"loss": 0.3178,
"step": 39250
},
{
"epoch": 42.83,
"learning_rate": 1.2903370786516855e-06,
"loss": 0.2375,
"step": 39275
},
{
"epoch": 42.86,
"learning_rate": 1.2847191011235958e-06,
"loss": 0.2477,
"step": 39300
},
{
"epoch": 42.88,
"learning_rate": 1.2791011235955056e-06,
"loss": 0.2577,
"step": 39325
},
{
"epoch": 42.91,
"learning_rate": 1.2734831460674158e-06,
"loss": 0.2973,
"step": 39350
},
{
"epoch": 42.94,
"learning_rate": 1.2678651685393258e-06,
"loss": 0.3231,
"step": 39375
},
{
"epoch": 42.97,
"learning_rate": 1.262247191011236e-06,
"loss": 0.2593,
"step": 39400
},
{
"epoch": 42.99,
"learning_rate": 1.2566292134831463e-06,
"loss": 0.2557,
"step": 39425
},
{
"epoch": 43.02,
"learning_rate": 1.2510112359550563e-06,
"loss": 0.248,
"step": 39450
},
{
"epoch": 43.05,
"learning_rate": 1.2453932584269663e-06,
"loss": 0.2346,
"step": 39475
},
{
"epoch": 43.08,
"learning_rate": 1.2397752808988765e-06,
"loss": 0.2541,
"step": 39500
},
{
"epoch": 43.1,
"learning_rate": 1.2341573033707868e-06,
"loss": 0.2447,
"step": 39525
},
{
"epoch": 43.13,
"learning_rate": 1.2285393258426968e-06,
"loss": 0.2534,
"step": 39550
},
{
"epoch": 43.16,
"learning_rate": 1.2229213483146068e-06,
"loss": 0.2688,
"step": 39575
},
{
"epoch": 43.18,
"learning_rate": 1.217303370786517e-06,
"loss": 0.2358,
"step": 39600
},
{
"epoch": 43.21,
"learning_rate": 1.211685393258427e-06,
"loss": 0.2607,
"step": 39625
},
{
"epoch": 43.24,
"learning_rate": 1.2060674157303373e-06,
"loss": 0.2362,
"step": 39650
},
{
"epoch": 43.27,
"learning_rate": 1.2004494382022473e-06,
"loss": 0.2014,
"step": 39675
},
{
"epoch": 43.29,
"learning_rate": 1.1948314606741573e-06,
"loss": 0.243,
"step": 39700
},
{
"epoch": 43.32,
"learning_rate": 1.1892134831460675e-06,
"loss": 0.2331,
"step": 39725
},
{
"epoch": 43.35,
"learning_rate": 1.1835955056179778e-06,
"loss": 0.2281,
"step": 39750
},
{
"epoch": 43.38,
"learning_rate": 1.1779775280898878e-06,
"loss": 0.2671,
"step": 39775
},
{
"epoch": 43.4,
"learning_rate": 1.1723595505617978e-06,
"loss": 0.2365,
"step": 39800
},
{
"epoch": 43.43,
"learning_rate": 1.166741573033708e-06,
"loss": 0.2356,
"step": 39825
},
{
"epoch": 43.46,
"learning_rate": 1.161123595505618e-06,
"loss": 0.2366,
"step": 39850
},
{
"epoch": 43.48,
"learning_rate": 1.155505617977528e-06,
"loss": 0.2345,
"step": 39875
},
{
"epoch": 43.51,
"learning_rate": 1.1498876404494383e-06,
"loss": 0.2239,
"step": 39900
},
{
"epoch": 43.54,
"learning_rate": 1.1442696629213485e-06,
"loss": 0.2391,
"step": 39925
},
{
"epoch": 43.57,
"learning_rate": 1.1386516853932585e-06,
"loss": 0.2517,
"step": 39950
},
{
"epoch": 43.59,
"learning_rate": 1.1330337078651685e-06,
"loss": 0.2091,
"step": 39975
},
{
"epoch": 43.62,
"learning_rate": 1.1274157303370788e-06,
"loss": 0.2477,
"step": 40000
},
{
"epoch": 43.62,
"eval_cer": 7.2008097595524525,
"eval_loss": 0.46780213713645935,
"eval_runtime": 3174.0364,
"eval_samples_per_second": 0.682,
"eval_steps_per_second": 0.171,
"eval_wer": 22.827882650464684,
"step": 40000
},
{
"epoch": 43.65,
"learning_rate": 1.121797752808989e-06,
"loss": 0.2545,
"step": 40025
},
{
"epoch": 43.68,
"learning_rate": 1.116179775280899e-06,
"loss": 0.2254,
"step": 40050
},
{
"epoch": 43.7,
"learning_rate": 1.110561797752809e-06,
"loss": 0.2051,
"step": 40075
},
{
"epoch": 43.73,
"learning_rate": 1.1049438202247193e-06,
"loss": 0.2168,
"step": 40100
},
{
"epoch": 43.76,
"learning_rate": 1.0993258426966293e-06,
"loss": 0.2304,
"step": 40125
},
{
"epoch": 43.78,
"learning_rate": 1.0937078651685395e-06,
"loss": 0.2346,
"step": 40150
},
{
"epoch": 43.81,
"learning_rate": 1.0880898876404495e-06,
"loss": 0.2231,
"step": 40175
},
{
"epoch": 43.84,
"learning_rate": 1.0824719101123595e-06,
"loss": 0.2233,
"step": 40200
},
{
"epoch": 43.87,
"learning_rate": 1.0768539325842698e-06,
"loss": 0.2394,
"step": 40225
},
{
"epoch": 43.89,
"learning_rate": 1.07123595505618e-06,
"loss": 0.2243,
"step": 40250
},
{
"epoch": 43.92,
"learning_rate": 1.06561797752809e-06,
"loss": 0.2352,
"step": 40275
},
{
"epoch": 43.95,
"learning_rate": 1.06e-06,
"loss": 0.2776,
"step": 40300
},
{
"epoch": 43.97,
"learning_rate": 1.0543820224719102e-06,
"loss": 0.2271,
"step": 40325
},
{
"epoch": 44.0,
"learning_rate": 1.0487640449438203e-06,
"loss": 0.2344,
"step": 40350
},
{
"epoch": 44.03,
"learning_rate": 1.0431460674157303e-06,
"loss": 0.1906,
"step": 40375
},
{
"epoch": 44.06,
"learning_rate": 1.0375280898876405e-06,
"loss": 0.2142,
"step": 40400
},
{
"epoch": 44.08,
"learning_rate": 1.0319101123595507e-06,
"loss": 0.1885,
"step": 40425
},
{
"epoch": 44.11,
"learning_rate": 1.0262921348314607e-06,
"loss": 0.2192,
"step": 40450
},
{
"epoch": 44.14,
"learning_rate": 1.0206741573033708e-06,
"loss": 0.2242,
"step": 40475
},
{
"epoch": 44.17,
"learning_rate": 1.015056179775281e-06,
"loss": 0.2627,
"step": 40500
},
{
"epoch": 44.19,
"learning_rate": 1.0094382022471912e-06,
"loss": 0.1955,
"step": 40525
},
{
"epoch": 44.22,
"learning_rate": 1.0038202247191012e-06,
"loss": 0.2384,
"step": 40550
},
{
"epoch": 44.25,
"learning_rate": 9.982022471910113e-07,
"loss": 0.2457,
"step": 40575
},
{
"epoch": 44.27,
"learning_rate": 9.925842696629215e-07,
"loss": 0.1971,
"step": 40600
},
{
"epoch": 44.3,
"learning_rate": 9.869662921348315e-07,
"loss": 0.2013,
"step": 40625
},
{
"epoch": 44.33,
"learning_rate": 9.813483146067417e-07,
"loss": 0.203,
"step": 40650
},
{
"epoch": 44.36,
"learning_rate": 9.757303370786517e-07,
"loss": 0.2259,
"step": 40675
},
{
"epoch": 44.38,
"learning_rate": 9.701123595505618e-07,
"loss": 0.201,
"step": 40700
},
{
"epoch": 44.41,
"learning_rate": 9.64494382022472e-07,
"loss": 0.2531,
"step": 40725
},
{
"epoch": 44.44,
"learning_rate": 9.588764044943822e-07,
"loss": 0.1835,
"step": 40750
},
{
"epoch": 44.47,
"learning_rate": 9.532584269662921e-07,
"loss": 0.2384,
"step": 40775
},
{
"epoch": 44.49,
"learning_rate": 9.476404494382022e-07,
"loss": 0.2023,
"step": 40800
},
{
"epoch": 44.52,
"learning_rate": 9.420224719101125e-07,
"loss": 0.2448,
"step": 40825
},
{
"epoch": 44.55,
"learning_rate": 9.364044943820226e-07,
"loss": 0.2104,
"step": 40850
},
{
"epoch": 44.57,
"learning_rate": 9.307865168539326e-07,
"loss": 0.2211,
"step": 40875
},
{
"epoch": 44.6,
"learning_rate": 9.251685393258427e-07,
"loss": 0.2498,
"step": 40900
},
{
"epoch": 44.63,
"learning_rate": 9.19550561797753e-07,
"loss": 0.2139,
"step": 40925
},
{
"epoch": 44.66,
"learning_rate": 9.13932584269663e-07,
"loss": 0.2349,
"step": 40950
},
{
"epoch": 44.68,
"learning_rate": 9.083146067415731e-07,
"loss": 0.2201,
"step": 40975
},
{
"epoch": 44.71,
"learning_rate": 9.026966292134832e-07,
"loss": 0.1994,
"step": 41000
},
{
"epoch": 44.71,
"eval_cer": 7.11794130676955,
"eval_loss": 0.46892717480659485,
"eval_runtime": 3141.0329,
"eval_samples_per_second": 0.69,
"eval_steps_per_second": 0.173,
"eval_wer": 22.380814431456063,
"step": 41000
},
{
"epoch": 44.74,
"learning_rate": 8.970786516853932e-07,
"loss": 0.1841,
"step": 41025
},
{
"epoch": 44.77,
"learning_rate": 8.914606741573035e-07,
"loss": 0.204,
"step": 41050
},
{
"epoch": 44.79,
"learning_rate": 8.858426966292136e-07,
"loss": 0.2144,
"step": 41075
},
{
"epoch": 44.82,
"learning_rate": 8.802247191011237e-07,
"loss": 0.2586,
"step": 41100
},
{
"epoch": 44.85,
"learning_rate": 8.746067415730337e-07,
"loss": 0.219,
"step": 41125
},
{
"epoch": 44.87,
"learning_rate": 8.689887640449439e-07,
"loss": 0.2091,
"step": 41150
},
{
"epoch": 44.9,
"learning_rate": 8.633707865168541e-07,
"loss": 0.1841,
"step": 41175
},
{
"epoch": 44.93,
"learning_rate": 8.577528089887641e-07,
"loss": 0.202,
"step": 41200
},
{
"epoch": 44.96,
"learning_rate": 8.521348314606742e-07,
"loss": 0.2057,
"step": 41225
},
{
"epoch": 44.98,
"learning_rate": 8.465168539325843e-07,
"loss": 0.2353,
"step": 41250
},
{
"epoch": 45.01,
"learning_rate": 8.408988764044944e-07,
"loss": 0.181,
"step": 41275
},
{
"epoch": 45.04,
"learning_rate": 8.352808988764046e-07,
"loss": 0.2289,
"step": 41300
},
{
"epoch": 45.07,
"learning_rate": 8.296629213483147e-07,
"loss": 0.2127,
"step": 41325
},
{
"epoch": 45.09,
"learning_rate": 8.240449438202248e-07,
"loss": 0.2119,
"step": 41350
},
{
"epoch": 45.12,
"learning_rate": 8.184269662921348e-07,
"loss": 0.2223,
"step": 41375
},
{
"epoch": 45.15,
"learning_rate": 8.12808988764045e-07,
"loss": 0.2207,
"step": 41400
},
{
"epoch": 45.17,
"learning_rate": 8.071910112359552e-07,
"loss": 0.213,
"step": 41425
},
{
"epoch": 45.2,
"learning_rate": 8.015730337078652e-07,
"loss": 0.2092,
"step": 41450
},
{
"epoch": 45.23,
"learning_rate": 7.959550561797753e-07,
"loss": 0.1926,
"step": 41475
},
{
"epoch": 45.26,
"learning_rate": 7.903370786516855e-07,
"loss": 0.2111,
"step": 41500
},
{
"epoch": 45.28,
"learning_rate": 7.847191011235955e-07,
"loss": 0.1974,
"step": 41525
},
{
"epoch": 45.31,
"learning_rate": 7.791011235955057e-07,
"loss": 0.1944,
"step": 41550
},
{
"epoch": 45.34,
"learning_rate": 7.734831460674158e-07,
"loss": 0.159,
"step": 41575
},
{
"epoch": 45.37,
"learning_rate": 7.678651685393259e-07,
"loss": 0.2071,
"step": 41600
},
{
"epoch": 45.39,
"learning_rate": 7.62247191011236e-07,
"loss": 0.2017,
"step": 41625
},
{
"epoch": 45.42,
"learning_rate": 7.566292134831462e-07,
"loss": 0.2139,
"step": 41650
},
{
"epoch": 45.45,
"learning_rate": 7.510112359550563e-07,
"loss": 0.1659,
"step": 41675
},
{
"epoch": 45.47,
"learning_rate": 7.453932584269663e-07,
"loss": 0.2089,
"step": 41700
},
{
"epoch": 45.5,
"learning_rate": 7.397752808988764e-07,
"loss": 0.1634,
"step": 41725
},
{
"epoch": 45.53,
"learning_rate": 7.341573033707866e-07,
"loss": 0.2303,
"step": 41750
},
{
"epoch": 45.56,
"learning_rate": 7.285393258426966e-07,
"loss": 0.2094,
"step": 41775
},
{
"epoch": 45.58,
"learning_rate": 7.229213483146068e-07,
"loss": 0.1817,
"step": 41800
},
{
"epoch": 45.61,
"learning_rate": 7.173033707865169e-07,
"loss": 0.1848,
"step": 41825
},
{
"epoch": 45.64,
"learning_rate": 7.116853932584271e-07,
"loss": 0.1971,
"step": 41850
},
{
"epoch": 45.67,
"learning_rate": 7.060674157303371e-07,
"loss": 0.2081,
"step": 41875
},
{
"epoch": 45.69,
"learning_rate": 7.004494382022473e-07,
"loss": 0.2245,
"step": 41900
},
{
"epoch": 45.72,
"learning_rate": 6.948314606741574e-07,
"loss": 0.1896,
"step": 41925
},
{
"epoch": 45.75,
"learning_rate": 6.892134831460674e-07,
"loss": 0.2193,
"step": 41950
},
{
"epoch": 45.77,
"learning_rate": 6.835955056179776e-07,
"loss": 0.1998,
"step": 41975
},
{
"epoch": 45.8,
"learning_rate": 6.779775280898877e-07,
"loss": 0.1865,
"step": 42000
},
{
"epoch": 45.8,
"eval_cer": 7.135145829838664,
"eval_loss": 0.47173011302948,
"eval_runtime": 3187.2,
"eval_samples_per_second": 0.68,
"eval_steps_per_second": 0.17,
"eval_wer": 22.566375145825667,
"step": 42000
},
{
"epoch": 45.83,
"learning_rate": 6.723595505617977e-07,
"loss": 0.2185,
"step": 42025
},
{
"epoch": 45.86,
"learning_rate": 6.667415730337079e-07,
"loss": 0.2142,
"step": 42050
},
{
"epoch": 45.88,
"learning_rate": 6.61123595505618e-07,
"loss": 0.203,
"step": 42075
},
{
"epoch": 45.91,
"learning_rate": 6.555056179775282e-07,
"loss": 0.1912,
"step": 42100
},
{
"epoch": 45.94,
"learning_rate": 6.498876404494382e-07,
"loss": 0.1853,
"step": 42125
},
{
"epoch": 45.97,
"learning_rate": 6.442696629213484e-07,
"loss": 0.2056,
"step": 42150
},
{
"epoch": 45.99,
"learning_rate": 6.386516853932585e-07,
"loss": 0.1564,
"step": 42175
},
{
"epoch": 46.02,
"learning_rate": 6.330337078651686e-07,
"loss": 0.1701,
"step": 42200
},
{
"epoch": 46.05,
"learning_rate": 6.274157303370787e-07,
"loss": 0.2156,
"step": 42225
},
{
"epoch": 46.07,
"learning_rate": 6.217977528089888e-07,
"loss": 0.1844,
"step": 42250
},
{
"epoch": 46.1,
"learning_rate": 6.161797752808989e-07,
"loss": 0.1641,
"step": 42275
},
{
"epoch": 46.13,
"learning_rate": 6.10561797752809e-07,
"loss": 0.1754,
"step": 42300
},
{
"epoch": 46.16,
"learning_rate": 6.049438202247192e-07,
"loss": 0.1857,
"step": 42325
},
{
"epoch": 46.18,
"learning_rate": 5.993258426966293e-07,
"loss": 0.159,
"step": 42350
},
{
"epoch": 46.21,
"learning_rate": 5.937078651685393e-07,
"loss": 0.2097,
"step": 42375
},
{
"epoch": 46.24,
"learning_rate": 5.880898876404495e-07,
"loss": 0.1941,
"step": 42400
},
{
"epoch": 46.26,
"learning_rate": 5.824719101123595e-07,
"loss": 0.1817,
"step": 42425
},
{
"epoch": 46.29,
"learning_rate": 5.768539325842698e-07,
"loss": 0.2022,
"step": 42450
},
{
"epoch": 46.32,
"learning_rate": 5.712359550561798e-07,
"loss": 0.1958,
"step": 42475
},
{
"epoch": 46.35,
"learning_rate": 5.656179775280899e-07,
"loss": 0.176,
"step": 42500
},
{
"epoch": 46.37,
"learning_rate": 5.6e-07,
"loss": 0.2181,
"step": 42525
},
{
"epoch": 46.4,
"learning_rate": 5.543820224719102e-07,
"loss": 0.2047,
"step": 42550
},
{
"epoch": 46.43,
"learning_rate": 5.487640449438203e-07,
"loss": 0.1942,
"step": 42575
},
{
"epoch": 46.46,
"learning_rate": 5.431460674157304e-07,
"loss": 0.1655,
"step": 42600
},
{
"epoch": 46.48,
"learning_rate": 5.375280898876404e-07,
"loss": 0.1958,
"step": 42625
},
{
"epoch": 46.51,
"learning_rate": 5.319101123595506e-07,
"loss": 0.2192,
"step": 42650
},
{
"epoch": 46.54,
"learning_rate": 5.262921348314607e-07,
"loss": 0.1425,
"step": 42675
},
{
"epoch": 46.56,
"learning_rate": 5.206741573033709e-07,
"loss": 0.1848,
"step": 42700
},
{
"epoch": 46.59,
"learning_rate": 5.150561797752809e-07,
"loss": 0.1621,
"step": 42725
},
{
"epoch": 46.62,
"learning_rate": 5.09438202247191e-07,
"loss": 0.177,
"step": 42750
},
{
"epoch": 46.65,
"learning_rate": 5.038202247191012e-07,
"loss": 0.1937,
"step": 42775
},
{
"epoch": 46.67,
"learning_rate": 4.982022471910113e-07,
"loss": 0.175,
"step": 42800
},
{
"epoch": 46.7,
"learning_rate": 4.925842696629214e-07,
"loss": 0.1738,
"step": 42825
},
{
"epoch": 46.73,
"learning_rate": 4.869662921348315e-07,
"loss": 0.1732,
"step": 42850
},
{
"epoch": 46.76,
"learning_rate": 4.813483146067415e-07,
"loss": 0.1871,
"step": 42875
},
{
"epoch": 46.78,
"learning_rate": 4.7573033707865176e-07,
"loss": 0.1949,
"step": 42900
},
{
"epoch": 46.81,
"learning_rate": 4.7011235955056183e-07,
"loss": 0.1999,
"step": 42925
},
{
"epoch": 46.84,
"learning_rate": 4.6449438202247196e-07,
"loss": 0.1805,
"step": 42950
},
{
"epoch": 46.86,
"learning_rate": 4.588764044943821e-07,
"loss": 0.1668,
"step": 42975
},
{
"epoch": 46.89,
"learning_rate": 4.5325842696629215e-07,
"loss": 0.2307,
"step": 43000
},
{
"epoch": 46.89,
"eval_cer": 7.136436169068848,
"eval_loss": 0.47538912296295166,
"eval_runtime": 3233.0256,
"eval_samples_per_second": 0.67,
"eval_steps_per_second": 0.168,
"eval_wer": 22.372201908848194,
"step": 43000
},
{
"epoch": 46.92,
"learning_rate": 4.476404494382023e-07,
"loss": 0.1901,
"step": 43025
},
{
"epoch": 46.95,
"learning_rate": 4.420224719101124e-07,
"loss": 0.197,
"step": 43050
},
{
"epoch": 46.97,
"learning_rate": 4.364044943820225e-07,
"loss": 0.2022,
"step": 43075
},
{
"epoch": 47.0,
"learning_rate": 4.3078651685393264e-07,
"loss": 0.1763,
"step": 43100
},
{
"epoch": 47.03,
"learning_rate": 4.251685393258427e-07,
"loss": 0.2063,
"step": 43125
},
{
"epoch": 47.06,
"learning_rate": 4.195505617977529e-07,
"loss": 0.1824,
"step": 43150
},
{
"epoch": 47.08,
"learning_rate": 4.1393258426966295e-07,
"loss": 0.2059,
"step": 43175
},
{
"epoch": 47.11,
"learning_rate": 4.0831460674157307e-07,
"loss": 0.194,
"step": 43200
},
{
"epoch": 47.14,
"learning_rate": 4.026966292134832e-07,
"loss": 0.155,
"step": 43225
},
{
"epoch": 47.16,
"learning_rate": 3.9707865168539326e-07,
"loss": 0.1933,
"step": 43250
},
{
"epoch": 47.19,
"learning_rate": 3.9146067415730344e-07,
"loss": 0.1939,
"step": 43275
},
{
"epoch": 47.22,
"learning_rate": 3.858426966292135e-07,
"loss": 0.1826,
"step": 43300
},
{
"epoch": 47.25,
"learning_rate": 3.802247191011237e-07,
"loss": 0.191,
"step": 43325
},
{
"epoch": 47.27,
"learning_rate": 3.7460674157303375e-07,
"loss": 0.1771,
"step": 43350
},
{
"epoch": 47.3,
"learning_rate": 3.689887640449438e-07,
"loss": 0.1942,
"step": 43375
},
{
"epoch": 47.33,
"learning_rate": 3.63370786516854e-07,
"loss": 0.1873,
"step": 43400
},
{
"epoch": 47.36,
"learning_rate": 3.5775280898876406e-07,
"loss": 0.1559,
"step": 43425
},
{
"epoch": 47.38,
"learning_rate": 3.5213483146067424e-07,
"loss": 0.1719,
"step": 43450
},
{
"epoch": 47.41,
"learning_rate": 3.465168539325843e-07,
"loss": 0.1971,
"step": 43475
},
{
"epoch": 47.44,
"learning_rate": 3.408988764044944e-07,
"loss": 0.1812,
"step": 43500
},
{
"epoch": 47.46,
"learning_rate": 3.3528089887640455e-07,
"loss": 0.1667,
"step": 43525
},
{
"epoch": 47.49,
"learning_rate": 3.296629213483146e-07,
"loss": 0.1625,
"step": 43550
},
{
"epoch": 47.52,
"learning_rate": 3.240449438202248e-07,
"loss": 0.1383,
"step": 43575
},
{
"epoch": 47.55,
"learning_rate": 3.1842696629213487e-07,
"loss": 0.1887,
"step": 43600
},
{
"epoch": 47.57,
"learning_rate": 3.1280898876404494e-07,
"loss": 0.2228,
"step": 43625
},
{
"epoch": 47.6,
"learning_rate": 3.0719101123595506e-07,
"loss": 0.18,
"step": 43650
},
{
"epoch": 47.63,
"learning_rate": 3.015730337078652e-07,
"loss": 0.1823,
"step": 43675
},
{
"epoch": 47.66,
"learning_rate": 2.959550561797753e-07,
"loss": 0.1498,
"step": 43700
},
{
"epoch": 47.68,
"learning_rate": 2.903370786516854e-07,
"loss": 0.1725,
"step": 43725
},
{
"epoch": 47.71,
"learning_rate": 2.8471910112359555e-07,
"loss": 0.1457,
"step": 43750
},
{
"epoch": 47.74,
"learning_rate": 2.791011235955056e-07,
"loss": 0.1575,
"step": 43775
},
{
"epoch": 47.76,
"learning_rate": 2.7348314606741574e-07,
"loss": 0.1722,
"step": 43800
},
{
"epoch": 47.79,
"learning_rate": 2.6786516853932586e-07,
"loss": 0.1841,
"step": 43825
},
{
"epoch": 47.82,
"learning_rate": 2.62247191011236e-07,
"loss": 0.1811,
"step": 43850
},
{
"epoch": 47.85,
"learning_rate": 2.566292134831461e-07,
"loss": 0.1808,
"step": 43875
},
{
"epoch": 47.87,
"learning_rate": 2.5101123595505617e-07,
"loss": 0.1564,
"step": 43900
},
{
"epoch": 47.9,
"learning_rate": 2.453932584269663e-07,
"loss": 0.1803,
"step": 43925
},
{
"epoch": 47.93,
"learning_rate": 2.397752808988764e-07,
"loss": 0.2052,
"step": 43950
},
{
"epoch": 47.96,
"learning_rate": 2.3415730337078654e-07,
"loss": 0.2026,
"step": 43975
},
{
"epoch": 47.98,
"learning_rate": 2.2853932584269666e-07,
"loss": 0.1705,
"step": 44000
},
{
"epoch": 47.98,
"eval_cer": 7.082958776529017,
"eval_loss": 0.47585317492485046,
"eval_runtime": 3126.347,
"eval_samples_per_second": 0.693,
"eval_steps_per_second": 0.173,
"eval_wer": 22.386295127661075,
"step": 44000
},
{
"epoch": 48.01,
"learning_rate": 2.2292134831460676e-07,
"loss": 0.1972,
"step": 44025
},
{
"epoch": 48.04,
"learning_rate": 2.1752808988764047e-07,
"loss": 0.156,
"step": 44050
},
{
"epoch": 48.06,
"learning_rate": 2.119101123595506e-07,
"loss": 0.1913,
"step": 44075
},
{
"epoch": 48.09,
"learning_rate": 2.062921348314607e-07,
"loss": 0.1576,
"step": 44100
},
{
"epoch": 48.12,
"learning_rate": 2.0067415730337078e-07,
"loss": 0.2132,
"step": 44125
},
{
"epoch": 48.15,
"learning_rate": 1.950561797752809e-07,
"loss": 0.1657,
"step": 44150
},
{
"epoch": 48.17,
"learning_rate": 1.8943820224719102e-07,
"loss": 0.1648,
"step": 44175
},
{
"epoch": 48.2,
"learning_rate": 1.8382022471910115e-07,
"loss": 0.1761,
"step": 44200
},
{
"epoch": 48.23,
"learning_rate": 1.7820224719101127e-07,
"loss": 0.1714,
"step": 44225
},
{
"epoch": 48.26,
"learning_rate": 1.7258426966292134e-07,
"loss": 0.1919,
"step": 44250
},
{
"epoch": 48.28,
"learning_rate": 1.6696629213483146e-07,
"loss": 0.1635,
"step": 44275
},
{
"epoch": 48.31,
"learning_rate": 1.6134831460674158e-07,
"loss": 0.1621,
"step": 44300
},
{
"epoch": 48.34,
"learning_rate": 1.557303370786517e-07,
"loss": 0.1812,
"step": 44325
},
{
"epoch": 48.36,
"learning_rate": 1.501123595505618e-07,
"loss": 0.1473,
"step": 44350
},
{
"epoch": 48.39,
"learning_rate": 1.4449438202247192e-07,
"loss": 0.1599,
"step": 44375
},
{
"epoch": 48.42,
"learning_rate": 1.3887640449438202e-07,
"loss": 0.1755,
"step": 44400
},
{
"epoch": 48.45,
"learning_rate": 1.3325842696629214e-07,
"loss": 0.1338,
"step": 44425
},
{
"epoch": 48.47,
"learning_rate": 1.2764044943820226e-07,
"loss": 0.1643,
"step": 44450
},
{
"epoch": 48.5,
"learning_rate": 1.2202247191011236e-07,
"loss": 0.1683,
"step": 44475
},
{
"epoch": 48.53,
"learning_rate": 1.1640449438202248e-07,
"loss": 0.2074,
"step": 44500
},
{
"epoch": 48.56,
"learning_rate": 1.1078651685393259e-07,
"loss": 0.1888,
"step": 44525
},
{
"epoch": 48.58,
"learning_rate": 1.0516853932584271e-07,
"loss": 0.1798,
"step": 44550
},
{
"epoch": 48.61,
"learning_rate": 9.955056179775281e-08,
"loss": 0.1636,
"step": 44575
},
{
"epoch": 48.64,
"learning_rate": 9.393258426966293e-08,
"loss": 0.1752,
"step": 44600
},
{
"epoch": 48.66,
"learning_rate": 8.831460674157305e-08,
"loss": 0.1478,
"step": 44625
},
{
"epoch": 48.69,
"learning_rate": 8.269662921348315e-08,
"loss": 0.1745,
"step": 44650
},
{
"epoch": 48.72,
"learning_rate": 7.707865168539327e-08,
"loss": 0.2115,
"step": 44675
},
{
"epoch": 48.75,
"learning_rate": 7.146067415730338e-08,
"loss": 0.1916,
"step": 44700
},
{
"epoch": 48.77,
"learning_rate": 6.584269662921349e-08,
"loss": 0.1798,
"step": 44725
},
{
"epoch": 48.8,
"learning_rate": 6.02247191011236e-08,
"loss": 0.1878,
"step": 44750
},
{
"epoch": 48.83,
"learning_rate": 5.460674157303371e-08,
"loss": 0.1734,
"step": 44775
},
{
"epoch": 48.85,
"learning_rate": 4.8988764044943827e-08,
"loss": 0.1588,
"step": 44800
},
{
"epoch": 48.88,
"learning_rate": 4.3370786516853935e-08,
"loss": 0.1622,
"step": 44825
},
{
"epoch": 48.91,
"learning_rate": 3.775280898876405e-08,
"loss": 0.1726,
"step": 44850
},
{
"epoch": 48.94,
"learning_rate": 3.213483146067416e-08,
"loss": 0.1523,
"step": 44875
},
{
"epoch": 48.96,
"learning_rate": 2.6516853932584272e-08,
"loss": 0.1753,
"step": 44900
},
{
"epoch": 48.99,
"learning_rate": 2.0898876404494384e-08,
"loss": 0.1672,
"step": 44925
},
{
"epoch": 49.02,
"learning_rate": 1.5280898876404497e-08,
"loss": 0.1675,
"step": 44950
},
{
"epoch": 49.05,
"learning_rate": 9.662921348314607e-09,
"loss": 0.1766,
"step": 44975
},
{
"epoch": 49.07,
"learning_rate": 4.044943820224719e-09,
"loss": 0.2007,
"step": 45000
},
{
"epoch": 49.07,
"eval_cer": 7.1186581618974305,
"eval_loss": 0.47667962312698364,
"eval_runtime": 3154.6082,
"eval_samples_per_second": 0.687,
"eval_steps_per_second": 0.172,
"eval_wer": 22.484947659351242,
"step": 45000
},
{
"epoch": 49.07,
"step": 45000,
"total_flos": 5.83519441453056e+18,
"train_loss": 0.0,
"train_runtime": 0.3863,
"train_samples_per_second": 90611.862,
"train_steps_per_second": 90611.862
},
{
"epoch": 49.07,
"eval_cer": 8.242936323479084,
"eval_loss": 0.5834927558898926,
"eval_runtime": 6238.1277,
"eval_samples_per_second": 0.745,
"eval_steps_per_second": 0.373,
"eval_wer": 24.854767937704718,
"step": 45000
}
],
"max_steps": 35000,
"num_train_epochs": 2,
"total_flos": 5.83519441453056e+18,
"trial_name": null,
"trial_params": null
}