whisper-base-nl-3 / trainer_state.json
SuperKogito's picture
End of training
cca04e4
raw
history blame
155 kB
{
"best_metric": 18.48141795311607,
"best_model_checkpoint": "whisper-base-nl-3/checkpoint-29000",
"epoch": 3.5599857600569598,
"global_step": 30000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 4.0000000000000003e-07,
"loss": 1.3847,
"step": 25
},
{
"epoch": 0.0,
"learning_rate": 9.000000000000001e-07,
"loss": 1.4601,
"step": 50
},
{
"epoch": 0.0,
"learning_rate": 1.4000000000000001e-06,
"loss": 1.3556,
"step": 75
},
{
"epoch": 0.01,
"learning_rate": 1.9000000000000002e-06,
"loss": 1.1454,
"step": 100
},
{
"epoch": 0.01,
"learning_rate": 2.4000000000000003e-06,
"loss": 1.2552,
"step": 125
},
{
"epoch": 0.01,
"learning_rate": 2.9e-06,
"loss": 1.1695,
"step": 150
},
{
"epoch": 0.01,
"learning_rate": 3.4000000000000005e-06,
"loss": 0.9503,
"step": 175
},
{
"epoch": 0.01,
"learning_rate": 3.900000000000001e-06,
"loss": 0.9096,
"step": 200
},
{
"epoch": 0.01,
"learning_rate": 4.4e-06,
"loss": 0.8853,
"step": 225
},
{
"epoch": 0.02,
"learning_rate": 4.9000000000000005e-06,
"loss": 0.833,
"step": 250
},
{
"epoch": 0.02,
"learning_rate": 5.400000000000001e-06,
"loss": 0.8597,
"step": 275
},
{
"epoch": 0.02,
"learning_rate": 5.9e-06,
"loss": 0.8199,
"step": 300
},
{
"epoch": 0.02,
"learning_rate": 6.4000000000000006e-06,
"loss": 0.7158,
"step": 325
},
{
"epoch": 0.02,
"learning_rate": 6.9e-06,
"loss": 0.6896,
"step": 350
},
{
"epoch": 0.02,
"learning_rate": 7.4e-06,
"loss": 0.662,
"step": 375
},
{
"epoch": 0.03,
"learning_rate": 7.9e-06,
"loss": 0.8284,
"step": 400
},
{
"epoch": 0.03,
"learning_rate": 8.400000000000001e-06,
"loss": 0.6544,
"step": 425
},
{
"epoch": 0.03,
"learning_rate": 8.900000000000001e-06,
"loss": 0.7486,
"step": 450
},
{
"epoch": 0.03,
"learning_rate": 9.4e-06,
"loss": 0.5652,
"step": 475
},
{
"epoch": 0.03,
"learning_rate": 9.9e-06,
"loss": 0.6604,
"step": 500
},
{
"epoch": 0.03,
"learning_rate": 9.994202898550725e-06,
"loss": 0.7287,
"step": 525
},
{
"epoch": 0.04,
"learning_rate": 9.986956521739132e-06,
"loss": 0.6413,
"step": 550
},
{
"epoch": 0.04,
"learning_rate": 9.979710144927537e-06,
"loss": 0.6762,
"step": 575
},
{
"epoch": 0.04,
"learning_rate": 9.972463768115943e-06,
"loss": 0.6882,
"step": 600
},
{
"epoch": 0.04,
"learning_rate": 9.965217391304348e-06,
"loss": 0.7015,
"step": 625
},
{
"epoch": 0.04,
"learning_rate": 9.957971014492755e-06,
"loss": 0.6145,
"step": 650
},
{
"epoch": 0.04,
"learning_rate": 9.95072463768116e-06,
"loss": 0.6674,
"step": 675
},
{
"epoch": 0.05,
"learning_rate": 9.943478260869565e-06,
"loss": 0.5915,
"step": 700
},
{
"epoch": 0.05,
"learning_rate": 9.936231884057972e-06,
"loss": 0.6632,
"step": 725
},
{
"epoch": 0.05,
"learning_rate": 9.928985507246378e-06,
"loss": 0.6157,
"step": 750
},
{
"epoch": 0.05,
"learning_rate": 9.921739130434783e-06,
"loss": 0.7222,
"step": 775
},
{
"epoch": 0.05,
"learning_rate": 9.91449275362319e-06,
"loss": 0.6447,
"step": 800
},
{
"epoch": 0.05,
"learning_rate": 9.907246376811595e-06,
"loss": 0.6848,
"step": 825
},
{
"epoch": 0.06,
"learning_rate": 9.9e-06,
"loss": 0.6391,
"step": 850
},
{
"epoch": 0.06,
"learning_rate": 9.892753623188407e-06,
"loss": 0.6543,
"step": 875
},
{
"epoch": 0.06,
"learning_rate": 9.885507246376812e-06,
"loss": 0.5579,
"step": 900
},
{
"epoch": 0.06,
"learning_rate": 9.878260869565218e-06,
"loss": 0.5699,
"step": 925
},
{
"epoch": 0.06,
"learning_rate": 9.871014492753625e-06,
"loss": 0.5404,
"step": 950
},
{
"epoch": 0.06,
"learning_rate": 9.86376811594203e-06,
"loss": 0.6237,
"step": 975
},
{
"epoch": 0.06,
"learning_rate": 9.856521739130435e-06,
"loss": 0.5761,
"step": 1000
},
{
"epoch": 0.06,
"eval_cer": 10.115352452161936,
"eval_loss": 0.5675458908081055,
"eval_runtime": 3220.6897,
"eval_samples_per_second": 0.771,
"eval_steps_per_second": 0.385,
"eval_wer": 28.15323041738136,
"step": 1000
},
{
"epoch": 0.07,
"learning_rate": 9.84927536231884e-06,
"loss": 0.6175,
"step": 1025
},
{
"epoch": 0.07,
"learning_rate": 9.842028985507247e-06,
"loss": 0.6934,
"step": 1050
},
{
"epoch": 0.07,
"learning_rate": 9.834782608695654e-06,
"loss": 0.5818,
"step": 1075
},
{
"epoch": 0.07,
"learning_rate": 9.827536231884059e-06,
"loss": 0.6175,
"step": 1100
},
{
"epoch": 0.07,
"learning_rate": 9.820289855072465e-06,
"loss": 0.4952,
"step": 1125
},
{
"epoch": 0.07,
"learning_rate": 9.81304347826087e-06,
"loss": 0.6194,
"step": 1150
},
{
"epoch": 0.08,
"learning_rate": 9.805797101449275e-06,
"loss": 0.5897,
"step": 1175
},
{
"epoch": 0.08,
"learning_rate": 9.798550724637682e-06,
"loss": 0.5356,
"step": 1200
},
{
"epoch": 0.08,
"learning_rate": 9.791304347826089e-06,
"loss": 0.5805,
"step": 1225
},
{
"epoch": 0.08,
"learning_rate": 9.784057971014494e-06,
"loss": 0.5446,
"step": 1250
},
{
"epoch": 0.08,
"learning_rate": 9.776811594202899e-06,
"loss": 0.6734,
"step": 1275
},
{
"epoch": 0.08,
"learning_rate": 9.769565217391305e-06,
"loss": 0.5457,
"step": 1300
},
{
"epoch": 0.09,
"learning_rate": 9.76231884057971e-06,
"loss": 0.4686,
"step": 1325
},
{
"epoch": 0.09,
"learning_rate": 9.755072463768117e-06,
"loss": 0.5954,
"step": 1350
},
{
"epoch": 0.09,
"learning_rate": 9.747826086956522e-06,
"loss": 0.4973,
"step": 1375
},
{
"epoch": 0.09,
"learning_rate": 9.740579710144929e-06,
"loss": 0.5727,
"step": 1400
},
{
"epoch": 0.09,
"learning_rate": 9.733333333333334e-06,
"loss": 0.5767,
"step": 1425
},
{
"epoch": 0.09,
"learning_rate": 9.726086956521739e-06,
"loss": 0.4814,
"step": 1450
},
{
"epoch": 0.1,
"learning_rate": 9.718840579710146e-06,
"loss": 0.5544,
"step": 1475
},
{
"epoch": 0.1,
"learning_rate": 9.71159420289855e-06,
"loss": 0.5281,
"step": 1500
},
{
"epoch": 0.1,
"learning_rate": 9.704347826086957e-06,
"loss": 0.612,
"step": 1525
},
{
"epoch": 0.1,
"learning_rate": 9.697101449275364e-06,
"loss": 0.5293,
"step": 1550
},
{
"epoch": 0.1,
"learning_rate": 9.689855072463769e-06,
"loss": 0.5881,
"step": 1575
},
{
"epoch": 0.1,
"learning_rate": 9.682608695652174e-06,
"loss": 0.5571,
"step": 1600
},
{
"epoch": 0.11,
"learning_rate": 9.67536231884058e-06,
"loss": 0.429,
"step": 1625
},
{
"epoch": 0.11,
"learning_rate": 9.668115942028986e-06,
"loss": 0.4661,
"step": 1650
},
{
"epoch": 0.11,
"learning_rate": 9.660869565217392e-06,
"loss": 0.5181,
"step": 1675
},
{
"epoch": 0.11,
"learning_rate": 9.653623188405797e-06,
"loss": 0.5188,
"step": 1700
},
{
"epoch": 0.11,
"learning_rate": 9.646376811594204e-06,
"loss": 0.4881,
"step": 1725
},
{
"epoch": 0.11,
"learning_rate": 9.639130434782609e-06,
"loss": 0.6319,
"step": 1750
},
{
"epoch": 0.11,
"learning_rate": 9.631884057971014e-06,
"loss": 0.6,
"step": 1775
},
{
"epoch": 0.12,
"learning_rate": 9.624637681159421e-06,
"loss": 0.5251,
"step": 1800
},
{
"epoch": 0.12,
"learning_rate": 9.617391304347828e-06,
"loss": 0.4999,
"step": 1825
},
{
"epoch": 0.12,
"learning_rate": 9.610144927536233e-06,
"loss": 0.5612,
"step": 1850
},
{
"epoch": 0.12,
"learning_rate": 9.60289855072464e-06,
"loss": 0.456,
"step": 1875
},
{
"epoch": 0.12,
"learning_rate": 9.595652173913044e-06,
"loss": 0.5589,
"step": 1900
},
{
"epoch": 0.12,
"learning_rate": 9.58840579710145e-06,
"loss": 0.396,
"step": 1925
},
{
"epoch": 0.13,
"learning_rate": 9.581159420289856e-06,
"loss": 0.4713,
"step": 1950
},
{
"epoch": 0.13,
"learning_rate": 9.573913043478261e-06,
"loss": 0.5178,
"step": 1975
},
{
"epoch": 0.13,
"learning_rate": 9.566666666666668e-06,
"loss": 0.48,
"step": 2000
},
{
"epoch": 0.13,
"eval_cer": 9.69108170593733,
"eval_loss": 0.5239235162734985,
"eval_runtime": 3297.9692,
"eval_samples_per_second": 0.753,
"eval_steps_per_second": 0.376,
"eval_wer": 26.436439870402133,
"step": 2000
},
{
"epoch": 0.13,
"learning_rate": 9.559420289855074e-06,
"loss": 0.5154,
"step": 2025
},
{
"epoch": 0.13,
"learning_rate": 9.55217391304348e-06,
"loss": 0.5715,
"step": 2050
},
{
"epoch": 0.13,
"learning_rate": 9.545217391304349e-06,
"loss": 0.5522,
"step": 2075
},
{
"epoch": 0.14,
"learning_rate": 9.537971014492754e-06,
"loss": 0.5205,
"step": 2100
},
{
"epoch": 0.14,
"learning_rate": 9.53072463768116e-06,
"loss": 0.4494,
"step": 2125
},
{
"epoch": 0.14,
"learning_rate": 9.523478260869566e-06,
"loss": 0.5226,
"step": 2150
},
{
"epoch": 0.14,
"learning_rate": 9.516231884057972e-06,
"loss": 0.469,
"step": 2175
},
{
"epoch": 0.14,
"learning_rate": 9.508985507246377e-06,
"loss": 0.5067,
"step": 2200
},
{
"epoch": 0.14,
"learning_rate": 9.501739130434784e-06,
"loss": 0.5879,
"step": 2225
},
{
"epoch": 0.15,
"learning_rate": 9.494492753623189e-06,
"loss": 0.8063,
"step": 2250
},
{
"epoch": 0.15,
"learning_rate": 9.487246376811596e-06,
"loss": 0.5067,
"step": 2275
},
{
"epoch": 0.15,
"learning_rate": 9.48e-06,
"loss": 0.5124,
"step": 2300
},
{
"epoch": 0.15,
"learning_rate": 9.472753623188406e-06,
"loss": 0.4894,
"step": 2325
},
{
"epoch": 0.15,
"learning_rate": 9.465507246376812e-06,
"loss": 0.504,
"step": 2350
},
{
"epoch": 0.15,
"learning_rate": 9.458260869565217e-06,
"loss": 0.545,
"step": 2375
},
{
"epoch": 0.16,
"learning_rate": 9.451014492753624e-06,
"loss": 0.4962,
"step": 2400
},
{
"epoch": 0.16,
"learning_rate": 9.44376811594203e-06,
"loss": 0.4774,
"step": 2425
},
{
"epoch": 0.16,
"learning_rate": 9.436521739130436e-06,
"loss": 0.5429,
"step": 2450
},
{
"epoch": 0.16,
"learning_rate": 9.42927536231884e-06,
"loss": 0.445,
"step": 2475
},
{
"epoch": 0.16,
"learning_rate": 9.422028985507246e-06,
"loss": 0.4111,
"step": 2500
},
{
"epoch": 0.16,
"learning_rate": 9.414782608695653e-06,
"loss": 0.5188,
"step": 2525
},
{
"epoch": 0.17,
"learning_rate": 9.40753623188406e-06,
"loss": 0.4584,
"step": 2550
},
{
"epoch": 0.17,
"learning_rate": 9.400289855072464e-06,
"loss": 0.5017,
"step": 2575
},
{
"epoch": 0.17,
"learning_rate": 9.393043478260871e-06,
"loss": 0.593,
"step": 2600
},
{
"epoch": 0.17,
"learning_rate": 9.385797101449276e-06,
"loss": 0.5195,
"step": 2625
},
{
"epoch": 0.17,
"learning_rate": 9.378550724637681e-06,
"loss": 0.5083,
"step": 2650
},
{
"epoch": 0.17,
"learning_rate": 9.371304347826088e-06,
"loss": 0.5534,
"step": 2675
},
{
"epoch": 0.17,
"learning_rate": 9.364057971014493e-06,
"loss": 0.4893,
"step": 2700
},
{
"epoch": 0.18,
"learning_rate": 9.3568115942029e-06,
"loss": 0.4512,
"step": 2725
},
{
"epoch": 0.18,
"learning_rate": 9.349565217391306e-06,
"loss": 0.5876,
"step": 2750
},
{
"epoch": 0.18,
"learning_rate": 9.342318840579711e-06,
"loss": 0.4597,
"step": 2775
},
{
"epoch": 0.18,
"learning_rate": 9.335072463768116e-06,
"loss": 0.3634,
"step": 2800
},
{
"epoch": 0.18,
"learning_rate": 9.327826086956523e-06,
"loss": 0.4483,
"step": 2825
},
{
"epoch": 0.18,
"learning_rate": 9.320579710144928e-06,
"loss": 0.5484,
"step": 2850
},
{
"epoch": 0.19,
"learning_rate": 9.313333333333335e-06,
"loss": 0.4852,
"step": 2875
},
{
"epoch": 0.19,
"learning_rate": 9.306086956521741e-06,
"loss": 0.5576,
"step": 2900
},
{
"epoch": 0.19,
"learning_rate": 9.298840579710146e-06,
"loss": 0.5107,
"step": 2925
},
{
"epoch": 0.19,
"learning_rate": 9.291594202898551e-06,
"loss": 0.5286,
"step": 2950
},
{
"epoch": 0.19,
"learning_rate": 9.284347826086956e-06,
"loss": 0.5618,
"step": 2975
},
{
"epoch": 0.19,
"learning_rate": 9.277101449275363e-06,
"loss": 0.4094,
"step": 3000
},
{
"epoch": 0.19,
"eval_cer": 9.153180185941267,
"eval_loss": 0.49246901273727417,
"eval_runtime": 3242.5657,
"eval_samples_per_second": 0.765,
"eval_steps_per_second": 0.383,
"eval_wer": 24.835525061940157,
"step": 3000
},
{
"epoch": 0.2,
"learning_rate": 9.26985507246377e-06,
"loss": 0.5152,
"step": 3025
},
{
"epoch": 0.2,
"learning_rate": 9.262608695652175e-06,
"loss": 0.5572,
"step": 3050
},
{
"epoch": 0.2,
"learning_rate": 9.255362318840581e-06,
"loss": 0.4801,
"step": 3075
},
{
"epoch": 0.2,
"learning_rate": 9.248115942028986e-06,
"loss": 0.4005,
"step": 3100
},
{
"epoch": 0.2,
"learning_rate": 9.240869565217391e-06,
"loss": 0.4693,
"step": 3125
},
{
"epoch": 0.2,
"learning_rate": 9.233623188405798e-06,
"loss": 0.4487,
"step": 3150
},
{
"epoch": 0.21,
"learning_rate": 9.226376811594203e-06,
"loss": 0.4477,
"step": 3175
},
{
"epoch": 0.21,
"learning_rate": 9.21913043478261e-06,
"loss": 0.4,
"step": 3200
},
{
"epoch": 0.21,
"learning_rate": 9.211884057971015e-06,
"loss": 0.4358,
"step": 3225
},
{
"epoch": 0.21,
"learning_rate": 9.204637681159421e-06,
"loss": 0.4952,
"step": 3250
},
{
"epoch": 0.21,
"learning_rate": 9.197391304347826e-06,
"loss": 0.4526,
"step": 3275
},
{
"epoch": 0.21,
"learning_rate": 9.190144927536233e-06,
"loss": 0.3588,
"step": 3300
},
{
"epoch": 0.22,
"learning_rate": 9.182898550724638e-06,
"loss": 0.5127,
"step": 3325
},
{
"epoch": 0.22,
"learning_rate": 9.175652173913045e-06,
"loss": 0.6166,
"step": 3350
},
{
"epoch": 0.22,
"learning_rate": 9.16840579710145e-06,
"loss": 0.5032,
"step": 3375
},
{
"epoch": 0.22,
"learning_rate": 9.161159420289855e-06,
"loss": 0.5632,
"step": 3400
},
{
"epoch": 0.22,
"learning_rate": 9.153913043478262e-06,
"loss": 0.5268,
"step": 3425
},
{
"epoch": 0.22,
"learning_rate": 9.146666666666667e-06,
"loss": 0.4672,
"step": 3450
},
{
"epoch": 0.23,
"learning_rate": 9.139420289855073e-06,
"loss": 0.4342,
"step": 3475
},
{
"epoch": 0.23,
"learning_rate": 9.13217391304348e-06,
"loss": 0.4504,
"step": 3500
},
{
"epoch": 0.23,
"learning_rate": 9.124927536231885e-06,
"loss": 0.4076,
"step": 3525
},
{
"epoch": 0.23,
"learning_rate": 9.11768115942029e-06,
"loss": 0.5036,
"step": 3550
},
{
"epoch": 0.23,
"learning_rate": 9.110434782608695e-06,
"loss": 0.3835,
"step": 3575
},
{
"epoch": 0.23,
"learning_rate": 9.103188405797102e-06,
"loss": 0.3652,
"step": 3600
},
{
"epoch": 0.23,
"learning_rate": 9.095942028985508e-06,
"loss": 0.4231,
"step": 3625
},
{
"epoch": 0.24,
"learning_rate": 9.088695652173913e-06,
"loss": 0.4644,
"step": 3650
},
{
"epoch": 0.24,
"learning_rate": 9.08144927536232e-06,
"loss": 0.5602,
"step": 3675
},
{
"epoch": 0.24,
"learning_rate": 9.074202898550725e-06,
"loss": 0.4637,
"step": 3700
},
{
"epoch": 0.24,
"learning_rate": 9.06695652173913e-06,
"loss": 0.4324,
"step": 3725
},
{
"epoch": 0.24,
"learning_rate": 9.059710144927537e-06,
"loss": 0.446,
"step": 3750
},
{
"epoch": 0.24,
"learning_rate": 9.052463768115944e-06,
"loss": 0.5127,
"step": 3775
},
{
"epoch": 0.25,
"learning_rate": 9.045217391304349e-06,
"loss": 0.4453,
"step": 3800
},
{
"epoch": 0.25,
"learning_rate": 9.037971014492755e-06,
"loss": 0.4382,
"step": 3825
},
{
"epoch": 0.25,
"learning_rate": 9.03072463768116e-06,
"loss": 0.5816,
"step": 3850
},
{
"epoch": 0.25,
"learning_rate": 9.023478260869565e-06,
"loss": 0.397,
"step": 3875
},
{
"epoch": 0.25,
"learning_rate": 9.016231884057972e-06,
"loss": 0.4512,
"step": 3900
},
{
"epoch": 0.25,
"learning_rate": 9.008985507246377e-06,
"loss": 0.4541,
"step": 3925
},
{
"epoch": 0.26,
"learning_rate": 9.001739130434784e-06,
"loss": 0.3829,
"step": 3950
},
{
"epoch": 0.26,
"learning_rate": 8.99449275362319e-06,
"loss": 0.5275,
"step": 3975
},
{
"epoch": 0.26,
"learning_rate": 8.987246376811595e-06,
"loss": 0.4792,
"step": 4000
},
{
"epoch": 0.26,
"eval_cer": 8.841433420237099,
"eval_loss": 0.47019296884536743,
"eval_runtime": 3179.8405,
"eval_samples_per_second": 0.781,
"eval_steps_per_second": 0.39,
"eval_wer": 24.110539355822375,
"step": 4000
},
{
"epoch": 0.26,
"learning_rate": 8.98e-06,
"loss": 0.4638,
"step": 4025
},
{
"epoch": 0.26,
"learning_rate": 8.972753623188405e-06,
"loss": 0.5326,
"step": 4050
},
{
"epoch": 0.26,
"learning_rate": 8.965507246376812e-06,
"loss": 0.4799,
"step": 4075
},
{
"epoch": 0.27,
"learning_rate": 8.958260869565219e-06,
"loss": 0.4798,
"step": 4100
},
{
"epoch": 0.27,
"learning_rate": 8.951014492753624e-06,
"loss": 0.4938,
"step": 4125
},
{
"epoch": 0.27,
"learning_rate": 8.94376811594203e-06,
"loss": 0.4882,
"step": 4150
},
{
"epoch": 0.27,
"learning_rate": 8.936521739130436e-06,
"loss": 0.4136,
"step": 4175
},
{
"epoch": 0.27,
"learning_rate": 8.92927536231884e-06,
"loss": 0.5116,
"step": 4200
},
{
"epoch": 0.27,
"learning_rate": 8.922028985507247e-06,
"loss": 0.5381,
"step": 4225
},
{
"epoch": 0.28,
"learning_rate": 8.914782608695652e-06,
"loss": 0.3999,
"step": 4250
},
{
"epoch": 0.28,
"learning_rate": 8.907536231884059e-06,
"loss": 0.3925,
"step": 4275
},
{
"epoch": 0.28,
"learning_rate": 8.900289855072464e-06,
"loss": 0.469,
"step": 4300
},
{
"epoch": 0.28,
"learning_rate": 8.89304347826087e-06,
"loss": 0.4854,
"step": 4325
},
{
"epoch": 0.28,
"learning_rate": 8.885797101449276e-06,
"loss": 0.5086,
"step": 4350
},
{
"epoch": 0.28,
"learning_rate": 8.878550724637682e-06,
"loss": 0.4679,
"step": 4375
},
{
"epoch": 0.29,
"learning_rate": 8.871594202898552e-06,
"loss": 0.5175,
"step": 4400
},
{
"epoch": 0.29,
"learning_rate": 8.864347826086957e-06,
"loss": 0.4921,
"step": 4425
},
{
"epoch": 0.29,
"learning_rate": 8.857101449275362e-06,
"loss": 0.4375,
"step": 4450
},
{
"epoch": 0.29,
"learning_rate": 8.849855072463769e-06,
"loss": 0.6226,
"step": 4475
},
{
"epoch": 0.29,
"learning_rate": 8.842608695652175e-06,
"loss": 0.4383,
"step": 4500
},
{
"epoch": 0.29,
"learning_rate": 8.83536231884058e-06,
"loss": 0.4799,
"step": 4525
},
{
"epoch": 0.29,
"learning_rate": 8.828115942028987e-06,
"loss": 0.4063,
"step": 4550
},
{
"epoch": 0.3,
"learning_rate": 8.820869565217392e-06,
"loss": 0.4039,
"step": 4575
},
{
"epoch": 0.3,
"learning_rate": 8.813623188405797e-06,
"loss": 0.3688,
"step": 4600
},
{
"epoch": 0.3,
"learning_rate": 8.806376811594204e-06,
"loss": 0.4714,
"step": 4625
},
{
"epoch": 0.3,
"learning_rate": 8.799130434782609e-06,
"loss": 0.426,
"step": 4650
},
{
"epoch": 0.3,
"learning_rate": 8.791884057971015e-06,
"loss": 0.4623,
"step": 4675
},
{
"epoch": 0.3,
"learning_rate": 8.784637681159422e-06,
"loss": 0.4223,
"step": 4700
},
{
"epoch": 0.31,
"learning_rate": 8.777391304347827e-06,
"loss": 0.504,
"step": 4725
},
{
"epoch": 0.31,
"learning_rate": 8.770144927536232e-06,
"loss": 0.4396,
"step": 4750
},
{
"epoch": 0.31,
"learning_rate": 8.762898550724639e-06,
"loss": 0.4665,
"step": 4775
},
{
"epoch": 0.31,
"learning_rate": 8.755652173913044e-06,
"loss": 0.4356,
"step": 4800
},
{
"epoch": 0.31,
"learning_rate": 8.74840579710145e-06,
"loss": 0.4058,
"step": 4825
},
{
"epoch": 0.31,
"learning_rate": 8.741159420289856e-06,
"loss": 0.4825,
"step": 4850
},
{
"epoch": 0.32,
"learning_rate": 8.733913043478262e-06,
"loss": 0.5461,
"step": 4875
},
{
"epoch": 0.32,
"learning_rate": 8.726666666666667e-06,
"loss": 0.4718,
"step": 4900
},
{
"epoch": 0.32,
"learning_rate": 8.719420289855072e-06,
"loss": 0.5011,
"step": 4925
},
{
"epoch": 0.32,
"learning_rate": 8.712173913043479e-06,
"loss": 0.4281,
"step": 4950
},
{
"epoch": 0.32,
"learning_rate": 8.704927536231886e-06,
"loss": 0.5207,
"step": 4975
},
{
"epoch": 0.32,
"learning_rate": 8.69768115942029e-06,
"loss": 0.3444,
"step": 5000
},
{
"epoch": 0.32,
"eval_cer": 8.853116237886763,
"eval_loss": 0.45443984866142273,
"eval_runtime": 3270.5063,
"eval_samples_per_second": 0.759,
"eval_steps_per_second": 0.379,
"eval_wer": 23.901658090337335,
"step": 5000
},
{
"epoch": 0.33,
"learning_rate": 8.690434782608697e-06,
"loss": 0.4848,
"step": 5025
},
{
"epoch": 0.33,
"learning_rate": 8.683188405797102e-06,
"loss": 0.4012,
"step": 5050
},
{
"epoch": 0.33,
"learning_rate": 8.675942028985507e-06,
"loss": 0.3266,
"step": 5075
},
{
"epoch": 0.33,
"learning_rate": 8.668695652173914e-06,
"loss": 0.4751,
"step": 5100
},
{
"epoch": 0.33,
"learning_rate": 8.661449275362319e-06,
"loss": 0.5552,
"step": 5125
},
{
"epoch": 0.33,
"learning_rate": 8.654202898550726e-06,
"loss": 0.4079,
"step": 5150
},
{
"epoch": 0.34,
"learning_rate": 8.64695652173913e-06,
"loss": 0.4326,
"step": 5175
},
{
"epoch": 0.34,
"learning_rate": 8.639710144927538e-06,
"loss": 0.4591,
"step": 5200
},
{
"epoch": 0.34,
"learning_rate": 8.632463768115943e-06,
"loss": 0.3962,
"step": 5225
},
{
"epoch": 0.34,
"learning_rate": 8.625217391304348e-06,
"loss": 0.4825,
"step": 5250
},
{
"epoch": 0.34,
"learning_rate": 8.617971014492754e-06,
"loss": 0.4377,
"step": 5275
},
{
"epoch": 0.34,
"learning_rate": 8.610724637681161e-06,
"loss": 0.437,
"step": 5300
},
{
"epoch": 0.34,
"learning_rate": 8.603478260869566e-06,
"loss": 0.3836,
"step": 5325
},
{
"epoch": 0.35,
"learning_rate": 8.596231884057971e-06,
"loss": 0.4649,
"step": 5350
},
{
"epoch": 0.35,
"learning_rate": 8.588985507246378e-06,
"loss": 0.4631,
"step": 5375
},
{
"epoch": 0.35,
"learning_rate": 8.581739130434783e-06,
"loss": 0.5619,
"step": 5400
},
{
"epoch": 0.35,
"learning_rate": 8.57449275362319e-06,
"loss": 0.5031,
"step": 5425
},
{
"epoch": 0.35,
"learning_rate": 8.567246376811596e-06,
"loss": 0.3797,
"step": 5450
},
{
"epoch": 0.35,
"learning_rate": 8.560000000000001e-06,
"loss": 0.4993,
"step": 5475
},
{
"epoch": 0.36,
"learning_rate": 8.552753623188406e-06,
"loss": 0.4146,
"step": 5500
},
{
"epoch": 0.36,
"learning_rate": 8.545507246376811e-06,
"loss": 0.4524,
"step": 5525
},
{
"epoch": 0.36,
"learning_rate": 8.538260869565218e-06,
"loss": 0.4812,
"step": 5550
},
{
"epoch": 0.36,
"learning_rate": 8.531014492753624e-06,
"loss": 0.3781,
"step": 5575
},
{
"epoch": 0.36,
"learning_rate": 8.52376811594203e-06,
"loss": 0.4343,
"step": 5600
},
{
"epoch": 0.36,
"learning_rate": 8.516521739130436e-06,
"loss": 0.4226,
"step": 5625
},
{
"epoch": 0.37,
"learning_rate": 8.509275362318841e-06,
"loss": 0.4341,
"step": 5650
},
{
"epoch": 0.37,
"learning_rate": 8.502028985507246e-06,
"loss": 0.4008,
"step": 5675
},
{
"epoch": 0.37,
"learning_rate": 8.494782608695653e-06,
"loss": 0.4199,
"step": 5700
},
{
"epoch": 0.37,
"learning_rate": 8.487536231884058e-06,
"loss": 0.4822,
"step": 5725
},
{
"epoch": 0.37,
"learning_rate": 8.480289855072465e-06,
"loss": 0.3857,
"step": 5750
},
{
"epoch": 0.37,
"learning_rate": 8.473043478260871e-06,
"loss": 0.5646,
"step": 5775
},
{
"epoch": 0.38,
"learning_rate": 8.465797101449276e-06,
"loss": 0.3835,
"step": 5800
},
{
"epoch": 0.38,
"learning_rate": 8.458550724637681e-06,
"loss": 0.4856,
"step": 5825
},
{
"epoch": 0.38,
"learning_rate": 8.451304347826088e-06,
"loss": 0.4807,
"step": 5850
},
{
"epoch": 0.38,
"learning_rate": 8.444057971014493e-06,
"loss": 0.5281,
"step": 5875
},
{
"epoch": 0.38,
"learning_rate": 8.4368115942029e-06,
"loss": 0.4234,
"step": 5900
},
{
"epoch": 0.38,
"learning_rate": 8.429565217391305e-06,
"loss": 0.6375,
"step": 5925
},
{
"epoch": 0.39,
"learning_rate": 8.422318840579711e-06,
"loss": 0.4303,
"step": 5950
},
{
"epoch": 0.39,
"learning_rate": 8.415072463768116e-06,
"loss": 0.4196,
"step": 5975
},
{
"epoch": 0.39,
"learning_rate": 8.407826086956521e-06,
"loss": 0.3943,
"step": 6000
},
{
"epoch": 0.39,
"eval_cer": 8.360224310098873,
"eval_loss": 0.44455686211586,
"eval_runtime": 3263.9495,
"eval_samples_per_second": 0.76,
"eval_steps_per_second": 0.38,
"eval_wer": 22.735277301315037,
"step": 6000
},
{
"epoch": 0.39,
"learning_rate": 8.400579710144928e-06,
"loss": 0.4164,
"step": 6025
},
{
"epoch": 0.39,
"learning_rate": 8.393333333333335e-06,
"loss": 0.4818,
"step": 6050
},
{
"epoch": 0.39,
"learning_rate": 8.38608695652174e-06,
"loss": 0.5536,
"step": 6075
},
{
"epoch": 0.4,
"learning_rate": 8.378840579710147e-06,
"loss": 0.4731,
"step": 6100
},
{
"epoch": 0.4,
"learning_rate": 8.371594202898552e-06,
"loss": 0.4081,
"step": 6125
},
{
"epoch": 0.4,
"learning_rate": 8.364347826086957e-06,
"loss": 0.3741,
"step": 6150
},
{
"epoch": 0.4,
"learning_rate": 8.357101449275363e-06,
"loss": 0.4173,
"step": 6175
},
{
"epoch": 0.4,
"learning_rate": 8.349855072463768e-06,
"loss": 0.4954,
"step": 6200
},
{
"epoch": 0.4,
"learning_rate": 8.342608695652175e-06,
"loss": 0.461,
"step": 6225
},
{
"epoch": 0.4,
"learning_rate": 8.33536231884058e-06,
"loss": 0.4501,
"step": 6250
},
{
"epoch": 0.41,
"learning_rate": 8.328115942028987e-06,
"loss": 0.3652,
"step": 6275
},
{
"epoch": 0.41,
"learning_rate": 8.320869565217392e-06,
"loss": 0.4046,
"step": 6300
},
{
"epoch": 0.41,
"learning_rate": 8.313623188405798e-06,
"loss": 0.4184,
"step": 6325
},
{
"epoch": 0.41,
"learning_rate": 8.306376811594203e-06,
"loss": 0.4287,
"step": 6350
},
{
"epoch": 0.41,
"learning_rate": 8.29913043478261e-06,
"loss": 0.3938,
"step": 6375
},
{
"epoch": 0.41,
"learning_rate": 8.291884057971015e-06,
"loss": 0.4758,
"step": 6400
},
{
"epoch": 0.42,
"learning_rate": 8.28463768115942e-06,
"loss": 0.4716,
"step": 6425
},
{
"epoch": 0.42,
"learning_rate": 8.277391304347827e-06,
"loss": 0.3819,
"step": 6450
},
{
"epoch": 0.42,
"learning_rate": 8.270144927536232e-06,
"loss": 0.3889,
"step": 6475
},
{
"epoch": 0.42,
"learning_rate": 8.262898550724639e-06,
"loss": 0.4659,
"step": 6500
},
{
"epoch": 0.42,
"learning_rate": 8.255652173913045e-06,
"loss": 0.3274,
"step": 6525
},
{
"epoch": 0.42,
"learning_rate": 8.24840579710145e-06,
"loss": 0.4144,
"step": 6550
},
{
"epoch": 0.43,
"learning_rate": 8.241159420289855e-06,
"loss": 0.3875,
"step": 6575
},
{
"epoch": 0.43,
"learning_rate": 8.23391304347826e-06,
"loss": 0.452,
"step": 6600
},
{
"epoch": 0.43,
"learning_rate": 8.226666666666667e-06,
"loss": 0.4747,
"step": 6625
},
{
"epoch": 0.43,
"learning_rate": 8.219420289855074e-06,
"loss": 0.4448,
"step": 6650
},
{
"epoch": 0.43,
"learning_rate": 8.212173913043479e-06,
"loss": 0.5215,
"step": 6675
},
{
"epoch": 0.43,
"learning_rate": 8.204927536231885e-06,
"loss": 0.4261,
"step": 6700
},
{
"epoch": 0.44,
"learning_rate": 8.19768115942029e-06,
"loss": 0.4482,
"step": 6725
},
{
"epoch": 0.44,
"learning_rate": 8.190434782608695e-06,
"loss": 0.39,
"step": 6750
},
{
"epoch": 0.44,
"learning_rate": 8.183188405797102e-06,
"loss": 0.6096,
"step": 6775
},
{
"epoch": 0.44,
"learning_rate": 8.175942028985507e-06,
"loss": 0.3912,
"step": 6800
},
{
"epoch": 0.44,
"learning_rate": 8.168695652173914e-06,
"loss": 0.3141,
"step": 6825
},
{
"epoch": 0.44,
"learning_rate": 8.16144927536232e-06,
"loss": 0.3593,
"step": 6850
},
{
"epoch": 0.45,
"learning_rate": 8.154202898550725e-06,
"loss": 0.4331,
"step": 6875
},
{
"epoch": 0.45,
"learning_rate": 8.14695652173913e-06,
"loss": 0.4574,
"step": 6900
},
{
"epoch": 0.45,
"learning_rate": 8.139710144927537e-06,
"loss": 0.3546,
"step": 6925
},
{
"epoch": 0.45,
"learning_rate": 8.132463768115942e-06,
"loss": 0.3894,
"step": 6950
},
{
"epoch": 0.45,
"learning_rate": 8.125217391304349e-06,
"loss": 0.393,
"step": 6975
},
{
"epoch": 0.45,
"learning_rate": 8.117971014492756e-06,
"loss": 0.4925,
"step": 7000
},
{
"epoch": 0.45,
"eval_cer": 8.3723990358601,
"eval_loss": 0.4348393380641937,
"eval_runtime": 3254.2457,
"eval_samples_per_second": 0.763,
"eval_steps_per_second": 0.381,
"eval_wer": 22.178768820278254,
"step": 7000
},
{
"epoch": 0.46,
"learning_rate": 8.11072463768116e-06,
"loss": 0.3986,
"step": 7025
},
{
"epoch": 0.46,
"learning_rate": 8.103478260869566e-06,
"loss": 0.3943,
"step": 7050
},
{
"epoch": 0.46,
"learning_rate": 8.09623188405797e-06,
"loss": 0.4803,
"step": 7075
},
{
"epoch": 0.46,
"learning_rate": 8.088985507246377e-06,
"loss": 0.4128,
"step": 7100
},
{
"epoch": 0.46,
"learning_rate": 8.081739130434784e-06,
"loss": 0.5511,
"step": 7125
},
{
"epoch": 0.46,
"learning_rate": 8.074492753623189e-06,
"loss": 0.4377,
"step": 7150
},
{
"epoch": 0.46,
"learning_rate": 8.067246376811596e-06,
"loss": 0.453,
"step": 7175
},
{
"epoch": 0.47,
"learning_rate": 8.06e-06,
"loss": 0.4019,
"step": 7200
},
{
"epoch": 0.47,
"learning_rate": 8.052753623188406e-06,
"loss": 0.4934,
"step": 7225
},
{
"epoch": 0.47,
"learning_rate": 8.045507246376812e-06,
"loss": 0.3873,
"step": 7250
},
{
"epoch": 0.47,
"learning_rate": 8.038260869565217e-06,
"loss": 0.389,
"step": 7275
},
{
"epoch": 0.47,
"learning_rate": 8.031014492753624e-06,
"loss": 0.4086,
"step": 7300
},
{
"epoch": 0.47,
"learning_rate": 8.02376811594203e-06,
"loss": 0.3844,
"step": 7325
},
{
"epoch": 0.48,
"learning_rate": 8.016521739130436e-06,
"loss": 0.4577,
"step": 7350
},
{
"epoch": 0.48,
"learning_rate": 8.009275362318841e-06,
"loss": 0.383,
"step": 7375
},
{
"epoch": 0.48,
"learning_rate": 8.002028985507248e-06,
"loss": 0.5191,
"step": 7400
},
{
"epoch": 0.48,
"learning_rate": 7.994782608695653e-06,
"loss": 0.3293,
"step": 7425
},
{
"epoch": 0.48,
"learning_rate": 7.98753623188406e-06,
"loss": 0.4246,
"step": 7450
},
{
"epoch": 0.48,
"learning_rate": 7.980289855072464e-06,
"loss": 0.3811,
"step": 7475
},
{
"epoch": 0.49,
"learning_rate": 7.97304347826087e-06,
"loss": 0.3891,
"step": 7500
},
{
"epoch": 0.49,
"learning_rate": 7.965797101449276e-06,
"loss": 0.4367,
"step": 7525
},
{
"epoch": 0.49,
"learning_rate": 7.958550724637681e-06,
"loss": 0.4793,
"step": 7550
},
{
"epoch": 0.49,
"learning_rate": 7.951304347826088e-06,
"loss": 0.3993,
"step": 7575
},
{
"epoch": 0.49,
"learning_rate": 7.944347826086957e-06,
"loss": 0.3095,
"step": 7600
},
{
"epoch": 0.49,
"learning_rate": 7.937101449275362e-06,
"loss": 0.4002,
"step": 7625
},
{
"epoch": 0.5,
"learning_rate": 7.929855072463769e-06,
"loss": 0.4037,
"step": 7650
},
{
"epoch": 0.5,
"learning_rate": 7.922608695652174e-06,
"loss": 0.3694,
"step": 7675
},
{
"epoch": 0.5,
"learning_rate": 7.91536231884058e-06,
"loss": 0.3969,
"step": 7700
},
{
"epoch": 0.5,
"learning_rate": 7.908115942028987e-06,
"loss": 0.4404,
"step": 7725
},
{
"epoch": 0.5,
"learning_rate": 7.900869565217392e-06,
"loss": 0.4489,
"step": 7750
},
{
"epoch": 0.5,
"learning_rate": 7.893623188405797e-06,
"loss": 0.3542,
"step": 7775
},
{
"epoch": 0.51,
"learning_rate": 7.886376811594204e-06,
"loss": 0.4793,
"step": 7800
},
{
"epoch": 0.51,
"learning_rate": 7.879130434782609e-06,
"loss": 0.3876,
"step": 7825
},
{
"epoch": 0.51,
"learning_rate": 7.871884057971016e-06,
"loss": 0.3983,
"step": 7850
},
{
"epoch": 0.51,
"learning_rate": 7.86463768115942e-06,
"loss": 0.5017,
"step": 7875
},
{
"epoch": 0.51,
"learning_rate": 7.857391304347827e-06,
"loss": 0.3704,
"step": 7900
},
{
"epoch": 0.51,
"learning_rate": 7.850144927536232e-06,
"loss": 0.4443,
"step": 7925
},
{
"epoch": 0.51,
"learning_rate": 7.842898550724637e-06,
"loss": 0.3535,
"step": 7950
},
{
"epoch": 0.52,
"learning_rate": 7.835652173913044e-06,
"loss": 0.4255,
"step": 7975
},
{
"epoch": 0.52,
"learning_rate": 7.828405797101451e-06,
"loss": 0.4455,
"step": 8000
},
{
"epoch": 0.52,
"eval_cer": 8.29885877318117,
"eval_loss": 0.42695876955986023,
"eval_runtime": 3202.8428,
"eval_samples_per_second": 0.775,
"eval_steps_per_second": 0.387,
"eval_wer": 21.754907566228322,
"step": 8000
},
{
"epoch": 0.52,
"learning_rate": 7.821159420289856e-06,
"loss": 0.5201,
"step": 8025
},
{
"epoch": 0.52,
"learning_rate": 7.813913043478263e-06,
"loss": 0.4287,
"step": 8050
},
{
"epoch": 0.52,
"learning_rate": 7.806666666666668e-06,
"loss": 0.3597,
"step": 8075
},
{
"epoch": 0.52,
"learning_rate": 7.799420289855073e-06,
"loss": 0.2911,
"step": 8100
},
{
"epoch": 0.53,
"learning_rate": 7.79217391304348e-06,
"loss": 0.4192,
"step": 8125
},
{
"epoch": 0.53,
"learning_rate": 7.784927536231884e-06,
"loss": 0.328,
"step": 8150
},
{
"epoch": 0.53,
"learning_rate": 7.777681159420291e-06,
"loss": 0.4364,
"step": 8175
},
{
"epoch": 0.53,
"learning_rate": 7.770434782608696e-06,
"loss": 0.2877,
"step": 8200
},
{
"epoch": 0.53,
"learning_rate": 7.763188405797101e-06,
"loss": 0.3641,
"step": 8225
},
{
"epoch": 0.53,
"learning_rate": 7.755942028985508e-06,
"loss": 0.3338,
"step": 8250
},
{
"epoch": 0.54,
"learning_rate": 7.748695652173913e-06,
"loss": 0.3425,
"step": 8275
},
{
"epoch": 0.54,
"learning_rate": 7.74144927536232e-06,
"loss": 0.3633,
"step": 8300
},
{
"epoch": 0.54,
"learning_rate": 7.734202898550726e-06,
"loss": 0.4027,
"step": 8325
},
{
"epoch": 0.54,
"learning_rate": 7.726956521739131e-06,
"loss": 0.4075,
"step": 8350
},
{
"epoch": 0.54,
"learning_rate": 7.719710144927536e-06,
"loss": 0.4272,
"step": 8375
},
{
"epoch": 0.54,
"learning_rate": 7.712463768115943e-06,
"loss": 0.4463,
"step": 8400
},
{
"epoch": 0.55,
"learning_rate": 7.705217391304348e-06,
"loss": 0.4225,
"step": 8425
},
{
"epoch": 0.55,
"learning_rate": 7.697971014492755e-06,
"loss": 0.4155,
"step": 8450
},
{
"epoch": 0.55,
"learning_rate": 7.69072463768116e-06,
"loss": 0.3319,
"step": 8475
},
{
"epoch": 0.55,
"learning_rate": 7.683478260869566e-06,
"loss": 0.3675,
"step": 8500
},
{
"epoch": 0.55,
"learning_rate": 7.676231884057971e-06,
"loss": 0.4573,
"step": 8525
},
{
"epoch": 0.55,
"learning_rate": 7.668985507246376e-06,
"loss": 0.3742,
"step": 8550
},
{
"epoch": 0.56,
"learning_rate": 7.661739130434783e-06,
"loss": 0.4487,
"step": 8575
},
{
"epoch": 0.56,
"learning_rate": 7.65449275362319e-06,
"loss": 0.3993,
"step": 8600
},
{
"epoch": 0.56,
"learning_rate": 7.647246376811595e-06,
"loss": 0.3999,
"step": 8625
},
{
"epoch": 0.56,
"learning_rate": 7.640000000000001e-06,
"loss": 0.4322,
"step": 8650
},
{
"epoch": 0.56,
"learning_rate": 7.632753623188406e-06,
"loss": 0.2906,
"step": 8675
},
{
"epoch": 0.56,
"learning_rate": 7.625507246376812e-06,
"loss": 0.41,
"step": 8700
},
{
"epoch": 0.57,
"learning_rate": 7.618260869565218e-06,
"loss": 0.2934,
"step": 8725
},
{
"epoch": 0.57,
"learning_rate": 7.611014492753623e-06,
"loss": 0.3668,
"step": 8750
},
{
"epoch": 0.57,
"learning_rate": 7.60376811594203e-06,
"loss": 0.3826,
"step": 8775
},
{
"epoch": 0.57,
"learning_rate": 7.596521739130436e-06,
"loss": 0.4043,
"step": 8800
},
{
"epoch": 0.57,
"learning_rate": 7.589275362318841e-06,
"loss": 0.6248,
"step": 8825
},
{
"epoch": 0.57,
"learning_rate": 7.582028985507247e-06,
"loss": 0.4668,
"step": 8850
},
{
"epoch": 0.57,
"learning_rate": 7.574782608695653e-06,
"loss": 0.4407,
"step": 8875
},
{
"epoch": 0.58,
"learning_rate": 7.567536231884058e-06,
"loss": 0.3811,
"step": 8900
},
{
"epoch": 0.58,
"learning_rate": 7.560289855072465e-06,
"loss": 0.4717,
"step": 8925
},
{
"epoch": 0.58,
"learning_rate": 7.55304347826087e-06,
"loss": 0.3531,
"step": 8950
},
{
"epoch": 0.58,
"learning_rate": 7.545797101449276e-06,
"loss": 0.4022,
"step": 8975
},
{
"epoch": 0.58,
"learning_rate": 7.5385507246376825e-06,
"loss": 0.3987,
"step": 9000
},
{
"epoch": 0.58,
"eval_cer": 7.9417334841851535,
"eval_loss": 0.41387349367141724,
"eval_runtime": 3295.4388,
"eval_samples_per_second": 0.753,
"eval_steps_per_second": 0.377,
"eval_wer": 20.842386125404992,
"step": 9000
},
{
"epoch": 0.58,
"learning_rate": 7.5313043478260875e-06,
"loss": 0.2728,
"step": 9025
},
{
"epoch": 0.59,
"learning_rate": 7.524057971014493e-06,
"loss": 0.5125,
"step": 9050
},
{
"epoch": 0.59,
"learning_rate": 7.516811594202899e-06,
"loss": 0.3452,
"step": 9075
},
{
"epoch": 0.59,
"learning_rate": 7.509565217391305e-06,
"loss": 0.3387,
"step": 9100
},
{
"epoch": 0.59,
"learning_rate": 7.502318840579711e-06,
"loss": 0.5818,
"step": 9125
},
{
"epoch": 0.59,
"learning_rate": 7.495072463768116e-06,
"loss": 0.3494,
"step": 9150
},
{
"epoch": 0.59,
"learning_rate": 7.487826086956523e-06,
"loss": 0.2902,
"step": 9175
},
{
"epoch": 0.6,
"learning_rate": 7.4805797101449285e-06,
"loss": 0.3691,
"step": 9200
},
{
"epoch": 0.6,
"learning_rate": 7.4733333333333335e-06,
"loss": 0.3344,
"step": 9225
},
{
"epoch": 0.6,
"learning_rate": 7.466086956521739e-06,
"loss": 0.3612,
"step": 9250
},
{
"epoch": 0.6,
"learning_rate": 7.458840579710146e-06,
"loss": 0.4311,
"step": 9275
},
{
"epoch": 0.6,
"learning_rate": 7.451594202898551e-06,
"loss": 0.4298,
"step": 9300
},
{
"epoch": 0.6,
"learning_rate": 7.444347826086957e-06,
"loss": 0.3657,
"step": 9325
},
{
"epoch": 0.61,
"learning_rate": 7.437101449275363e-06,
"loss": 0.4382,
"step": 9350
},
{
"epoch": 0.61,
"learning_rate": 7.429855072463769e-06,
"loss": 0.3775,
"step": 9375
},
{
"epoch": 0.61,
"learning_rate": 7.4226086956521745e-06,
"loss": 0.3566,
"step": 9400
},
{
"epoch": 0.61,
"learning_rate": 7.4153623188405795e-06,
"loss": 0.3423,
"step": 9425
},
{
"epoch": 0.61,
"learning_rate": 7.408115942028986e-06,
"loss": 0.4855,
"step": 9450
},
{
"epoch": 0.61,
"learning_rate": 7.400869565217392e-06,
"loss": 0.3648,
"step": 9475
},
{
"epoch": 0.62,
"learning_rate": 7.393623188405797e-06,
"loss": 0.3294,
"step": 9500
},
{
"epoch": 0.62,
"learning_rate": 7.386376811594204e-06,
"loss": 0.3991,
"step": 9525
},
{
"epoch": 0.62,
"learning_rate": 7.37913043478261e-06,
"loss": 0.347,
"step": 9550
},
{
"epoch": 0.62,
"learning_rate": 7.371884057971015e-06,
"loss": 0.4011,
"step": 9575
},
{
"epoch": 0.62,
"learning_rate": 7.364637681159421e-06,
"loss": 0.3433,
"step": 9600
},
{
"epoch": 0.62,
"learning_rate": 7.357391304347826e-06,
"loss": 0.4642,
"step": 9625
},
{
"epoch": 0.63,
"learning_rate": 7.350144927536232e-06,
"loss": 0.3897,
"step": 9650
},
{
"epoch": 0.63,
"learning_rate": 7.342898550724639e-06,
"loss": 0.4562,
"step": 9675
},
{
"epoch": 0.63,
"learning_rate": 7.335652173913044e-06,
"loss": 0.4942,
"step": 9700
},
{
"epoch": 0.63,
"learning_rate": 7.32840579710145e-06,
"loss": 0.3497,
"step": 9725
},
{
"epoch": 0.63,
"learning_rate": 7.3211594202898564e-06,
"loss": 0.3713,
"step": 9750
},
{
"epoch": 0.63,
"learning_rate": 7.3139130434782614e-06,
"loss": 0.3558,
"step": 9775
},
{
"epoch": 0.63,
"learning_rate": 7.306666666666667e-06,
"loss": 0.4417,
"step": 9800
},
{
"epoch": 0.64,
"learning_rate": 7.299420289855072e-06,
"loss": 0.4752,
"step": 9825
},
{
"epoch": 0.64,
"learning_rate": 7.292173913043479e-06,
"loss": 0.3515,
"step": 9850
},
{
"epoch": 0.64,
"learning_rate": 7.284927536231885e-06,
"loss": 0.4731,
"step": 9875
},
{
"epoch": 0.64,
"learning_rate": 7.27768115942029e-06,
"loss": 0.3111,
"step": 9900
},
{
"epoch": 0.64,
"learning_rate": 7.2704347826086966e-06,
"loss": 0.3776,
"step": 9925
},
{
"epoch": 0.64,
"learning_rate": 7.263188405797102e-06,
"loss": 0.4209,
"step": 9950
},
{
"epoch": 0.65,
"learning_rate": 7.2559420289855074e-06,
"loss": 0.3707,
"step": 9975
},
{
"epoch": 0.65,
"learning_rate": 7.248695652173914e-06,
"loss": 0.3373,
"step": 10000
},
{
"epoch": 0.65,
"eval_cer": 7.887131683801465,
"eval_loss": 0.4116414785385132,
"eval_runtime": 3350.806,
"eval_samples_per_second": 0.741,
"eval_steps_per_second": 0.37,
"eval_wer": 21.214408233276156,
"step": 10000
},
{
"epoch": 0.65,
"learning_rate": 7.241449275362319e-06,
"loss": 0.3843,
"step": 10025
},
{
"epoch": 0.65,
"learning_rate": 7.234202898550725e-06,
"loss": 0.3891,
"step": 10050
},
{
"epoch": 0.65,
"learning_rate": 7.226956521739132e-06,
"loss": 0.4058,
"step": 10075
},
{
"epoch": 0.65,
"learning_rate": 7.219710144927537e-06,
"loss": 0.3908,
"step": 10100
},
{
"epoch": 0.66,
"learning_rate": 7.2124637681159426e-06,
"loss": 0.384,
"step": 10125
},
{
"epoch": 0.66,
"learning_rate": 7.205217391304348e-06,
"loss": 0.4804,
"step": 10150
},
{
"epoch": 0.66,
"learning_rate": 7.197971014492754e-06,
"loss": 0.2675,
"step": 10175
},
{
"epoch": 0.66,
"learning_rate": 7.19072463768116e-06,
"loss": 0.4003,
"step": 10200
},
{
"epoch": 0.66,
"learning_rate": 7.183478260869566e-06,
"loss": 0.4716,
"step": 10225
},
{
"epoch": 0.66,
"learning_rate": 7.176231884057972e-06,
"loss": 0.3955,
"step": 10250
},
{
"epoch": 0.67,
"learning_rate": 7.168985507246378e-06,
"loss": 0.4133,
"step": 10275
},
{
"epoch": 0.67,
"learning_rate": 7.161739130434783e-06,
"loss": 0.454,
"step": 10300
},
{
"epoch": 0.67,
"learning_rate": 7.1544927536231885e-06,
"loss": 0.4465,
"step": 10325
},
{
"epoch": 0.67,
"learning_rate": 7.147246376811595e-06,
"loss": 0.3997,
"step": 10350
},
{
"epoch": 0.67,
"learning_rate": 7.14e-06,
"loss": 0.43,
"step": 10375
},
{
"epoch": 0.67,
"learning_rate": 7.132753623188406e-06,
"loss": 0.373,
"step": 10400
},
{
"epoch": 0.68,
"learning_rate": 7.125507246376813e-06,
"loss": 0.4268,
"step": 10425
},
{
"epoch": 0.68,
"learning_rate": 7.118260869565218e-06,
"loss": 0.331,
"step": 10450
},
{
"epoch": 0.68,
"learning_rate": 7.111014492753624e-06,
"loss": 0.4018,
"step": 10475
},
{
"epoch": 0.68,
"learning_rate": 7.103768115942029e-06,
"loss": 0.3489,
"step": 10500
},
{
"epoch": 0.68,
"learning_rate": 7.096521739130435e-06,
"loss": 0.3914,
"step": 10525
},
{
"epoch": 0.68,
"learning_rate": 7.089275362318841e-06,
"loss": 0.3368,
"step": 10550
},
{
"epoch": 0.68,
"learning_rate": 7.082028985507246e-06,
"loss": 0.3999,
"step": 10575
},
{
"epoch": 0.69,
"learning_rate": 7.074782608695653e-06,
"loss": 0.334,
"step": 10600
},
{
"epoch": 0.69,
"learning_rate": 7.067536231884059e-06,
"loss": 0.4635,
"step": 10625
},
{
"epoch": 0.69,
"learning_rate": 7.060289855072464e-06,
"loss": 0.475,
"step": 10650
},
{
"epoch": 0.69,
"learning_rate": 7.0530434782608705e-06,
"loss": 0.3621,
"step": 10675
},
{
"epoch": 0.69,
"learning_rate": 7.0457971014492755e-06,
"loss": 0.4164,
"step": 10700
},
{
"epoch": 0.69,
"learning_rate": 7.038550724637681e-06,
"loss": 0.3648,
"step": 10725
},
{
"epoch": 0.7,
"learning_rate": 7.031304347826088e-06,
"loss": 0.4358,
"step": 10750
},
{
"epoch": 0.7,
"learning_rate": 7.024057971014493e-06,
"loss": 0.3316,
"step": 10775
},
{
"epoch": 0.7,
"learning_rate": 7.016811594202899e-06,
"loss": 0.4052,
"step": 10800
},
{
"epoch": 0.7,
"learning_rate": 7.009565217391306e-06,
"loss": 0.4474,
"step": 10825
},
{
"epoch": 0.7,
"learning_rate": 7.002318840579711e-06,
"loss": 0.339,
"step": 10850
},
{
"epoch": 0.7,
"learning_rate": 6.9950724637681165e-06,
"loss": 0.3653,
"step": 10875
},
{
"epoch": 0.71,
"learning_rate": 6.9878260869565215e-06,
"loss": 0.3337,
"step": 10900
},
{
"epoch": 0.71,
"learning_rate": 6.980579710144928e-06,
"loss": 0.3516,
"step": 10925
},
{
"epoch": 0.71,
"learning_rate": 6.973333333333334e-06,
"loss": 0.3092,
"step": 10950
},
{
"epoch": 0.71,
"learning_rate": 6.966086956521739e-06,
"loss": 0.4312,
"step": 10975
},
{
"epoch": 0.71,
"learning_rate": 6.958840579710146e-06,
"loss": 0.3808,
"step": 11000
},
{
"epoch": 0.71,
"eval_cer": 7.6264203846721434,
"eval_loss": 0.4016057252883911,
"eval_runtime": 3251.7215,
"eval_samples_per_second": 0.763,
"eval_steps_per_second": 0.382,
"eval_wer": 20.509243377167905,
"step": 11000
},
{
"epoch": 0.71,
"learning_rate": 6.951594202898552e-06,
"loss": 0.6109,
"step": 11025
},
{
"epoch": 0.72,
"learning_rate": 6.944347826086957e-06,
"loss": 0.4322,
"step": 11050
},
{
"epoch": 0.72,
"learning_rate": 6.937101449275363e-06,
"loss": 0.318,
"step": 11075
},
{
"epoch": 0.72,
"learning_rate": 6.929855072463769e-06,
"loss": 0.3855,
"step": 11100
},
{
"epoch": 0.72,
"learning_rate": 6.922608695652174e-06,
"loss": 0.3817,
"step": 11125
},
{
"epoch": 0.72,
"learning_rate": 6.915362318840581e-06,
"loss": 0.384,
"step": 11150
},
{
"epoch": 0.72,
"learning_rate": 6.908115942028986e-06,
"loss": 0.3451,
"step": 11175
},
{
"epoch": 0.73,
"learning_rate": 6.900869565217392e-06,
"loss": 0.3518,
"step": 11200
},
{
"epoch": 0.73,
"learning_rate": 6.8936231884057984e-06,
"loss": 0.4567,
"step": 11225
},
{
"epoch": 0.73,
"learning_rate": 6.886666666666667e-06,
"loss": 0.3848,
"step": 11250
},
{
"epoch": 0.73,
"learning_rate": 6.879420289855073e-06,
"loss": 0.4563,
"step": 11275
},
{
"epoch": 0.73,
"learning_rate": 6.872173913043478e-06,
"loss": 0.3633,
"step": 11300
},
{
"epoch": 0.73,
"learning_rate": 6.864927536231885e-06,
"loss": 0.425,
"step": 11325
},
{
"epoch": 0.74,
"learning_rate": 6.8576811594202905e-06,
"loss": 0.3508,
"step": 11350
},
{
"epoch": 0.74,
"learning_rate": 6.8504347826086955e-06,
"loss": 0.3351,
"step": 11375
},
{
"epoch": 0.74,
"learning_rate": 6.843188405797102e-06,
"loss": 0.4659,
"step": 11400
},
{
"epoch": 0.74,
"learning_rate": 6.835942028985508e-06,
"loss": 0.346,
"step": 11425
},
{
"epoch": 0.74,
"learning_rate": 6.828695652173913e-06,
"loss": 0.3896,
"step": 11450
},
{
"epoch": 0.74,
"learning_rate": 6.82144927536232e-06,
"loss": 0.4153,
"step": 11475
},
{
"epoch": 0.74,
"learning_rate": 6.814202898550725e-06,
"loss": 0.3759,
"step": 11500
},
{
"epoch": 0.75,
"learning_rate": 6.806956521739131e-06,
"loss": 0.3328,
"step": 11525
},
{
"epoch": 0.75,
"learning_rate": 6.799710144927537e-06,
"loss": 0.5639,
"step": 11550
},
{
"epoch": 0.75,
"learning_rate": 6.792463768115942e-06,
"loss": 0.3775,
"step": 11575
},
{
"epoch": 0.75,
"learning_rate": 6.785217391304348e-06,
"loss": 0.4081,
"step": 11600
},
{
"epoch": 0.75,
"learning_rate": 6.777971014492755e-06,
"loss": 0.4266,
"step": 11625
},
{
"epoch": 0.75,
"learning_rate": 6.77072463768116e-06,
"loss": 0.3683,
"step": 11650
},
{
"epoch": 0.76,
"learning_rate": 6.763478260869566e-06,
"loss": 0.4148,
"step": 11675
},
{
"epoch": 0.76,
"learning_rate": 6.756231884057971e-06,
"loss": 0.3413,
"step": 11700
},
{
"epoch": 0.76,
"learning_rate": 6.7489855072463775e-06,
"loss": 0.3954,
"step": 11725
},
{
"epoch": 0.76,
"learning_rate": 6.741739130434783e-06,
"loss": 0.3807,
"step": 11750
},
{
"epoch": 0.76,
"learning_rate": 6.734492753623188e-06,
"loss": 0.3475,
"step": 11775
},
{
"epoch": 0.76,
"learning_rate": 6.727246376811595e-06,
"loss": 0.3428,
"step": 11800
},
{
"epoch": 0.77,
"learning_rate": 6.720000000000001e-06,
"loss": 0.3614,
"step": 11825
},
{
"epoch": 0.77,
"learning_rate": 6.712753623188406e-06,
"loss": 0.3261,
"step": 11850
},
{
"epoch": 0.77,
"learning_rate": 6.705507246376813e-06,
"loss": 0.463,
"step": 11875
},
{
"epoch": 0.77,
"learning_rate": 6.6982608695652184e-06,
"loss": 0.3045,
"step": 11900
},
{
"epoch": 0.77,
"learning_rate": 6.6910144927536235e-06,
"loss": 0.3677,
"step": 11925
},
{
"epoch": 0.77,
"learning_rate": 6.68376811594203e-06,
"loss": 0.3405,
"step": 11950
},
{
"epoch": 0.78,
"learning_rate": 6.676521739130435e-06,
"loss": 0.3467,
"step": 11975
},
{
"epoch": 0.78,
"learning_rate": 6.669275362318841e-06,
"loss": 0.4214,
"step": 12000
},
{
"epoch": 0.78,
"eval_cer": 7.4152688277829695,
"eval_loss": 0.39488446712493896,
"eval_runtime": 3259.8037,
"eval_samples_per_second": 0.761,
"eval_steps_per_second": 0.381,
"eval_wer": 20.093767867352774,
"step": 12000
},
{
"epoch": 0.78,
"learning_rate": 6.662028985507248e-06,
"loss": 0.3608,
"step": 12025
},
{
"epoch": 0.78,
"learning_rate": 6.654782608695653e-06,
"loss": 0.3147,
"step": 12050
},
{
"epoch": 0.78,
"learning_rate": 6.647536231884059e-06,
"loss": 0.2764,
"step": 12075
},
{
"epoch": 0.78,
"learning_rate": 6.6402898550724644e-06,
"loss": 0.3447,
"step": 12100
},
{
"epoch": 0.79,
"learning_rate": 6.63304347826087e-06,
"loss": 0.3727,
"step": 12125
},
{
"epoch": 0.79,
"learning_rate": 6.625797101449276e-06,
"loss": 0.4042,
"step": 12150
},
{
"epoch": 0.79,
"learning_rate": 6.618550724637681e-06,
"loss": 0.3758,
"step": 12175
},
{
"epoch": 0.79,
"learning_rate": 6.611304347826088e-06,
"loss": 0.3582,
"step": 12200
},
{
"epoch": 0.79,
"learning_rate": 6.604057971014494e-06,
"loss": 0.3571,
"step": 12225
},
{
"epoch": 0.79,
"learning_rate": 6.596811594202899e-06,
"loss": 0.3676,
"step": 12250
},
{
"epoch": 0.8,
"learning_rate": 6.5895652173913046e-06,
"loss": 0.3224,
"step": 12275
},
{
"epoch": 0.8,
"learning_rate": 6.582318840579711e-06,
"loss": 0.3025,
"step": 12300
},
{
"epoch": 0.8,
"learning_rate": 6.575072463768116e-06,
"loss": 0.3686,
"step": 12325
},
{
"epoch": 0.8,
"learning_rate": 6.567826086956522e-06,
"loss": 0.3866,
"step": 12350
},
{
"epoch": 0.8,
"learning_rate": 6.560579710144928e-06,
"loss": 0.3662,
"step": 12375
},
{
"epoch": 0.8,
"learning_rate": 6.553333333333334e-06,
"loss": 0.3507,
"step": 12400
},
{
"epoch": 0.8,
"learning_rate": 6.54608695652174e-06,
"loss": 0.3165,
"step": 12425
},
{
"epoch": 0.81,
"learning_rate": 6.538840579710145e-06,
"loss": 0.3616,
"step": 12450
},
{
"epoch": 0.81,
"learning_rate": 6.531594202898551e-06,
"loss": 0.3466,
"step": 12475
},
{
"epoch": 0.81,
"learning_rate": 6.524347826086957e-06,
"loss": 0.5202,
"step": 12500
},
{
"epoch": 0.81,
"learning_rate": 6.517101449275362e-06,
"loss": 0.3789,
"step": 12525
},
{
"epoch": 0.81,
"learning_rate": 6.509855072463769e-06,
"loss": 0.5112,
"step": 12550
},
{
"epoch": 0.81,
"learning_rate": 6.502608695652174e-06,
"loss": 0.353,
"step": 12575
},
{
"epoch": 0.82,
"learning_rate": 6.49536231884058e-06,
"loss": 0.3469,
"step": 12600
},
{
"epoch": 0.82,
"learning_rate": 6.4881159420289865e-06,
"loss": 0.4366,
"step": 12625
},
{
"epoch": 0.82,
"learning_rate": 6.4808695652173915e-06,
"loss": 0.309,
"step": 12650
},
{
"epoch": 0.82,
"learning_rate": 6.473623188405797e-06,
"loss": 0.4358,
"step": 12675
},
{
"epoch": 0.82,
"learning_rate": 6.466376811594204e-06,
"loss": 0.3286,
"step": 12700
},
{
"epoch": 0.82,
"learning_rate": 6.459130434782609e-06,
"loss": 0.2837,
"step": 12725
},
{
"epoch": 0.83,
"learning_rate": 6.451884057971015e-06,
"loss": 0.3613,
"step": 12750
},
{
"epoch": 0.83,
"learning_rate": 6.444637681159422e-06,
"loss": 0.2637,
"step": 12775
},
{
"epoch": 0.83,
"learning_rate": 6.437391304347827e-06,
"loss": 0.3415,
"step": 12800
},
{
"epoch": 0.83,
"learning_rate": 6.4301449275362325e-06,
"loss": 0.371,
"step": 12825
},
{
"epoch": 0.83,
"learning_rate": 6.4228985507246375e-06,
"loss": 0.286,
"step": 12850
},
{
"epoch": 0.83,
"learning_rate": 6.415652173913044e-06,
"loss": 0.3646,
"step": 12875
},
{
"epoch": 0.84,
"learning_rate": 6.40840579710145e-06,
"loss": 0.4352,
"step": 12900
},
{
"epoch": 0.84,
"learning_rate": 6.401159420289855e-06,
"loss": 0.2876,
"step": 12925
},
{
"epoch": 0.84,
"learning_rate": 6.393913043478262e-06,
"loss": 0.3672,
"step": 12950
},
{
"epoch": 0.84,
"learning_rate": 6.386666666666668e-06,
"loss": 0.2878,
"step": 12975
},
{
"epoch": 0.84,
"learning_rate": 6.379420289855073e-06,
"loss": 0.3029,
"step": 13000
},
{
"epoch": 0.84,
"eval_cer": 7.358084509813567,
"eval_loss": 0.3902455270290375,
"eval_runtime": 3231.646,
"eval_samples_per_second": 0.768,
"eval_steps_per_second": 0.384,
"eval_wer": 19.7347055460263,
"step": 13000
},
{
"epoch": 1.55,
"learning_rate": 6.372173913043479e-06,
"loss": 0.3232,
"step": 13025
},
{
"epoch": 1.55,
"learning_rate": 6.364927536231884e-06,
"loss": 0.3888,
"step": 13050
},
{
"epoch": 1.55,
"learning_rate": 6.35768115942029e-06,
"loss": 0.3928,
"step": 13075
},
{
"epoch": 1.55,
"learning_rate": 6.350434782608697e-06,
"loss": 0.3615,
"step": 13100
},
{
"epoch": 1.56,
"learning_rate": 6.343188405797102e-06,
"loss": 0.4292,
"step": 13125
},
{
"epoch": 1.56,
"learning_rate": 6.335942028985508e-06,
"loss": 0.3445,
"step": 13150
},
{
"epoch": 1.56,
"learning_rate": 6.328695652173914e-06,
"loss": 0.3983,
"step": 13175
},
{
"epoch": 1.57,
"learning_rate": 6.3214492753623195e-06,
"loss": 0.3746,
"step": 13200
},
{
"epoch": 1.57,
"learning_rate": 6.314202898550725e-06,
"loss": 0.3714,
"step": 13225
},
{
"epoch": 1.57,
"learning_rate": 6.30695652173913e-06,
"loss": 0.369,
"step": 13250
},
{
"epoch": 1.58,
"learning_rate": 6.299710144927537e-06,
"loss": 0.3991,
"step": 13275
},
{
"epoch": 1.58,
"learning_rate": 6.292463768115943e-06,
"loss": 0.4264,
"step": 13300
},
{
"epoch": 1.58,
"learning_rate": 6.285217391304348e-06,
"loss": 0.2885,
"step": 13325
},
{
"epoch": 1.58,
"learning_rate": 6.277971014492754e-06,
"loss": 0.3356,
"step": 13350
},
{
"epoch": 1.59,
"learning_rate": 6.2707246376811605e-06,
"loss": 0.3758,
"step": 13375
},
{
"epoch": 1.59,
"learning_rate": 6.2634782608695655e-06,
"loss": 0.3424,
"step": 13400
},
{
"epoch": 1.59,
"learning_rate": 6.256231884057971e-06,
"loss": 0.3376,
"step": 13425
},
{
"epoch": 1.6,
"learning_rate": 6.248985507246378e-06,
"loss": 0.3928,
"step": 13450
},
{
"epoch": 1.6,
"learning_rate": 6.241739130434783e-06,
"loss": 0.3247,
"step": 13475
},
{
"epoch": 1.6,
"learning_rate": 6.234492753623189e-06,
"loss": 0.3002,
"step": 13500
},
{
"epoch": 1.6,
"learning_rate": 6.227246376811594e-06,
"loss": 0.2954,
"step": 13525
},
{
"epoch": 1.61,
"learning_rate": 6.220000000000001e-06,
"loss": 0.3292,
"step": 13550
},
{
"epoch": 1.61,
"learning_rate": 6.213043478260871e-06,
"loss": 0.3325,
"step": 13575
},
{
"epoch": 1.61,
"learning_rate": 6.205797101449276e-06,
"loss": 0.3929,
"step": 13600
},
{
"epoch": 1.62,
"learning_rate": 6.198550724637682e-06,
"loss": 0.3311,
"step": 13625
},
{
"epoch": 1.62,
"learning_rate": 6.191304347826087e-06,
"loss": 0.2803,
"step": 13650
},
{
"epoch": 1.62,
"learning_rate": 6.1840579710144935e-06,
"loss": 0.3777,
"step": 13675
},
{
"epoch": 1.63,
"learning_rate": 6.176811594202899e-06,
"loss": 0.387,
"step": 13700
},
{
"epoch": 1.63,
"learning_rate": 6.169565217391304e-06,
"loss": 0.3304,
"step": 13725
},
{
"epoch": 1.63,
"learning_rate": 6.162318840579711e-06,
"loss": 0.4854,
"step": 13750
},
{
"epoch": 1.63,
"learning_rate": 6.155072463768117e-06,
"loss": 0.3572,
"step": 13775
},
{
"epoch": 1.64,
"learning_rate": 6.147826086956522e-06,
"loss": 0.3484,
"step": 13800
},
{
"epoch": 1.64,
"learning_rate": 6.140579710144929e-06,
"loss": 0.3671,
"step": 13825
},
{
"epoch": 1.64,
"learning_rate": 6.133333333333334e-06,
"loss": 0.376,
"step": 13850
},
{
"epoch": 1.65,
"learning_rate": 6.1260869565217395e-06,
"loss": 0.3435,
"step": 13875
},
{
"epoch": 1.65,
"learning_rate": 6.118840579710146e-06,
"loss": 0.4171,
"step": 13900
},
{
"epoch": 1.65,
"learning_rate": 6.111594202898551e-06,
"loss": 0.3793,
"step": 13925
},
{
"epoch": 1.66,
"learning_rate": 6.104347826086957e-06,
"loss": 0.4026,
"step": 13950
},
{
"epoch": 1.66,
"learning_rate": 6.097101449275363e-06,
"loss": 0.3086,
"step": 13975
},
{
"epoch": 1.66,
"learning_rate": 6.089855072463769e-06,
"loss": 0.3549,
"step": 14000
},
{
"epoch": 1.66,
"eval_cer": 7.119509075704658,
"eval_loss": 0.39083221554756165,
"eval_runtime": 3180.5722,
"eval_samples_per_second": 0.78,
"eval_steps_per_second": 0.39,
"eval_wer": 19.411473222793976,
"step": 14000
},
{
"epoch": 1.66,
"learning_rate": 6.082608695652175e-06,
"loss": 0.3889,
"step": 14025
},
{
"epoch": 1.67,
"learning_rate": 6.07536231884058e-06,
"loss": 0.3197,
"step": 14050
},
{
"epoch": 1.67,
"learning_rate": 6.068115942028986e-06,
"loss": 0.3279,
"step": 14075
},
{
"epoch": 1.67,
"learning_rate": 6.060869565217392e-06,
"loss": 0.4178,
"step": 14100
},
{
"epoch": 1.68,
"learning_rate": 6.053623188405797e-06,
"loss": 0.3872,
"step": 14125
},
{
"epoch": 1.68,
"learning_rate": 6.046376811594203e-06,
"loss": 0.3375,
"step": 14150
},
{
"epoch": 1.68,
"learning_rate": 6.03913043478261e-06,
"loss": 0.4023,
"step": 14175
},
{
"epoch": 1.69,
"learning_rate": 6.031884057971015e-06,
"loss": 0.4128,
"step": 14200
},
{
"epoch": 1.69,
"learning_rate": 6.024637681159421e-06,
"loss": 0.3603,
"step": 14225
},
{
"epoch": 1.69,
"learning_rate": 6.0173913043478264e-06,
"loss": 0.3824,
"step": 14250
},
{
"epoch": 1.69,
"learning_rate": 6.010144927536232e-06,
"loss": 0.4071,
"step": 14275
},
{
"epoch": 1.7,
"learning_rate": 6.002898550724638e-06,
"loss": 0.2672,
"step": 14300
},
{
"epoch": 1.7,
"learning_rate": 5.995652173913043e-06,
"loss": 0.327,
"step": 14325
},
{
"epoch": 1.7,
"learning_rate": 5.98840579710145e-06,
"loss": 0.3569,
"step": 14350
},
{
"epoch": 1.71,
"learning_rate": 5.981159420289856e-06,
"loss": 0.3308,
"step": 14375
},
{
"epoch": 1.71,
"learning_rate": 5.973913043478261e-06,
"loss": 0.3802,
"step": 14400
},
{
"epoch": 1.71,
"learning_rate": 5.966666666666667e-06,
"loss": 0.4012,
"step": 14425
},
{
"epoch": 1.71,
"learning_rate": 5.959420289855073e-06,
"loss": 0.3191,
"step": 14450
},
{
"epoch": 1.72,
"learning_rate": 5.952173913043478e-06,
"loss": 0.2991,
"step": 14475
},
{
"epoch": 1.72,
"learning_rate": 5.944927536231885e-06,
"loss": 0.3889,
"step": 14500
},
{
"epoch": 1.72,
"learning_rate": 5.93768115942029e-06,
"loss": 0.3315,
"step": 14525
},
{
"epoch": 1.73,
"learning_rate": 5.930434782608696e-06,
"loss": 0.3925,
"step": 14550
},
{
"epoch": 1.73,
"learning_rate": 5.9231884057971025e-06,
"loss": 0.3661,
"step": 14575
},
{
"epoch": 1.73,
"learning_rate": 5.9159420289855076e-06,
"loss": 0.4426,
"step": 14600
},
{
"epoch": 1.74,
"learning_rate": 5.908695652173913e-06,
"loss": 0.4046,
"step": 14625
},
{
"epoch": 1.74,
"learning_rate": 5.90144927536232e-06,
"loss": 0.3361,
"step": 14650
},
{
"epoch": 1.74,
"learning_rate": 5.894202898550725e-06,
"loss": 0.4759,
"step": 14675
},
{
"epoch": 1.74,
"learning_rate": 5.886956521739131e-06,
"loss": 0.4326,
"step": 14700
},
{
"epoch": 1.75,
"learning_rate": 5.879710144927536e-06,
"loss": 0.2716,
"step": 14725
},
{
"epoch": 1.75,
"learning_rate": 5.872463768115943e-06,
"loss": 0.3416,
"step": 14750
},
{
"epoch": 1.75,
"learning_rate": 5.8652173913043485e-06,
"loss": 0.3715,
"step": 14775
},
{
"epoch": 1.76,
"learning_rate": 5.8579710144927535e-06,
"loss": 0.3737,
"step": 14800
},
{
"epoch": 1.76,
"learning_rate": 5.85072463768116e-06,
"loss": 0.309,
"step": 14825
},
{
"epoch": 1.76,
"learning_rate": 5.843478260869566e-06,
"loss": 0.3327,
"step": 14850
},
{
"epoch": 1.77,
"learning_rate": 5.836231884057971e-06,
"loss": 0.401,
"step": 14875
},
{
"epoch": 1.77,
"learning_rate": 5.828985507246378e-06,
"loss": 0.2827,
"step": 14900
},
{
"epoch": 1.77,
"learning_rate": 5.821739130434783e-06,
"loss": 0.3644,
"step": 14925
},
{
"epoch": 1.77,
"learning_rate": 5.814492753623189e-06,
"loss": 0.3638,
"step": 14950
},
{
"epoch": 1.78,
"learning_rate": 5.807246376811595e-06,
"loss": 0.4652,
"step": 14975
},
{
"epoch": 1.78,
"learning_rate": 5.8e-06,
"loss": 0.3385,
"step": 15000
},
{
"epoch": 1.78,
"eval_cer": 7.779157853313001,
"eval_loss": 0.39061304926872253,
"eval_runtime": 3221.9453,
"eval_samples_per_second": 0.77,
"eval_steps_per_second": 0.385,
"eval_wer": 20.20506956356013,
"step": 15000
},
{
"epoch": 1.78,
"learning_rate": 5.792753623188406e-06,
"loss": 0.4065,
"step": 15025
},
{
"epoch": 1.79,
"learning_rate": 5.785507246376812e-06,
"loss": 0.4354,
"step": 15050
},
{
"epoch": 1.79,
"learning_rate": 5.778260869565218e-06,
"loss": 0.3932,
"step": 15075
},
{
"epoch": 1.79,
"learning_rate": 5.771014492753624e-06,
"loss": 0.3212,
"step": 15100
},
{
"epoch": 1.79,
"learning_rate": 5.76376811594203e-06,
"loss": 0.4244,
"step": 15125
},
{
"epoch": 1.8,
"learning_rate": 5.7565217391304355e-06,
"loss": 0.306,
"step": 15150
},
{
"epoch": 1.8,
"learning_rate": 5.749275362318841e-06,
"loss": 0.3492,
"step": 15175
},
{
"epoch": 1.8,
"learning_rate": 5.742028985507246e-06,
"loss": 0.3573,
"step": 15200
},
{
"epoch": 1.81,
"learning_rate": 5.734782608695652e-06,
"loss": 0.3975,
"step": 15225
},
{
"epoch": 1.81,
"learning_rate": 5.727536231884059e-06,
"loss": 0.3276,
"step": 15250
},
{
"epoch": 1.81,
"learning_rate": 5.720289855072464e-06,
"loss": 0.3638,
"step": 15275
},
{
"epoch": 1.82,
"learning_rate": 5.71304347826087e-06,
"loss": 0.3312,
"step": 15300
},
{
"epoch": 1.82,
"learning_rate": 5.7057971014492765e-06,
"loss": 0.3026,
"step": 15325
},
{
"epoch": 1.82,
"learning_rate": 5.6985507246376815e-06,
"loss": 0.3493,
"step": 15350
},
{
"epoch": 1.82,
"learning_rate": 5.691304347826087e-06,
"loss": 0.309,
"step": 15375
},
{
"epoch": 1.83,
"learning_rate": 5.684057971014492e-06,
"loss": 0.2761,
"step": 15400
},
{
"epoch": 1.83,
"learning_rate": 5.676811594202899e-06,
"loss": 0.3507,
"step": 15425
},
{
"epoch": 1.83,
"learning_rate": 5.669565217391305e-06,
"loss": 0.3359,
"step": 15450
},
{
"epoch": 1.84,
"learning_rate": 5.66231884057971e-06,
"loss": 0.3132,
"step": 15475
},
{
"epoch": 1.84,
"learning_rate": 5.655072463768117e-06,
"loss": 0.2976,
"step": 15500
},
{
"epoch": 1.84,
"learning_rate": 5.6478260869565225e-06,
"loss": 0.3893,
"step": 15525
},
{
"epoch": 1.85,
"learning_rate": 5.6405797101449275e-06,
"loss": 0.3417,
"step": 15550
},
{
"epoch": 1.85,
"learning_rate": 5.633333333333334e-06,
"loss": 0.3462,
"step": 15575
},
{
"epoch": 1.85,
"learning_rate": 5.626086956521739e-06,
"loss": 0.3885,
"step": 15600
},
{
"epoch": 1.85,
"learning_rate": 5.618840579710145e-06,
"loss": 0.3844,
"step": 15625
},
{
"epoch": 1.86,
"learning_rate": 5.611594202898552e-06,
"loss": 0.3112,
"step": 15650
},
{
"epoch": 1.86,
"learning_rate": 5.604347826086957e-06,
"loss": 0.3266,
"step": 15675
},
{
"epoch": 1.86,
"learning_rate": 5.597101449275363e-06,
"loss": 0.3538,
"step": 15700
},
{
"epoch": 1.87,
"learning_rate": 5.589855072463769e-06,
"loss": 0.351,
"step": 15725
},
{
"epoch": 1.87,
"learning_rate": 5.582608695652174e-06,
"loss": 0.3373,
"step": 15750
},
{
"epoch": 1.87,
"learning_rate": 5.57536231884058e-06,
"loss": 0.4156,
"step": 15775
},
{
"epoch": 1.87,
"learning_rate": 5.568115942028985e-06,
"loss": 0.4124,
"step": 15800
},
{
"epoch": 1.88,
"learning_rate": 5.560869565217392e-06,
"loss": 0.3716,
"step": 15825
},
{
"epoch": 1.88,
"learning_rate": 5.553623188405798e-06,
"loss": 0.5276,
"step": 15850
},
{
"epoch": 1.88,
"learning_rate": 5.546376811594203e-06,
"loss": 0.3412,
"step": 15875
},
{
"epoch": 1.89,
"learning_rate": 5.5391304347826094e-06,
"loss": 0.3293,
"step": 15900
},
{
"epoch": 1.89,
"learning_rate": 5.531884057971015e-06,
"loss": 0.3759,
"step": 15925
},
{
"epoch": 1.89,
"learning_rate": 5.52463768115942e-06,
"loss": 0.3926,
"step": 15950
},
{
"epoch": 1.9,
"learning_rate": 5.517391304347827e-06,
"loss": 0.3686,
"step": 15975
},
{
"epoch": 1.9,
"learning_rate": 5.510144927536233e-06,
"loss": 0.3282,
"step": 16000
},
{
"epoch": 1.9,
"eval_cer": 7.108072212110778,
"eval_loss": 0.39232152700424194,
"eval_runtime": 3154.8615,
"eval_samples_per_second": 0.787,
"eval_steps_per_second": 0.393,
"eval_wer": 19.265103868877453,
"step": 16000
},
{
"epoch": 1.9,
"learning_rate": 5.502898550724638e-06,
"loss": 0.3279,
"step": 16025
},
{
"epoch": 1.9,
"learning_rate": 5.4956521739130446e-06,
"loss": 0.4442,
"step": 16050
},
{
"epoch": 1.91,
"learning_rate": 5.4884057971014496e-06,
"loss": 0.4354,
"step": 16075
},
{
"epoch": 1.91,
"learning_rate": 5.481159420289855e-06,
"loss": 0.362,
"step": 16100
},
{
"epoch": 1.91,
"learning_rate": 5.473913043478261e-06,
"loss": 0.3849,
"step": 16125
},
{
"epoch": 1.92,
"learning_rate": 5.466666666666667e-06,
"loss": 0.3956,
"step": 16150
},
{
"epoch": 1.92,
"learning_rate": 5.459420289855073e-06,
"loss": 0.2881,
"step": 16175
},
{
"epoch": 1.92,
"learning_rate": 5.452173913043479e-06,
"loss": 0.3321,
"step": 16200
},
{
"epoch": 1.93,
"learning_rate": 5.444927536231885e-06,
"loss": 0.3512,
"step": 16225
},
{
"epoch": 1.93,
"learning_rate": 5.4376811594202905e-06,
"loss": 0.3227,
"step": 16250
},
{
"epoch": 1.93,
"learning_rate": 5.4304347826086955e-06,
"loss": 0.3204,
"step": 16275
},
{
"epoch": 1.93,
"learning_rate": 5.423188405797101e-06,
"loss": 0.2884,
"step": 16300
},
{
"epoch": 1.94,
"learning_rate": 5.415942028985508e-06,
"loss": 0.3259,
"step": 16325
},
{
"epoch": 1.94,
"learning_rate": 5.408695652173913e-06,
"loss": 0.3611,
"step": 16350
},
{
"epoch": 1.94,
"learning_rate": 5.401449275362319e-06,
"loss": 0.3598,
"step": 16375
},
{
"epoch": 1.95,
"learning_rate": 5.394202898550726e-06,
"loss": 0.3911,
"step": 16400
},
{
"epoch": 1.95,
"learning_rate": 5.386956521739131e-06,
"loss": 0.4117,
"step": 16425
},
{
"epoch": 1.95,
"learning_rate": 5.3797101449275365e-06,
"loss": 0.4095,
"step": 16450
},
{
"epoch": 1.96,
"learning_rate": 5.3724637681159415e-06,
"loss": 0.3033,
"step": 16475
},
{
"epoch": 1.96,
"learning_rate": 5.365217391304348e-06,
"loss": 0.3534,
"step": 16500
},
{
"epoch": 1.96,
"learning_rate": 5.357971014492754e-06,
"loss": 0.2906,
"step": 16525
},
{
"epoch": 1.96,
"learning_rate": 5.350724637681159e-06,
"loss": 0.2948,
"step": 16550
},
{
"epoch": 1.97,
"learning_rate": 5.343478260869566e-06,
"loss": 0.2731,
"step": 16575
},
{
"epoch": 1.97,
"learning_rate": 5.336231884057972e-06,
"loss": 0.3218,
"step": 16600
},
{
"epoch": 1.97,
"learning_rate": 5.328985507246377e-06,
"loss": 0.328,
"step": 16625
},
{
"epoch": 1.98,
"learning_rate": 5.321739130434783e-06,
"loss": 0.274,
"step": 16650
},
{
"epoch": 1.98,
"learning_rate": 5.314492753623189e-06,
"loss": 0.2936,
"step": 16675
},
{
"epoch": 1.98,
"learning_rate": 5.307246376811594e-06,
"loss": 0.3601,
"step": 16700
},
{
"epoch": 1.98,
"learning_rate": 5.3002898550724646e-06,
"loss": 0.4228,
"step": 16725
},
{
"epoch": 1.99,
"learning_rate": 5.2930434782608696e-06,
"loss": 0.3024,
"step": 16750
},
{
"epoch": 1.99,
"learning_rate": 5.285797101449276e-06,
"loss": 0.3463,
"step": 16775
},
{
"epoch": 1.99,
"learning_rate": 5.278550724637682e-06,
"loss": 0.3282,
"step": 16800
},
{
"epoch": 2.0,
"learning_rate": 5.271304347826087e-06,
"loss": 0.3138,
"step": 16825
},
{
"epoch": 2.0,
"learning_rate": 5.264057971014494e-06,
"loss": 0.3608,
"step": 16850
},
{
"epoch": 2.0,
"learning_rate": 5.256811594202899e-06,
"loss": 0.2716,
"step": 16875
},
{
"epoch": 2.01,
"learning_rate": 5.249565217391305e-06,
"loss": 0.4661,
"step": 16900
},
{
"epoch": 2.01,
"learning_rate": 5.242318840579711e-06,
"loss": 0.2482,
"step": 16925
},
{
"epoch": 2.01,
"learning_rate": 5.235072463768116e-06,
"loss": 0.34,
"step": 16950
},
{
"epoch": 2.01,
"learning_rate": 5.227826086956522e-06,
"loss": 0.3228,
"step": 16975
},
{
"epoch": 2.02,
"learning_rate": 5.220579710144928e-06,
"loss": 0.3196,
"step": 17000
},
{
"epoch": 2.02,
"eval_cer": 7.224900388607408,
"eval_loss": 0.39229413866996765,
"eval_runtime": 3162.0207,
"eval_samples_per_second": 0.785,
"eval_steps_per_second": 0.392,
"eval_wer": 19.335239184295787,
"step": 17000
},
{
"epoch": 2.02,
"learning_rate": 5.213333333333334e-06,
"loss": 0.2583,
"step": 17025
},
{
"epoch": 2.02,
"learning_rate": 5.20608695652174e-06,
"loss": 0.248,
"step": 17050
},
{
"epoch": 2.03,
"learning_rate": 5.198840579710145e-06,
"loss": 0.2901,
"step": 17075
},
{
"epoch": 2.03,
"learning_rate": 5.191594202898551e-06,
"loss": 0.2492,
"step": 17100
},
{
"epoch": 2.03,
"learning_rate": 5.184347826086957e-06,
"loss": 0.3115,
"step": 17125
},
{
"epoch": 2.04,
"learning_rate": 5.177101449275362e-06,
"loss": 0.3328,
"step": 17150
},
{
"epoch": 2.04,
"learning_rate": 5.169855072463768e-06,
"loss": 0.2782,
"step": 17175
},
{
"epoch": 2.04,
"learning_rate": 5.162608695652175e-06,
"loss": 0.2778,
"step": 17200
},
{
"epoch": 2.04,
"learning_rate": 5.15536231884058e-06,
"loss": 0.2721,
"step": 17225
},
{
"epoch": 2.05,
"learning_rate": 5.148115942028986e-06,
"loss": 0.361,
"step": 17250
},
{
"epoch": 2.05,
"learning_rate": 5.140869565217391e-06,
"loss": 0.3612,
"step": 17275
},
{
"epoch": 2.05,
"learning_rate": 5.1336231884057975e-06,
"loss": 0.2824,
"step": 17300
},
{
"epoch": 2.06,
"learning_rate": 5.126376811594203e-06,
"loss": 0.2909,
"step": 17325
},
{
"epoch": 2.06,
"learning_rate": 5.119130434782608e-06,
"loss": 0.2773,
"step": 17350
},
{
"epoch": 2.06,
"learning_rate": 5.111884057971015e-06,
"loss": 0.3971,
"step": 17375
},
{
"epoch": 2.06,
"learning_rate": 5.104637681159421e-06,
"loss": 0.2334,
"step": 17400
},
{
"epoch": 2.07,
"learning_rate": 5.097391304347826e-06,
"loss": 0.3899,
"step": 17425
},
{
"epoch": 2.07,
"learning_rate": 5.090144927536233e-06,
"loss": 0.321,
"step": 17450
},
{
"epoch": 2.07,
"learning_rate": 5.082898550724638e-06,
"loss": 0.2295,
"step": 17475
},
{
"epoch": 2.08,
"learning_rate": 5.0756521739130435e-06,
"loss": 0.278,
"step": 17500
},
{
"epoch": 2.08,
"learning_rate": 5.06840579710145e-06,
"loss": 0.2696,
"step": 17525
},
{
"epoch": 2.08,
"learning_rate": 5.061159420289855e-06,
"loss": 0.2604,
"step": 17550
},
{
"epoch": 2.09,
"learning_rate": 5.053913043478261e-06,
"loss": 0.3015,
"step": 17575
},
{
"epoch": 2.09,
"learning_rate": 5.046666666666668e-06,
"loss": 0.1998,
"step": 17600
},
{
"epoch": 2.09,
"learning_rate": 5.039420289855073e-06,
"loss": 0.3426,
"step": 17625
},
{
"epoch": 2.09,
"learning_rate": 5.032173913043479e-06,
"loss": 0.3037,
"step": 17650
},
{
"epoch": 2.1,
"learning_rate": 5.024927536231885e-06,
"loss": 0.3063,
"step": 17675
},
{
"epoch": 2.1,
"learning_rate": 5.01768115942029e-06,
"loss": 0.2932,
"step": 17700
},
{
"epoch": 2.1,
"learning_rate": 5.010434782608696e-06,
"loss": 0.3028,
"step": 17725
},
{
"epoch": 2.11,
"learning_rate": 5.003188405797101e-06,
"loss": 0.2644,
"step": 17750
},
{
"epoch": 2.11,
"learning_rate": 4.995942028985508e-06,
"loss": 0.2902,
"step": 17775
},
{
"epoch": 2.11,
"learning_rate": 4.988695652173913e-06,
"loss": 0.2816,
"step": 17800
},
{
"epoch": 2.12,
"learning_rate": 4.98144927536232e-06,
"loss": 0.3323,
"step": 17825
},
{
"epoch": 2.12,
"learning_rate": 4.9742028985507255e-06,
"loss": 0.2923,
"step": 17850
},
{
"epoch": 2.12,
"learning_rate": 4.9669565217391305e-06,
"loss": 0.3281,
"step": 17875
},
{
"epoch": 2.12,
"learning_rate": 4.959710144927536e-06,
"loss": 0.3877,
"step": 17900
},
{
"epoch": 2.13,
"learning_rate": 4.952463768115943e-06,
"loss": 0.372,
"step": 17925
},
{
"epoch": 2.13,
"learning_rate": 4.945217391304348e-06,
"loss": 0.2854,
"step": 17950
},
{
"epoch": 2.13,
"learning_rate": 4.937971014492754e-06,
"loss": 0.3001,
"step": 17975
},
{
"epoch": 2.14,
"learning_rate": 4.93072463768116e-06,
"loss": 0.3251,
"step": 18000
},
{
"epoch": 2.14,
"eval_cer": 7.176078508534606,
"eval_loss": 0.39806175231933594,
"eval_runtime": 3134.0346,
"eval_samples_per_second": 0.792,
"eval_steps_per_second": 0.396,
"eval_wer": 19.483133218982278,
"step": 18000
},
{
"epoch": 2.14,
"learning_rate": 4.923478260869566e-06,
"loss": 0.3021,
"step": 18025
},
{
"epoch": 2.14,
"learning_rate": 4.9162318840579714e-06,
"loss": 0.2846,
"step": 18050
},
{
"epoch": 2.14,
"learning_rate": 4.908985507246377e-06,
"loss": 0.284,
"step": 18075
},
{
"epoch": 2.15,
"learning_rate": 4.901739130434783e-06,
"loss": 0.2423,
"step": 18100
},
{
"epoch": 2.15,
"learning_rate": 4.894492753623189e-06,
"loss": 0.2551,
"step": 18125
},
{
"epoch": 2.15,
"learning_rate": 4.887246376811595e-06,
"loss": 0.4317,
"step": 18150
},
{
"epoch": 2.16,
"learning_rate": 4.880000000000001e-06,
"loss": 0.4729,
"step": 18175
},
{
"epoch": 2.16,
"learning_rate": 4.872753623188406e-06,
"loss": 0.2887,
"step": 18200
},
{
"epoch": 2.16,
"learning_rate": 4.865507246376812e-06,
"loss": 0.4263,
"step": 18225
},
{
"epoch": 2.17,
"learning_rate": 4.8582608695652174e-06,
"loss": 0.3566,
"step": 18250
},
{
"epoch": 2.17,
"learning_rate": 4.851014492753623e-06,
"loss": 0.3274,
"step": 18275
},
{
"epoch": 2.17,
"learning_rate": 4.843768115942029e-06,
"loss": 0.2818,
"step": 18300
},
{
"epoch": 2.17,
"learning_rate": 4.836521739130435e-06,
"loss": 0.29,
"step": 18325
},
{
"epoch": 2.18,
"learning_rate": 4.829275362318841e-06,
"loss": 0.3009,
"step": 18350
},
{
"epoch": 2.18,
"learning_rate": 4.822028985507247e-06,
"loss": 0.3663,
"step": 18375
},
{
"epoch": 2.18,
"learning_rate": 4.8147826086956526e-06,
"loss": 0.2181,
"step": 18400
},
{
"epoch": 2.19,
"learning_rate": 4.807536231884058e-06,
"loss": 0.4402,
"step": 18425
},
{
"epoch": 2.19,
"learning_rate": 4.800289855072464e-06,
"loss": 0.3224,
"step": 18450
},
{
"epoch": 2.19,
"learning_rate": 4.79304347826087e-06,
"loss": 0.4503,
"step": 18475
},
{
"epoch": 2.2,
"learning_rate": 4.785797101449276e-06,
"loss": 0.3597,
"step": 18500
},
{
"epoch": 2.2,
"learning_rate": 4.778550724637682e-06,
"loss": 0.3584,
"step": 18525
},
{
"epoch": 2.2,
"learning_rate": 4.771304347826088e-06,
"loss": 0.3391,
"step": 18550
},
{
"epoch": 2.2,
"learning_rate": 4.764057971014493e-06,
"loss": 0.3192,
"step": 18575
},
{
"epoch": 2.21,
"learning_rate": 4.756811594202899e-06,
"loss": 0.3671,
"step": 18600
},
{
"epoch": 2.21,
"learning_rate": 4.749565217391305e-06,
"loss": 0.3506,
"step": 18625
},
{
"epoch": 2.21,
"learning_rate": 4.74231884057971e-06,
"loss": 0.3515,
"step": 18650
},
{
"epoch": 2.22,
"learning_rate": 4.735072463768116e-06,
"loss": 0.2615,
"step": 18675
},
{
"epoch": 2.22,
"learning_rate": 4.727826086956522e-06,
"loss": 0.2509,
"step": 18700
},
{
"epoch": 2.22,
"learning_rate": 4.720579710144928e-06,
"loss": 0.3,
"step": 18725
},
{
"epoch": 2.22,
"learning_rate": 4.713333333333334e-06,
"loss": 0.302,
"step": 18750
},
{
"epoch": 2.23,
"learning_rate": 4.7060869565217395e-06,
"loss": 0.2971,
"step": 18775
},
{
"epoch": 2.23,
"learning_rate": 4.698840579710145e-06,
"loss": 0.4138,
"step": 18800
},
{
"epoch": 2.23,
"learning_rate": 4.691594202898551e-06,
"loss": 0.296,
"step": 18825
},
{
"epoch": 2.24,
"learning_rate": 4.684347826086957e-06,
"loss": 0.2533,
"step": 18850
},
{
"epoch": 2.24,
"learning_rate": 4.677101449275362e-06,
"loss": 0.2477,
"step": 18875
},
{
"epoch": 2.24,
"learning_rate": 4.669855072463769e-06,
"loss": 0.2952,
"step": 18900
},
{
"epoch": 2.25,
"learning_rate": 4.662608695652175e-06,
"loss": 0.2471,
"step": 18925
},
{
"epoch": 2.25,
"learning_rate": 4.65536231884058e-06,
"loss": 0.2664,
"step": 18950
},
{
"epoch": 2.25,
"learning_rate": 4.6481159420289855e-06,
"loss": 0.2127,
"step": 18975
},
{
"epoch": 2.25,
"learning_rate": 4.640869565217392e-06,
"loss": 0.4162,
"step": 19000
},
{
"epoch": 2.25,
"eval_cer": 7.059004377982194,
"eval_loss": 0.39584028720855713,
"eval_runtime": 3153.6429,
"eval_samples_per_second": 0.787,
"eval_steps_per_second": 0.394,
"eval_wer": 19.057747284162378,
"step": 19000
},
{
"epoch": 2.26,
"learning_rate": 4.633623188405797e-06,
"loss": 0.286,
"step": 19025
},
{
"epoch": 2.26,
"learning_rate": 4.626376811594203e-06,
"loss": 0.2912,
"step": 19050
},
{
"epoch": 2.26,
"learning_rate": 4.619130434782609e-06,
"loss": 0.2905,
"step": 19075
},
{
"epoch": 2.27,
"learning_rate": 4.611884057971015e-06,
"loss": 0.333,
"step": 19100
},
{
"epoch": 2.27,
"learning_rate": 4.604637681159421e-06,
"loss": 0.2647,
"step": 19125
},
{
"epoch": 2.27,
"learning_rate": 4.5973913043478265e-06,
"loss": 0.2746,
"step": 19150
},
{
"epoch": 2.28,
"learning_rate": 4.590144927536232e-06,
"loss": 0.3317,
"step": 19175
},
{
"epoch": 2.28,
"learning_rate": 4.582898550724638e-06,
"loss": 0.2549,
"step": 19200
},
{
"epoch": 2.28,
"learning_rate": 4.575652173913044e-06,
"loss": 0.312,
"step": 19225
},
{
"epoch": 2.28,
"learning_rate": 4.56840579710145e-06,
"loss": 0.3177,
"step": 19250
},
{
"epoch": 2.29,
"learning_rate": 4.561159420289856e-06,
"loss": 0.3063,
"step": 19275
},
{
"epoch": 2.29,
"learning_rate": 4.553913043478262e-06,
"loss": 0.3964,
"step": 19300
},
{
"epoch": 2.29,
"learning_rate": 4.546666666666667e-06,
"loss": 0.3377,
"step": 19325
},
{
"epoch": 2.3,
"learning_rate": 4.5394202898550725e-06,
"loss": 0.2753,
"step": 19350
},
{
"epoch": 2.3,
"learning_rate": 4.532173913043479e-06,
"loss": 0.2735,
"step": 19375
},
{
"epoch": 2.3,
"learning_rate": 4.524927536231884e-06,
"loss": 0.292,
"step": 19400
},
{
"epoch": 2.31,
"learning_rate": 4.51768115942029e-06,
"loss": 0.2894,
"step": 19425
},
{
"epoch": 2.31,
"learning_rate": 4.510434782608696e-06,
"loss": 0.367,
"step": 19450
},
{
"epoch": 2.31,
"learning_rate": 4.503188405797102e-06,
"loss": 0.2483,
"step": 19475
},
{
"epoch": 2.31,
"learning_rate": 4.495942028985508e-06,
"loss": 0.4151,
"step": 19500
},
{
"epoch": 2.32,
"learning_rate": 4.4886956521739134e-06,
"loss": 0.269,
"step": 19525
},
{
"epoch": 2.32,
"learning_rate": 4.481449275362319e-06,
"loss": 0.3127,
"step": 19550
},
{
"epoch": 2.32,
"learning_rate": 4.474202898550725e-06,
"loss": 0.2615,
"step": 19575
},
{
"epoch": 2.33,
"learning_rate": 4.466956521739131e-06,
"loss": 0.2606,
"step": 19600
},
{
"epoch": 2.33,
"learning_rate": 4.459710144927537e-06,
"loss": 0.2855,
"step": 19625
},
{
"epoch": 2.33,
"learning_rate": 4.452463768115942e-06,
"loss": 0.2419,
"step": 19650
},
{
"epoch": 2.33,
"learning_rate": 4.4452173913043486e-06,
"loss": 0.3292,
"step": 19675
},
{
"epoch": 2.34,
"learning_rate": 4.4379710144927544e-06,
"loss": 0.2821,
"step": 19700
},
{
"epoch": 2.34,
"learning_rate": 4.4307246376811594e-06,
"loss": 0.3189,
"step": 19725
},
{
"epoch": 2.34,
"learning_rate": 4.423478260869565e-06,
"loss": 0.286,
"step": 19750
},
{
"epoch": 2.35,
"learning_rate": 4.416231884057971e-06,
"loss": 0.2853,
"step": 19775
},
{
"epoch": 2.35,
"learning_rate": 4.408985507246377e-06,
"loss": 0.2835,
"step": 19800
},
{
"epoch": 2.35,
"learning_rate": 4.401739130434783e-06,
"loss": 0.2626,
"step": 19825
},
{
"epoch": 2.36,
"learning_rate": 4.394492753623189e-06,
"loss": 0.3301,
"step": 19850
},
{
"epoch": 2.36,
"learning_rate": 4.3872463768115946e-06,
"loss": 0.3094,
"step": 19875
},
{
"epoch": 2.36,
"learning_rate": 4.380289855072464e-06,
"loss": 0.2322,
"step": 19900
},
{
"epoch": 2.36,
"learning_rate": 4.37304347826087e-06,
"loss": 0.3167,
"step": 19925
},
{
"epoch": 2.37,
"learning_rate": 4.365797101449276e-06,
"loss": 0.3029,
"step": 19950
},
{
"epoch": 2.37,
"learning_rate": 4.358550724637682e-06,
"loss": 0.2892,
"step": 19975
},
{
"epoch": 2.37,
"learning_rate": 4.3513043478260875e-06,
"loss": 0.2851,
"step": 20000
},
{
"epoch": 2.37,
"eval_cer": 7.0167002803876235,
"eval_loss": 0.39532455801963806,
"eval_runtime": 3151.9912,
"eval_samples_per_second": 0.787,
"eval_steps_per_second": 0.394,
"eval_wer": 19.209453020773775,
"step": 20000
},
{
"epoch": 2.38,
"learning_rate": 4.344057971014493e-06,
"loss": 0.2749,
"step": 20025
},
{
"epoch": 2.38,
"learning_rate": 4.336811594202899e-06,
"loss": 0.3344,
"step": 20050
},
{
"epoch": 2.38,
"learning_rate": 4.329565217391305e-06,
"loss": 0.2773,
"step": 20075
},
{
"epoch": 2.39,
"learning_rate": 4.322318840579711e-06,
"loss": 0.2361,
"step": 20100
},
{
"epoch": 2.39,
"learning_rate": 4.315072463768116e-06,
"loss": 0.2254,
"step": 20125
},
{
"epoch": 2.39,
"learning_rate": 4.307826086956522e-06,
"loss": 0.2396,
"step": 20150
},
{
"epoch": 2.39,
"learning_rate": 4.3005797101449284e-06,
"loss": 0.2621,
"step": 20175
},
{
"epoch": 2.4,
"learning_rate": 4.2933333333333334e-06,
"loss": 0.31,
"step": 20200
},
{
"epoch": 2.4,
"learning_rate": 4.286086956521739e-06,
"loss": 0.3039,
"step": 20225
},
{
"epoch": 2.4,
"learning_rate": 4.278840579710145e-06,
"loss": 0.2772,
"step": 20250
},
{
"epoch": 2.41,
"learning_rate": 4.271594202898551e-06,
"loss": 0.2535,
"step": 20275
},
{
"epoch": 2.41,
"learning_rate": 4.264347826086957e-06,
"loss": 0.2903,
"step": 20300
},
{
"epoch": 2.41,
"learning_rate": 4.257101449275363e-06,
"loss": 0.3347,
"step": 20325
},
{
"epoch": 2.41,
"learning_rate": 4.2498550724637686e-06,
"loss": 0.3133,
"step": 20350
},
{
"epoch": 2.42,
"learning_rate": 4.2426086956521744e-06,
"loss": 0.2631,
"step": 20375
},
{
"epoch": 2.42,
"learning_rate": 4.23536231884058e-06,
"loss": 0.2973,
"step": 20400
},
{
"epoch": 2.42,
"learning_rate": 4.228115942028986e-06,
"loss": 0.2731,
"step": 20425
},
{
"epoch": 2.43,
"learning_rate": 4.220869565217391e-06,
"loss": 0.3088,
"step": 20450
},
{
"epoch": 2.43,
"learning_rate": 4.213623188405798e-06,
"loss": 0.3291,
"step": 20475
},
{
"epoch": 2.43,
"learning_rate": 4.206376811594204e-06,
"loss": 0.2447,
"step": 20500
},
{
"epoch": 2.44,
"learning_rate": 4.199130434782609e-06,
"loss": 0.3862,
"step": 20525
},
{
"epoch": 2.44,
"learning_rate": 4.1918840579710146e-06,
"loss": 0.3494,
"step": 20550
},
{
"epoch": 2.44,
"learning_rate": 4.18463768115942e-06,
"loss": 0.314,
"step": 20575
},
{
"epoch": 2.44,
"learning_rate": 4.177391304347826e-06,
"loss": 0.3158,
"step": 20600
},
{
"epoch": 2.45,
"learning_rate": 4.170144927536232e-06,
"loss": 0.2839,
"step": 20625
},
{
"epoch": 2.45,
"learning_rate": 4.162898550724638e-06,
"loss": 0.2518,
"step": 20650
},
{
"epoch": 2.45,
"learning_rate": 4.155652173913044e-06,
"loss": 0.3692,
"step": 20675
},
{
"epoch": 2.46,
"learning_rate": 4.14840579710145e-06,
"loss": 0.2712,
"step": 20700
},
{
"epoch": 2.46,
"learning_rate": 4.1411594202898555e-06,
"loss": 0.2804,
"step": 20725
},
{
"epoch": 2.46,
"learning_rate": 4.1339130434782605e-06,
"loss": 0.3514,
"step": 20750
},
{
"epoch": 2.47,
"learning_rate": 4.126666666666667e-06,
"loss": 0.2892,
"step": 20775
},
{
"epoch": 2.47,
"learning_rate": 4.119420289855073e-06,
"loss": 0.2898,
"step": 20800
},
{
"epoch": 2.47,
"learning_rate": 4.112173913043478e-06,
"loss": 0.3071,
"step": 20825
},
{
"epoch": 2.47,
"learning_rate": 4.104927536231885e-06,
"loss": 0.2719,
"step": 20850
},
{
"epoch": 2.48,
"learning_rate": 4.097681159420291e-06,
"loss": 0.3628,
"step": 20875
},
{
"epoch": 2.48,
"learning_rate": 4.090434782608696e-06,
"loss": 0.3201,
"step": 20900
},
{
"epoch": 2.48,
"learning_rate": 4.0831884057971015e-06,
"loss": 0.3166,
"step": 20925
},
{
"epoch": 2.49,
"learning_rate": 4.075942028985508e-06,
"loss": 0.3418,
"step": 20950
},
{
"epoch": 2.49,
"learning_rate": 4.068695652173913e-06,
"loss": 0.288,
"step": 20975
},
{
"epoch": 2.49,
"learning_rate": 4.061449275362319e-06,
"loss": 0.2982,
"step": 21000
},
{
"epoch": 2.49,
"eval_cer": 6.842564808893699,
"eval_loss": 0.39293238520622253,
"eval_runtime": 3128.5672,
"eval_samples_per_second": 0.793,
"eval_steps_per_second": 0.397,
"eval_wer": 18.80998665904326,
"step": 21000
},
{
"epoch": 2.49,
"learning_rate": 4.054202898550725e-06,
"loss": 0.2191,
"step": 21025
},
{
"epoch": 2.5,
"learning_rate": 4.046956521739131e-06,
"loss": 0.3047,
"step": 21050
},
{
"epoch": 2.5,
"learning_rate": 4.039710144927537e-06,
"loss": 0.2752,
"step": 21075
},
{
"epoch": 2.5,
"learning_rate": 4.0324637681159425e-06,
"loss": 0.2675,
"step": 21100
},
{
"epoch": 2.51,
"learning_rate": 4.025217391304348e-06,
"loss": 0.2971,
"step": 21125
},
{
"epoch": 2.51,
"learning_rate": 4.017971014492754e-06,
"loss": 0.3199,
"step": 21150
},
{
"epoch": 2.51,
"learning_rate": 4.01072463768116e-06,
"loss": 0.2402,
"step": 21175
},
{
"epoch": 2.52,
"learning_rate": 4.003478260869565e-06,
"loss": 0.2752,
"step": 21200
},
{
"epoch": 2.52,
"learning_rate": 3.996231884057971e-06,
"loss": 0.3148,
"step": 21225
},
{
"epoch": 2.52,
"learning_rate": 3.988985507246378e-06,
"loss": 0.2471,
"step": 21250
},
{
"epoch": 2.52,
"learning_rate": 3.981739130434783e-06,
"loss": 0.2807,
"step": 21275
},
{
"epoch": 2.53,
"learning_rate": 3.9744927536231885e-06,
"loss": 0.2242,
"step": 21300
},
{
"epoch": 2.53,
"learning_rate": 3.967246376811594e-06,
"loss": 0.4252,
"step": 21325
},
{
"epoch": 2.53,
"learning_rate": 3.96e-06,
"loss": 0.2453,
"step": 21350
},
{
"epoch": 2.54,
"learning_rate": 3.952753623188406e-06,
"loss": 0.2282,
"step": 21375
},
{
"epoch": 2.54,
"learning_rate": 3.945507246376812e-06,
"loss": 0.353,
"step": 21400
},
{
"epoch": 2.54,
"learning_rate": 3.938260869565218e-06,
"loss": 0.3021,
"step": 21425
},
{
"epoch": 2.55,
"learning_rate": 3.931014492753624e-06,
"loss": 0.2803,
"step": 21450
},
{
"epoch": 2.55,
"learning_rate": 3.9237681159420295e-06,
"loss": 0.2523,
"step": 21475
},
{
"epoch": 2.55,
"learning_rate": 3.916521739130435e-06,
"loss": 0.2748,
"step": 21500
},
{
"epoch": 2.55,
"learning_rate": 3.90927536231884e-06,
"loss": 0.3106,
"step": 21525
},
{
"epoch": 2.56,
"learning_rate": 3.902028985507247e-06,
"loss": 0.3489,
"step": 21550
},
{
"epoch": 2.56,
"learning_rate": 3.894782608695653e-06,
"loss": 0.3188,
"step": 21575
},
{
"epoch": 2.56,
"learning_rate": 3.887536231884058e-06,
"loss": 0.3188,
"step": 21600
},
{
"epoch": 2.57,
"learning_rate": 3.880289855072465e-06,
"loss": 0.3178,
"step": 21625
},
{
"epoch": 2.57,
"learning_rate": 3.87304347826087e-06,
"loss": 0.2279,
"step": 21650
},
{
"epoch": 2.57,
"learning_rate": 3.8657971014492755e-06,
"loss": 0.2803,
"step": 21675
},
{
"epoch": 2.58,
"learning_rate": 3.858550724637681e-06,
"loss": 0.21,
"step": 21700
},
{
"epoch": 2.58,
"learning_rate": 3.851304347826087e-06,
"loss": 0.2753,
"step": 21725
},
{
"epoch": 2.58,
"learning_rate": 3.844057971014493e-06,
"loss": 0.4256,
"step": 21750
},
{
"epoch": 2.58,
"learning_rate": 3.836811594202899e-06,
"loss": 0.2934,
"step": 21775
},
{
"epoch": 2.59,
"learning_rate": 3.829565217391305e-06,
"loss": 0.3364,
"step": 21800
},
{
"epoch": 2.59,
"learning_rate": 3.822318840579711e-06,
"loss": 0.3053,
"step": 21825
},
{
"epoch": 2.59,
"learning_rate": 3.8150724637681164e-06,
"loss": 0.3143,
"step": 21850
},
{
"epoch": 2.6,
"learning_rate": 3.807826086956522e-06,
"loss": 0.2758,
"step": 21875
},
{
"epoch": 2.6,
"learning_rate": 3.8005797101449277e-06,
"loss": 0.2616,
"step": 21900
},
{
"epoch": 2.6,
"learning_rate": 3.793333333333334e-06,
"loss": 0.2949,
"step": 21925
},
{
"epoch": 2.6,
"learning_rate": 3.7860869565217394e-06,
"loss": 0.358,
"step": 21950
},
{
"epoch": 2.61,
"learning_rate": 3.7788405797101453e-06,
"loss": 0.2856,
"step": 21975
},
{
"epoch": 2.61,
"learning_rate": 3.7715942028985507e-06,
"loss": 0.3642,
"step": 22000
},
{
"epoch": 2.61,
"eval_cer": 6.886713561906636,
"eval_loss": 0.3953614830970764,
"eval_runtime": 3140.8887,
"eval_samples_per_second": 0.79,
"eval_steps_per_second": 0.395,
"eval_wer": 18.69716028206594,
"step": 22000
},
{
"epoch": 2.61,
"learning_rate": 3.764347826086957e-06,
"loss": 0.283,
"step": 22025
},
{
"epoch": 2.62,
"learning_rate": 3.757101449275363e-06,
"loss": 0.3267,
"step": 22050
},
{
"epoch": 2.62,
"learning_rate": 3.7498550724637683e-06,
"loss": 0.3271,
"step": 22075
},
{
"epoch": 2.62,
"learning_rate": 3.742608695652174e-06,
"loss": 0.3372,
"step": 22100
},
{
"epoch": 2.63,
"learning_rate": 3.7353623188405804e-06,
"loss": 0.2551,
"step": 22125
},
{
"epoch": 2.63,
"learning_rate": 3.728115942028986e-06,
"loss": 0.3063,
"step": 22150
},
{
"epoch": 2.63,
"learning_rate": 3.7208695652173917e-06,
"loss": 0.2902,
"step": 22175
},
{
"epoch": 2.63,
"learning_rate": 3.713623188405797e-06,
"loss": 0.255,
"step": 22200
},
{
"epoch": 2.64,
"learning_rate": 3.7063768115942034e-06,
"loss": 0.3041,
"step": 22225
},
{
"epoch": 2.64,
"learning_rate": 3.699130434782609e-06,
"loss": 0.3338,
"step": 22250
},
{
"epoch": 2.64,
"learning_rate": 3.6918840579710147e-06,
"loss": 0.2509,
"step": 22275
},
{
"epoch": 2.65,
"learning_rate": 3.68463768115942e-06,
"loss": 0.2996,
"step": 22300
},
{
"epoch": 2.65,
"learning_rate": 3.6773913043478264e-06,
"loss": 0.3299,
"step": 22325
},
{
"epoch": 2.65,
"learning_rate": 3.6701449275362323e-06,
"loss": 0.234,
"step": 22350
},
{
"epoch": 2.66,
"learning_rate": 3.6628985507246377e-06,
"loss": 0.304,
"step": 22375
},
{
"epoch": 2.66,
"learning_rate": 3.6556521739130435e-06,
"loss": 0.3406,
"step": 22400
},
{
"epoch": 2.66,
"learning_rate": 3.64840579710145e-06,
"loss": 0.2437,
"step": 22425
},
{
"epoch": 2.66,
"learning_rate": 3.6411594202898552e-06,
"loss": 0.4036,
"step": 22450
},
{
"epoch": 2.67,
"learning_rate": 3.633913043478261e-06,
"loss": 0.431,
"step": 22475
},
{
"epoch": 2.67,
"learning_rate": 3.6266666666666674e-06,
"loss": 0.2864,
"step": 22500
},
{
"epoch": 2.67,
"learning_rate": 3.619420289855073e-06,
"loss": 0.2791,
"step": 22525
},
{
"epoch": 2.68,
"learning_rate": 3.6121739130434787e-06,
"loss": 0.2975,
"step": 22550
},
{
"epoch": 2.68,
"learning_rate": 3.604927536231884e-06,
"loss": 0.3252,
"step": 22575
},
{
"epoch": 2.68,
"learning_rate": 3.5976811594202904e-06,
"loss": 0.2389,
"step": 22600
},
{
"epoch": 2.68,
"learning_rate": 3.5904347826086962e-06,
"loss": 0.3063,
"step": 22625
},
{
"epoch": 2.69,
"learning_rate": 3.5831884057971017e-06,
"loss": 0.2614,
"step": 22650
},
{
"epoch": 2.69,
"learning_rate": 3.5759420289855075e-06,
"loss": 0.2833,
"step": 22675
},
{
"epoch": 2.69,
"learning_rate": 3.5686956521739134e-06,
"loss": 0.3931,
"step": 22700
},
{
"epoch": 2.7,
"learning_rate": 3.5614492753623192e-06,
"loss": 0.2804,
"step": 22725
},
{
"epoch": 2.7,
"learning_rate": 3.554202898550725e-06,
"loss": 0.2688,
"step": 22750
},
{
"epoch": 2.7,
"learning_rate": 3.5469565217391305e-06,
"loss": 0.2059,
"step": 22775
},
{
"epoch": 2.71,
"learning_rate": 3.5397101449275368e-06,
"loss": 0.3133,
"step": 22800
},
{
"epoch": 2.71,
"learning_rate": 3.5324637681159422e-06,
"loss": 0.2725,
"step": 22825
},
{
"epoch": 2.71,
"learning_rate": 3.525217391304348e-06,
"loss": 0.2712,
"step": 22850
},
{
"epoch": 2.71,
"learning_rate": 3.5179710144927535e-06,
"loss": 0.264,
"step": 22875
},
{
"epoch": 2.72,
"learning_rate": 3.5107246376811598e-06,
"loss": 0.2404,
"step": 22900
},
{
"epoch": 2.72,
"learning_rate": 3.5034782608695656e-06,
"loss": 0.3211,
"step": 22925
},
{
"epoch": 2.72,
"learning_rate": 3.496231884057971e-06,
"loss": 0.2726,
"step": 22950
},
{
"epoch": 2.73,
"learning_rate": 3.488985507246377e-06,
"loss": 0.399,
"step": 22975
},
{
"epoch": 2.73,
"learning_rate": 3.481739130434783e-06,
"loss": 0.2297,
"step": 23000
},
{
"epoch": 2.73,
"eval_cer": 6.938363913620936,
"eval_loss": 0.3916235566139221,
"eval_runtime": 3180.568,
"eval_samples_per_second": 0.78,
"eval_steps_per_second": 0.39,
"eval_wer": 18.73299028016009,
"step": 23000
},
{
"epoch": 2.73,
"learning_rate": 3.4744927536231886e-06,
"loss": 0.3484,
"step": 23025
},
{
"epoch": 2.74,
"learning_rate": 3.4672463768115945e-06,
"loss": 0.2585,
"step": 23050
},
{
"epoch": 2.74,
"learning_rate": 3.46e-06,
"loss": 0.2843,
"step": 23075
},
{
"epoch": 2.74,
"learning_rate": 3.452753623188406e-06,
"loss": 0.3526,
"step": 23100
},
{
"epoch": 2.74,
"learning_rate": 3.445507246376812e-06,
"loss": 0.3063,
"step": 23125
},
{
"epoch": 2.75,
"learning_rate": 3.4382608695652175e-06,
"loss": 0.3701,
"step": 23150
},
{
"epoch": 2.75,
"learning_rate": 3.4310144927536233e-06,
"loss": 0.2438,
"step": 23175
},
{
"epoch": 2.75,
"learning_rate": 3.4237681159420296e-06,
"loss": 0.3001,
"step": 23200
},
{
"epoch": 2.76,
"learning_rate": 3.416521739130435e-06,
"loss": 0.3103,
"step": 23225
},
{
"epoch": 2.76,
"learning_rate": 3.409275362318841e-06,
"loss": 0.2769,
"step": 23250
},
{
"epoch": 2.76,
"learning_rate": 3.4020289855072467e-06,
"loss": 0.4483,
"step": 23275
},
{
"epoch": 2.76,
"learning_rate": 3.3947826086956526e-06,
"loss": 0.2777,
"step": 23300
},
{
"epoch": 2.77,
"learning_rate": 3.387536231884058e-06,
"loss": 0.2413,
"step": 23325
},
{
"epoch": 2.77,
"learning_rate": 3.380289855072464e-06,
"loss": 0.2911,
"step": 23350
},
{
"epoch": 2.77,
"learning_rate": 3.37304347826087e-06,
"loss": 0.3544,
"step": 23375
},
{
"epoch": 2.78,
"learning_rate": 3.3657971014492756e-06,
"loss": 0.349,
"step": 23400
},
{
"epoch": 2.78,
"learning_rate": 3.3585507246376814e-06,
"loss": 0.3243,
"step": 23425
},
{
"epoch": 2.78,
"learning_rate": 3.351304347826087e-06,
"loss": 0.2601,
"step": 23450
},
{
"epoch": 2.79,
"learning_rate": 3.344057971014493e-06,
"loss": 0.268,
"step": 23475
},
{
"epoch": 2.79,
"learning_rate": 3.336811594202899e-06,
"loss": 0.294,
"step": 23500
},
{
"epoch": 2.79,
"learning_rate": 3.3295652173913044e-06,
"loss": 0.3095,
"step": 23525
},
{
"epoch": 2.79,
"learning_rate": 3.3223188405797103e-06,
"loss": 0.2588,
"step": 23550
},
{
"epoch": 2.8,
"learning_rate": 3.3150724637681166e-06,
"loss": 0.4027,
"step": 23575
},
{
"epoch": 2.8,
"learning_rate": 3.307826086956522e-06,
"loss": 0.2887,
"step": 23600
},
{
"epoch": 2.8,
"learning_rate": 3.300579710144928e-06,
"loss": 0.2459,
"step": 23625
},
{
"epoch": 2.81,
"learning_rate": 3.2933333333333333e-06,
"loss": 0.2288,
"step": 23650
},
{
"epoch": 2.81,
"learning_rate": 3.2860869565217396e-06,
"loss": 0.2998,
"step": 23675
},
{
"epoch": 2.81,
"learning_rate": 3.2788405797101454e-06,
"loss": 0.3197,
"step": 23700
},
{
"epoch": 2.82,
"learning_rate": 3.271594202898551e-06,
"loss": 0.2931,
"step": 23725
},
{
"epoch": 2.82,
"learning_rate": 3.2643478260869567e-06,
"loss": 0.2451,
"step": 23750
},
{
"epoch": 2.82,
"learning_rate": 3.2571014492753626e-06,
"loss": 0.251,
"step": 23775
},
{
"epoch": 2.82,
"learning_rate": 3.2498550724637684e-06,
"loss": 0.291,
"step": 23800
},
{
"epoch": 2.83,
"learning_rate": 3.2426086956521743e-06,
"loss": 0.2916,
"step": 23825
},
{
"epoch": 2.83,
"learning_rate": 3.2353623188405797e-06,
"loss": 0.3365,
"step": 23850
},
{
"epoch": 2.83,
"learning_rate": 3.228115942028986e-06,
"loss": 0.2967,
"step": 23875
},
{
"epoch": 2.84,
"learning_rate": 3.2208695652173914e-06,
"loss": 0.2435,
"step": 23900
},
{
"epoch": 2.84,
"learning_rate": 3.2136231884057973e-06,
"loss": 0.3885,
"step": 23925
},
{
"epoch": 2.84,
"learning_rate": 3.2063768115942027e-06,
"loss": 0.2373,
"step": 23950
},
{
"epoch": 2.85,
"learning_rate": 3.199130434782609e-06,
"loss": 0.3457,
"step": 23975
},
{
"epoch": 2.85,
"learning_rate": 3.191884057971015e-06,
"loss": 0.2313,
"step": 24000
},
{
"epoch": 2.85,
"eval_cer": 6.778493777362389,
"eval_loss": 0.3930225968360901,
"eval_runtime": 3191.3103,
"eval_samples_per_second": 0.778,
"eval_steps_per_second": 0.389,
"eval_wer": 18.60339241471317,
"step": 24000
},
{
"epoch": 2.85,
"learning_rate": 3.1846376811594202e-06,
"loss": 0.2984,
"step": 24025
},
{
"epoch": 2.85,
"learning_rate": 3.1773913043478265e-06,
"loss": 0.2425,
"step": 24050
},
{
"epoch": 2.86,
"learning_rate": 3.1701449275362324e-06,
"loss": 0.3009,
"step": 24075
},
{
"epoch": 2.86,
"learning_rate": 3.162898550724638e-06,
"loss": 0.251,
"step": 24100
},
{
"epoch": 2.86,
"learning_rate": 3.1556521739130437e-06,
"loss": 0.2794,
"step": 24125
},
{
"epoch": 2.87,
"learning_rate": 3.14840579710145e-06,
"loss": 0.326,
"step": 24150
},
{
"epoch": 2.87,
"learning_rate": 3.1414492753623194e-06,
"loss": 0.2487,
"step": 24175
},
{
"epoch": 2.87,
"learning_rate": 3.134202898550725e-06,
"loss": 0.2793,
"step": 24200
},
{
"epoch": 2.87,
"learning_rate": 3.1269565217391307e-06,
"loss": 0.3093,
"step": 24225
},
{
"epoch": 2.88,
"learning_rate": 3.119710144927536e-06,
"loss": 0.2536,
"step": 24250
},
{
"epoch": 2.88,
"learning_rate": 3.1124637681159424e-06,
"loss": 0.3143,
"step": 24275
},
{
"epoch": 2.88,
"learning_rate": 3.1052173913043483e-06,
"loss": 0.2409,
"step": 24300
},
{
"epoch": 2.89,
"learning_rate": 3.0979710144927537e-06,
"loss": 0.3879,
"step": 24325
},
{
"epoch": 2.89,
"learning_rate": 3.0907246376811596e-06,
"loss": 0.3521,
"step": 24350
},
{
"epoch": 2.89,
"learning_rate": 3.083478260869566e-06,
"loss": 0.2628,
"step": 24375
},
{
"epoch": 2.9,
"learning_rate": 3.0762318840579713e-06,
"loss": 0.2127,
"step": 24400
},
{
"epoch": 2.9,
"learning_rate": 3.068985507246377e-06,
"loss": 0.3071,
"step": 24425
},
{
"epoch": 2.9,
"learning_rate": 3.0617391304347826e-06,
"loss": 0.2488,
"step": 24450
},
{
"epoch": 2.9,
"learning_rate": 3.054492753623189e-06,
"loss": 0.2462,
"step": 24475
},
{
"epoch": 2.91,
"learning_rate": 3.0472463768115947e-06,
"loss": 0.2651,
"step": 24500
},
{
"epoch": 2.91,
"learning_rate": 3.04e-06,
"loss": 0.2555,
"step": 24525
},
{
"epoch": 2.91,
"learning_rate": 3.032753623188406e-06,
"loss": 0.2511,
"step": 24550
},
{
"epoch": 2.92,
"learning_rate": 3.025507246376812e-06,
"loss": 0.2761,
"step": 24575
},
{
"epoch": 2.92,
"learning_rate": 3.0182608695652177e-06,
"loss": 0.3315,
"step": 24600
},
{
"epoch": 2.92,
"learning_rate": 3.0110144927536235e-06,
"loss": 0.4222,
"step": 24625
},
{
"epoch": 2.93,
"learning_rate": 3.003768115942029e-06,
"loss": 0.252,
"step": 24650
},
{
"epoch": 2.93,
"learning_rate": 2.9965217391304352e-06,
"loss": 0.3424,
"step": 24675
},
{
"epoch": 2.93,
"learning_rate": 2.9892753623188407e-06,
"loss": 0.3086,
"step": 24700
},
{
"epoch": 2.93,
"learning_rate": 2.9820289855072465e-06,
"loss": 0.3246,
"step": 24725
},
{
"epoch": 2.94,
"learning_rate": 2.974782608695652e-06,
"loss": 0.4331,
"step": 24750
},
{
"epoch": 2.94,
"learning_rate": 2.9675362318840582e-06,
"loss": 0.2933,
"step": 24775
},
{
"epoch": 2.94,
"learning_rate": 2.960289855072464e-06,
"loss": 0.3234,
"step": 24800
},
{
"epoch": 2.95,
"learning_rate": 2.9530434782608695e-06,
"loss": 0.2495,
"step": 24825
},
{
"epoch": 2.95,
"learning_rate": 2.9457971014492754e-06,
"loss": 0.2506,
"step": 24850
},
{
"epoch": 2.95,
"learning_rate": 2.9385507246376817e-06,
"loss": 0.2862,
"step": 24875
},
{
"epoch": 2.95,
"learning_rate": 2.931304347826087e-06,
"loss": 0.2804,
"step": 24900
},
{
"epoch": 2.96,
"learning_rate": 2.924057971014493e-06,
"loss": 0.2659,
"step": 24925
},
{
"epoch": 2.96,
"learning_rate": 2.9168115942028992e-06,
"loss": 0.2801,
"step": 24950
},
{
"epoch": 2.96,
"learning_rate": 2.9095652173913046e-06,
"loss": 0.3455,
"step": 24975
},
{
"epoch": 2.97,
"learning_rate": 2.902608695652174e-06,
"loss": 0.2833,
"step": 25000
},
{
"epoch": 2.97,
"eval_cer": 6.855231442766491,
"eval_loss": 0.39096301794052124,
"eval_runtime": 3187.6224,
"eval_samples_per_second": 0.779,
"eval_steps_per_second": 0.389,
"eval_wer": 18.598056032018295,
"step": 25000
},
{
"epoch": 2.97,
"learning_rate": 2.89536231884058e-06,
"loss": 0.2299,
"step": 25025
},
{
"epoch": 2.97,
"learning_rate": 2.8881159420289854e-06,
"loss": 0.2482,
"step": 25050
},
{
"epoch": 2.98,
"learning_rate": 2.8808695652173917e-06,
"loss": 0.3388,
"step": 25075
},
{
"epoch": 2.98,
"learning_rate": 2.8736231884057975e-06,
"loss": 0.4429,
"step": 25100
},
{
"epoch": 2.98,
"learning_rate": 2.866376811594203e-06,
"loss": 0.2245,
"step": 25125
},
{
"epoch": 2.98,
"learning_rate": 2.859130434782609e-06,
"loss": 0.2648,
"step": 25150
},
{
"epoch": 2.99,
"learning_rate": 2.851884057971015e-06,
"loss": 0.1995,
"step": 25175
},
{
"epoch": 2.99,
"learning_rate": 2.8446376811594205e-06,
"loss": 0.2652,
"step": 25200
},
{
"epoch": 2.99,
"learning_rate": 2.8373913043478264e-06,
"loss": 0.2587,
"step": 25225
},
{
"epoch": 3.0,
"learning_rate": 2.830144927536232e-06,
"loss": 0.2889,
"step": 25250
},
{
"epoch": 3.0,
"learning_rate": 2.822898550724638e-06,
"loss": 0.2257,
"step": 25275
},
{
"epoch": 3.0,
"learning_rate": 2.815652173913044e-06,
"loss": 0.1742,
"step": 25300
},
{
"epoch": 3.01,
"learning_rate": 2.8084057971014494e-06,
"loss": 0.1856,
"step": 25325
},
{
"epoch": 3.01,
"learning_rate": 2.8011594202898552e-06,
"loss": 0.1801,
"step": 25350
},
{
"epoch": 3.01,
"learning_rate": 2.7939130434782615e-06,
"loss": 0.2185,
"step": 25375
},
{
"epoch": 3.01,
"learning_rate": 2.786666666666667e-06,
"loss": 0.2565,
"step": 25400
},
{
"epoch": 3.02,
"learning_rate": 2.779420289855073e-06,
"loss": 0.2026,
"step": 25425
},
{
"epoch": 3.02,
"learning_rate": 2.7721739130434782e-06,
"loss": 0.2373,
"step": 25450
},
{
"epoch": 3.02,
"learning_rate": 2.7649275362318845e-06,
"loss": 0.2406,
"step": 25475
},
{
"epoch": 3.03,
"learning_rate": 2.75768115942029e-06,
"loss": 0.4514,
"step": 25500
},
{
"epoch": 3.03,
"learning_rate": 2.750434782608696e-06,
"loss": 0.1876,
"step": 25525
},
{
"epoch": 3.03,
"learning_rate": 2.7431884057971012e-06,
"loss": 0.2703,
"step": 25550
},
{
"epoch": 3.03,
"learning_rate": 2.7359420289855075e-06,
"loss": 0.1749,
"step": 25575
},
{
"epoch": 3.04,
"learning_rate": 2.7286956521739134e-06,
"loss": 0.2088,
"step": 25600
},
{
"epoch": 3.04,
"learning_rate": 2.721449275362319e-06,
"loss": 0.2087,
"step": 25625
},
{
"epoch": 3.04,
"learning_rate": 2.7142028985507246e-06,
"loss": 0.3172,
"step": 25650
},
{
"epoch": 3.05,
"learning_rate": 2.706956521739131e-06,
"loss": 0.1898,
"step": 25675
},
{
"epoch": 3.05,
"learning_rate": 2.6997101449275364e-06,
"loss": 0.1685,
"step": 25700
},
{
"epoch": 3.05,
"learning_rate": 2.692463768115942e-06,
"loss": 0.1918,
"step": 25725
},
{
"epoch": 3.06,
"learning_rate": 2.6852173913043476e-06,
"loss": 0.2734,
"step": 25750
},
{
"epoch": 3.06,
"learning_rate": 2.677971014492754e-06,
"loss": 0.1485,
"step": 25775
},
{
"epoch": 3.06,
"learning_rate": 2.6707246376811598e-06,
"loss": 0.1542,
"step": 25800
},
{
"epoch": 3.06,
"learning_rate": 2.663478260869565e-06,
"loss": 0.1694,
"step": 25825
},
{
"epoch": 3.07,
"learning_rate": 2.6562318840579715e-06,
"loss": 0.1685,
"step": 25850
},
{
"epoch": 3.07,
"learning_rate": 2.6489855072463773e-06,
"loss": 0.1719,
"step": 25875
},
{
"epoch": 3.07,
"learning_rate": 2.6417391304347828e-06,
"loss": 0.1573,
"step": 25900
},
{
"epoch": 3.08,
"learning_rate": 2.6344927536231886e-06,
"loss": 0.2429,
"step": 25925
},
{
"epoch": 3.08,
"learning_rate": 2.6272463768115945e-06,
"loss": 0.1751,
"step": 25950
},
{
"epoch": 3.08,
"learning_rate": 2.6202898550724644e-06,
"loss": 0.2976,
"step": 25975
},
{
"epoch": 3.09,
"learning_rate": 2.61304347826087e-06,
"loss": 0.2509,
"step": 26000
},
{
"epoch": 3.09,
"eval_cer": 6.816493678980766,
"eval_loss": 0.3948805630207062,
"eval_runtime": 3174.2689,
"eval_samples_per_second": 0.782,
"eval_steps_per_second": 0.391,
"eval_wer": 18.518010291595196,
"step": 26000
},
{
"epoch": 3.09,
"learning_rate": 2.6057971014492757e-06,
"loss": 0.377,
"step": 26025
},
{
"epoch": 3.09,
"learning_rate": 2.598550724637681e-06,
"loss": 0.1902,
"step": 26050
},
{
"epoch": 3.09,
"learning_rate": 2.5913043478260874e-06,
"loss": 0.2086,
"step": 26075
},
{
"epoch": 3.1,
"learning_rate": 2.5840579710144932e-06,
"loss": 0.269,
"step": 26100
},
{
"epoch": 3.1,
"learning_rate": 2.5768115942028987e-06,
"loss": 0.2287,
"step": 26125
},
{
"epoch": 3.1,
"learning_rate": 2.5695652173913045e-06,
"loss": 0.2673,
"step": 26150
},
{
"epoch": 3.11,
"learning_rate": 2.562318840579711e-06,
"loss": 0.1238,
"step": 26175
},
{
"epoch": 3.11,
"learning_rate": 2.5550724637681162e-06,
"loss": 0.2047,
"step": 26200
},
{
"epoch": 3.11,
"learning_rate": 2.547826086956522e-06,
"loss": 0.3,
"step": 26225
},
{
"epoch": 3.11,
"learning_rate": 2.5405797101449275e-06,
"loss": 0.201,
"step": 26250
},
{
"epoch": 3.12,
"learning_rate": 2.5333333333333338e-06,
"loss": 0.1864,
"step": 26275
},
{
"epoch": 3.12,
"learning_rate": 2.5260869565217392e-06,
"loss": 0.2565,
"step": 26300
},
{
"epoch": 3.12,
"learning_rate": 2.518840579710145e-06,
"loss": 0.189,
"step": 26325
},
{
"epoch": 3.13,
"learning_rate": 2.511594202898551e-06,
"loss": 0.2006,
"step": 26350
},
{
"epoch": 3.13,
"learning_rate": 2.5043478260869568e-06,
"loss": 0.1992,
"step": 26375
},
{
"epoch": 3.13,
"learning_rate": 2.4971014492753626e-06,
"loss": 0.1742,
"step": 26400
},
{
"epoch": 3.14,
"learning_rate": 2.489855072463768e-06,
"loss": 0.1909,
"step": 26425
},
{
"epoch": 3.14,
"learning_rate": 2.4826086956521743e-06,
"loss": 0.1935,
"step": 26450
},
{
"epoch": 3.14,
"learning_rate": 2.4753623188405798e-06,
"loss": 0.2335,
"step": 26475
},
{
"epoch": 3.14,
"learning_rate": 2.4681159420289856e-06,
"loss": 0.2635,
"step": 26500
},
{
"epoch": 3.15,
"learning_rate": 2.4608695652173915e-06,
"loss": 0.2079,
"step": 26525
},
{
"epoch": 3.15,
"learning_rate": 2.4536231884057973e-06,
"loss": 0.2006,
"step": 26550
},
{
"epoch": 3.15,
"learning_rate": 2.446376811594203e-06,
"loss": 0.244,
"step": 26575
},
{
"epoch": 3.16,
"learning_rate": 2.439130434782609e-06,
"loss": 0.32,
"step": 26600
},
{
"epoch": 3.16,
"learning_rate": 2.4318840579710145e-06,
"loss": 0.1757,
"step": 26625
},
{
"epoch": 3.16,
"learning_rate": 2.4246376811594203e-06,
"loss": 0.151,
"step": 26650
},
{
"epoch": 3.17,
"learning_rate": 2.417391304347826e-06,
"loss": 0.1985,
"step": 26675
},
{
"epoch": 3.17,
"learning_rate": 2.410144927536232e-06,
"loss": 0.2241,
"step": 26700
},
{
"epoch": 3.17,
"learning_rate": 2.402898550724638e-06,
"loss": 0.1411,
"step": 26725
},
{
"epoch": 3.17,
"learning_rate": 2.3956521739130437e-06,
"loss": 0.2348,
"step": 26750
},
{
"epoch": 3.18,
"learning_rate": 2.3884057971014496e-06,
"loss": 0.2529,
"step": 26775
},
{
"epoch": 3.18,
"learning_rate": 2.3811594202898555e-06,
"loss": 0.1819,
"step": 26800
},
{
"epoch": 3.18,
"learning_rate": 2.3739130434782613e-06,
"loss": 0.2473,
"step": 26825
},
{
"epoch": 3.19,
"learning_rate": 2.3666666666666667e-06,
"loss": 0.2902,
"step": 26850
},
{
"epoch": 3.19,
"learning_rate": 2.3594202898550726e-06,
"loss": 0.1368,
"step": 26875
},
{
"epoch": 3.19,
"learning_rate": 2.3521739130434784e-06,
"loss": 0.2857,
"step": 26900
},
{
"epoch": 3.2,
"learning_rate": 2.3449275362318843e-06,
"loss": 0.1613,
"step": 26925
},
{
"epoch": 3.2,
"learning_rate": 2.33768115942029e-06,
"loss": 0.2573,
"step": 26950
},
{
"epoch": 3.2,
"learning_rate": 2.330434782608696e-06,
"loss": 0.2029,
"step": 26975
},
{
"epoch": 3.2,
"learning_rate": 2.3231884057971014e-06,
"loss": 0.2085,
"step": 27000
},
{
"epoch": 3.2,
"eval_cer": 6.811328643809336,
"eval_loss": 0.3984606862068176,
"eval_runtime": 3176.0872,
"eval_samples_per_second": 0.781,
"eval_steps_per_second": 0.391,
"eval_wer": 18.613302839717935,
"step": 27000
},
{
"epoch": 3.21,
"learning_rate": 2.3159420289855077e-06,
"loss": 0.235,
"step": 27025
},
{
"epoch": 3.21,
"learning_rate": 2.308695652173913e-06,
"loss": 0.1992,
"step": 27050
},
{
"epoch": 3.21,
"learning_rate": 2.301449275362319e-06,
"loss": 0.2457,
"step": 27075
},
{
"epoch": 3.22,
"learning_rate": 2.294202898550725e-06,
"loss": 0.1871,
"step": 27100
},
{
"epoch": 3.22,
"learning_rate": 2.2869565217391307e-06,
"loss": 0.1464,
"step": 27125
},
{
"epoch": 3.22,
"learning_rate": 2.279710144927536e-06,
"loss": 0.2012,
"step": 27150
},
{
"epoch": 3.22,
"learning_rate": 2.2724637681159424e-06,
"loss": 0.1757,
"step": 27175
},
{
"epoch": 3.23,
"learning_rate": 2.265217391304348e-06,
"loss": 0.1795,
"step": 27200
},
{
"epoch": 3.23,
"learning_rate": 2.2579710144927537e-06,
"loss": 0.1706,
"step": 27225
},
{
"epoch": 3.23,
"learning_rate": 2.2507246376811596e-06,
"loss": 0.2044,
"step": 27250
},
{
"epoch": 3.24,
"learning_rate": 2.2434782608695654e-06,
"loss": 0.2155,
"step": 27275
},
{
"epoch": 3.24,
"learning_rate": 2.2362318840579713e-06,
"loss": 0.1811,
"step": 27300
},
{
"epoch": 3.24,
"learning_rate": 2.228985507246377e-06,
"loss": 0.2311,
"step": 27325
},
{
"epoch": 3.25,
"learning_rate": 2.2217391304347825e-06,
"loss": 0.3311,
"step": 27350
},
{
"epoch": 3.25,
"learning_rate": 2.2144927536231884e-06,
"loss": 0.1692,
"step": 27375
},
{
"epoch": 3.25,
"learning_rate": 2.2072463768115943e-06,
"loss": 0.2069,
"step": 27400
},
{
"epoch": 3.25,
"learning_rate": 2.2e-06,
"loss": 0.1755,
"step": 27425
},
{
"epoch": 3.26,
"learning_rate": 2.192753623188406e-06,
"loss": 0.2029,
"step": 27450
},
{
"epoch": 3.26,
"learning_rate": 2.185507246376812e-06,
"loss": 0.2542,
"step": 27475
},
{
"epoch": 3.26,
"learning_rate": 2.1782608695652177e-06,
"loss": 0.1882,
"step": 27500
},
{
"epoch": 3.27,
"learning_rate": 2.1710144927536235e-06,
"loss": 0.2374,
"step": 27525
},
{
"epoch": 3.27,
"learning_rate": 2.1637681159420294e-06,
"loss": 0.1967,
"step": 27550
},
{
"epoch": 3.27,
"learning_rate": 2.156521739130435e-06,
"loss": 0.1869,
"step": 27575
},
{
"epoch": 3.28,
"learning_rate": 2.1492753623188407e-06,
"loss": 0.2861,
"step": 27600
},
{
"epoch": 3.28,
"learning_rate": 2.1420289855072465e-06,
"loss": 0.2392,
"step": 27625
},
{
"epoch": 3.28,
"learning_rate": 2.1347826086956524e-06,
"loss": 0.18,
"step": 27650
},
{
"epoch": 3.28,
"learning_rate": 2.1275362318840582e-06,
"loss": 0.2496,
"step": 27675
},
{
"epoch": 3.29,
"learning_rate": 2.120289855072464e-06,
"loss": 0.1998,
"step": 27700
},
{
"epoch": 3.29,
"learning_rate": 2.1130434782608695e-06,
"loss": 0.259,
"step": 27725
},
{
"epoch": 3.29,
"learning_rate": 2.105797101449276e-06,
"loss": 0.3129,
"step": 27750
},
{
"epoch": 3.3,
"learning_rate": 2.0985507246376812e-06,
"loss": 0.1907,
"step": 27775
},
{
"epoch": 3.3,
"learning_rate": 2.091304347826087e-06,
"loss": 0.1343,
"step": 27800
},
{
"epoch": 3.3,
"learning_rate": 2.084057971014493e-06,
"loss": 0.1973,
"step": 27825
},
{
"epoch": 3.3,
"learning_rate": 2.0768115942028988e-06,
"loss": 0.1658,
"step": 27850
},
{
"epoch": 3.31,
"learning_rate": 2.0695652173913046e-06,
"loss": 0.1508,
"step": 27875
},
{
"epoch": 3.31,
"learning_rate": 2.0623188405797105e-06,
"loss": 0.1947,
"step": 27900
},
{
"epoch": 3.31,
"learning_rate": 2.055072463768116e-06,
"loss": 0.1812,
"step": 27925
},
{
"epoch": 3.32,
"learning_rate": 2.0478260869565218e-06,
"loss": 0.2154,
"step": 27950
},
{
"epoch": 3.32,
"learning_rate": 2.0405797101449276e-06,
"loss": 0.1456,
"step": 27975
},
{
"epoch": 3.32,
"learning_rate": 2.0333333333333335e-06,
"loss": 0.2055,
"step": 28000
},
{
"epoch": 3.32,
"eval_cer": 6.862364110384181,
"eval_loss": 0.39950060844421387,
"eval_runtime": 3191.9428,
"eval_samples_per_second": 0.778,
"eval_steps_per_second": 0.389,
"eval_wer": 18.76119687440442,
"step": 28000
},
{
"epoch": 3.33,
"learning_rate": 2.0260869565217393e-06,
"loss": 0.1855,
"step": 28025
},
{
"epoch": 3.33,
"learning_rate": 2.018840579710145e-06,
"loss": 0.2535,
"step": 28050
},
{
"epoch": 3.33,
"learning_rate": 2.0115942028985506e-06,
"loss": 0.2101,
"step": 28075
},
{
"epoch": 3.33,
"learning_rate": 2.004347826086957e-06,
"loss": 0.2977,
"step": 28100
},
{
"epoch": 3.34,
"learning_rate": 1.9971014492753623e-06,
"loss": 0.1915,
"step": 28125
},
{
"epoch": 3.34,
"learning_rate": 1.989855072463768e-06,
"loss": 0.1589,
"step": 28150
},
{
"epoch": 3.34,
"learning_rate": 1.982608695652174e-06,
"loss": 0.175,
"step": 28175
},
{
"epoch": 3.35,
"learning_rate": 1.97536231884058e-06,
"loss": 0.2892,
"step": 28200
},
{
"epoch": 3.35,
"learning_rate": 1.9681159420289853e-06,
"loss": 0.223,
"step": 28225
},
{
"epoch": 3.35,
"learning_rate": 1.9608695652173916e-06,
"loss": 0.1731,
"step": 28250
},
{
"epoch": 3.36,
"learning_rate": 1.9536231884057975e-06,
"loss": 0.2097,
"step": 28275
},
{
"epoch": 3.36,
"learning_rate": 1.946376811594203e-06,
"loss": 0.1909,
"step": 28300
},
{
"epoch": 3.36,
"learning_rate": 1.939130434782609e-06,
"loss": 0.2079,
"step": 28325
},
{
"epoch": 3.36,
"learning_rate": 1.9318840579710146e-06,
"loss": 0.1848,
"step": 28350
},
{
"epoch": 3.37,
"learning_rate": 1.9246376811594205e-06,
"loss": 0.1813,
"step": 28375
},
{
"epoch": 3.37,
"learning_rate": 1.9173913043478263e-06,
"loss": 0.1679,
"step": 28400
},
{
"epoch": 3.37,
"learning_rate": 1.910144927536232e-06,
"loss": 0.1787,
"step": 28425
},
{
"epoch": 3.38,
"learning_rate": 1.9028985507246378e-06,
"loss": 0.1718,
"step": 28450
},
{
"epoch": 3.38,
"learning_rate": 1.8956521739130437e-06,
"loss": 0.2553,
"step": 28475
},
{
"epoch": 3.38,
"learning_rate": 1.8884057971014493e-06,
"loss": 0.2249,
"step": 28500
},
{
"epoch": 3.38,
"learning_rate": 1.8811594202898554e-06,
"loss": 0.1657,
"step": 28525
},
{
"epoch": 3.39,
"learning_rate": 1.873913043478261e-06,
"loss": 0.1738,
"step": 28550
},
{
"epoch": 3.39,
"learning_rate": 1.8666666666666669e-06,
"loss": 0.1935,
"step": 28575
},
{
"epoch": 3.39,
"learning_rate": 1.8594202898550725e-06,
"loss": 0.2179,
"step": 28600
},
{
"epoch": 3.4,
"learning_rate": 1.8521739130434786e-06,
"loss": 0.2696,
"step": 28625
},
{
"epoch": 3.4,
"learning_rate": 1.8449275362318842e-06,
"loss": 0.1657,
"step": 28650
},
{
"epoch": 3.4,
"learning_rate": 1.83768115942029e-06,
"loss": 0.2302,
"step": 28675
},
{
"epoch": 3.41,
"learning_rate": 1.8304347826086957e-06,
"loss": 0.2888,
"step": 28700
},
{
"epoch": 3.41,
"learning_rate": 1.8231884057971016e-06,
"loss": 0.193,
"step": 28725
},
{
"epoch": 3.41,
"learning_rate": 1.8159420289855072e-06,
"loss": 0.2122,
"step": 28750
},
{
"epoch": 3.41,
"learning_rate": 1.8086956521739133e-06,
"loss": 0.1602,
"step": 28775
},
{
"epoch": 3.42,
"learning_rate": 1.801449275362319e-06,
"loss": 0.2419,
"step": 28800
},
{
"epoch": 3.42,
"learning_rate": 1.7942028985507248e-06,
"loss": 0.4138,
"step": 28825
},
{
"epoch": 3.42,
"learning_rate": 1.7869565217391304e-06,
"loss": 0.2473,
"step": 28850
},
{
"epoch": 3.43,
"learning_rate": 1.7797101449275365e-06,
"loss": 0.1792,
"step": 28875
},
{
"epoch": 3.43,
"learning_rate": 1.7724637681159421e-06,
"loss": 0.1822,
"step": 28900
},
{
"epoch": 3.43,
"learning_rate": 1.765217391304348e-06,
"loss": 0.1505,
"step": 28925
},
{
"epoch": 3.44,
"learning_rate": 1.7579710144927536e-06,
"loss": 0.1418,
"step": 28950
},
{
"epoch": 3.44,
"learning_rate": 1.7507246376811595e-06,
"loss": 0.1262,
"step": 28975
},
{
"epoch": 3.44,
"learning_rate": 1.7434782608695653e-06,
"loss": 0.175,
"step": 29000
},
{
"epoch": 3.44,
"eval_cer": 6.772713857051503,
"eval_loss": 0.40093937516212463,
"eval_runtime": 3157.1944,
"eval_samples_per_second": 0.786,
"eval_steps_per_second": 0.393,
"eval_wer": 18.48141795311607,
"step": 29000
},
{
"epoch": 3.44,
"learning_rate": 1.7362318840579712e-06,
"loss": 0.2065,
"step": 29025
},
{
"epoch": 3.45,
"learning_rate": 1.7289855072463768e-06,
"loss": 0.1723,
"step": 29050
},
{
"epoch": 3.45,
"learning_rate": 1.7217391304347827e-06,
"loss": 0.1419,
"step": 29075
},
{
"epoch": 3.45,
"learning_rate": 1.7144927536231887e-06,
"loss": 0.2607,
"step": 29100
},
{
"epoch": 3.46,
"learning_rate": 1.7072463768115944e-06,
"loss": 0.1884,
"step": 29125
},
{
"epoch": 3.46,
"learning_rate": 1.7000000000000002e-06,
"loss": 0.1824,
"step": 29150
},
{
"epoch": 3.46,
"learning_rate": 1.6927536231884059e-06,
"loss": 0.1657,
"step": 29175
},
{
"epoch": 3.47,
"learning_rate": 1.685507246376812e-06,
"loss": 0.248,
"step": 29200
},
{
"epoch": 3.47,
"learning_rate": 1.6782608695652176e-06,
"loss": 0.2124,
"step": 29225
},
{
"epoch": 3.47,
"learning_rate": 1.6710144927536234e-06,
"loss": 0.1964,
"step": 29250
},
{
"epoch": 3.47,
"learning_rate": 1.663768115942029e-06,
"loss": 0.3202,
"step": 29275
},
{
"epoch": 3.48,
"learning_rate": 1.656521739130435e-06,
"loss": 0.194,
"step": 29300
},
{
"epoch": 3.48,
"learning_rate": 1.6492753623188406e-06,
"loss": 0.2738,
"step": 29325
},
{
"epoch": 3.48,
"learning_rate": 1.6420289855072467e-06,
"loss": 0.1667,
"step": 29350
},
{
"epoch": 3.49,
"learning_rate": 1.6347826086956523e-06,
"loss": 0.2819,
"step": 29375
},
{
"epoch": 3.49,
"learning_rate": 1.6275362318840581e-06,
"loss": 0.1894,
"step": 29400
},
{
"epoch": 3.49,
"learning_rate": 1.6202898550724638e-06,
"loss": 0.1791,
"step": 29425
},
{
"epoch": 3.49,
"learning_rate": 1.6130434782608699e-06,
"loss": 0.1853,
"step": 29450
},
{
"epoch": 3.5,
"learning_rate": 1.6057971014492755e-06,
"loss": 0.2618,
"step": 29475
},
{
"epoch": 3.5,
"learning_rate": 1.5985507246376814e-06,
"loss": 0.2052,
"step": 29500
},
{
"epoch": 3.5,
"learning_rate": 1.591304347826087e-06,
"loss": 0.2185,
"step": 29525
},
{
"epoch": 3.51,
"learning_rate": 1.5840579710144928e-06,
"loss": 0.1305,
"step": 29550
},
{
"epoch": 3.51,
"learning_rate": 1.5768115942028985e-06,
"loss": 0.233,
"step": 29575
},
{
"epoch": 3.51,
"learning_rate": 1.5695652173913046e-06,
"loss": 0.2164,
"step": 29600
},
{
"epoch": 3.52,
"learning_rate": 1.5623188405797102e-06,
"loss": 0.1524,
"step": 29625
},
{
"epoch": 3.52,
"learning_rate": 1.555072463768116e-06,
"loss": 0.1961,
"step": 29650
},
{
"epoch": 3.52,
"learning_rate": 1.5478260869565217e-06,
"loss": 0.2242,
"step": 29675
},
{
"epoch": 3.52,
"learning_rate": 1.5405797101449278e-06,
"loss": 0.1997,
"step": 29700
},
{
"epoch": 3.53,
"learning_rate": 1.5333333333333334e-06,
"loss": 0.2001,
"step": 29725
},
{
"epoch": 3.53,
"learning_rate": 1.5260869565217393e-06,
"loss": 0.1888,
"step": 29750
},
{
"epoch": 3.53,
"learning_rate": 1.518840579710145e-06,
"loss": 0.2124,
"step": 29775
},
{
"epoch": 3.54,
"learning_rate": 1.5115942028985508e-06,
"loss": 0.2145,
"step": 29800
},
{
"epoch": 3.54,
"learning_rate": 1.5043478260869566e-06,
"loss": 0.2512,
"step": 29825
},
{
"epoch": 3.54,
"learning_rate": 1.4971014492753625e-06,
"loss": 0.1625,
"step": 29850
},
{
"epoch": 3.55,
"learning_rate": 1.4898550724637683e-06,
"loss": 0.1556,
"step": 29875
},
{
"epoch": 3.55,
"learning_rate": 1.482608695652174e-06,
"loss": 0.2134,
"step": 29900
},
{
"epoch": 3.55,
"learning_rate": 1.47536231884058e-06,
"loss": 0.1959,
"step": 29925
},
{
"epoch": 3.55,
"learning_rate": 1.4681159420289857e-06,
"loss": 0.197,
"step": 29950
},
{
"epoch": 3.56,
"learning_rate": 1.4608695652173915e-06,
"loss": 0.1825,
"step": 29975
},
{
"epoch": 3.56,
"learning_rate": 1.4536231884057972e-06,
"loss": 0.1701,
"step": 30000
},
{
"epoch": 3.56,
"eval_cer": 7.013625854690344,
"eval_loss": 0.3998452425003052,
"eval_runtime": 3192.2868,
"eval_samples_per_second": 0.777,
"eval_steps_per_second": 0.389,
"eval_wer": 18.834381551362682,
"step": 30000
},
{
"epoch": 3.56,
"step": 30000,
"total_flos": 1.9457998848e+18,
"train_loss": 0.0,
"train_runtime": 0.3469,
"train_samples_per_second": 14412.297,
"train_steps_per_second": 14412.297
},
{
"epoch": 3.56,
"eval_cer": 9.956974355224656,
"eval_loss": 0.7926790118217468,
"eval_runtime": 3112.2219,
"eval_samples_per_second": 0.696,
"eval_steps_per_second": 0.348,
"eval_wer": 31.400474471700036,
"step": 30000
}
],
"max_steps": 5000,
"num_train_epochs": 2,
"total_flos": 1.9457998848e+18,
"trial_name": null,
"trial_params": null
}