wav2vec2-xls-r-1b-cv9-fr / trainer_state.json
bofenghuang's picture
Initial commit
6e1a7c6
{
"best_metric": 0.12453306507935491,
"best_model_checkpoint": "./outputs/common_voice_9_0_fr/wav2vec2-xls-r-1b-ft-ep10/checkpoint-36000",
"epoch": 9.99996533675344,
"global_step": 36060,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.03,
"learning_rate": 2.6899611758180813e-06,
"loss": 9.4595,
"step": 100
},
{
"epoch": 0.06,
"learning_rate": 5.463117027176928e-06,
"loss": 3.1185,
"step": 200
},
{
"epoch": 0.08,
"learning_rate": 8.236272878535774e-06,
"loss": 2.9237,
"step": 300
},
{
"epoch": 0.11,
"learning_rate": 1.1009428729894621e-05,
"loss": 1.5923,
"step": 400
},
{
"epoch": 0.14,
"learning_rate": 1.3782584581253465e-05,
"loss": 0.9229,
"step": 500
},
{
"epoch": 0.14,
"eval_loss": 0.5048818588256836,
"eval_runtime": 835.7546,
"eval_samples_per_second": 19.193,
"eval_steps_per_second": 2.4,
"eval_wer": 0.4007663178937791,
"step": 500
},
{
"epoch": 0.17,
"learning_rate": 1.6555740432612314e-05,
"loss": 0.7777,
"step": 600
},
{
"epoch": 0.19,
"learning_rate": 1.932889628397116e-05,
"loss": 0.5771,
"step": 700
},
{
"epoch": 0.22,
"learning_rate": 2.2102052135330005e-05,
"loss": 0.4572,
"step": 800
},
{
"epoch": 0.25,
"learning_rate": 2.4875207986688854e-05,
"loss": 0.4048,
"step": 900
},
{
"epoch": 0.28,
"learning_rate": 2.7648363838047696e-05,
"loss": 0.3823,
"step": 1000
},
{
"epoch": 0.28,
"eval_loss": 0.2831491231918335,
"eval_runtime": 739.7164,
"eval_samples_per_second": 21.685,
"eval_steps_per_second": 2.712,
"eval_wer": 0.2296647038847704,
"step": 1000
},
{
"epoch": 0.31,
"learning_rate": 3.042151968940655e-05,
"loss": 0.3549,
"step": 1100
},
{
"epoch": 0.33,
"learning_rate": 3.319467554076539e-05,
"loss": 0.3433,
"step": 1200
},
{
"epoch": 0.36,
"learning_rate": 3.596783139212424e-05,
"loss": 0.328,
"step": 1300
},
{
"epoch": 0.39,
"learning_rate": 3.874098724348308e-05,
"loss": 0.3114,
"step": 1400
},
{
"epoch": 0.42,
"learning_rate": 4.1514143094841934e-05,
"loss": 0.3079,
"step": 1500
},
{
"epoch": 0.42,
"eval_loss": 0.23849168419837952,
"eval_runtime": 738.9338,
"eval_samples_per_second": 21.708,
"eval_steps_per_second": 2.715,
"eval_wer": 0.19510351058172243,
"step": 1500
},
{
"epoch": 0.44,
"learning_rate": 4.428729894620078e-05,
"loss": 0.3002,
"step": 1600
},
{
"epoch": 0.47,
"learning_rate": 4.7060454797559625e-05,
"loss": 0.2895,
"step": 1700
},
{
"epoch": 0.5,
"learning_rate": 4.983361064891847e-05,
"loss": 0.2936,
"step": 1800
},
{
"epoch": 0.53,
"learning_rate": 5.2606766500277316e-05,
"loss": 0.2908,
"step": 1900
},
{
"epoch": 0.55,
"learning_rate": 5.537992235163616e-05,
"loss": 0.2899,
"step": 2000
},
{
"epoch": 0.55,
"eval_loss": 0.22730602324008942,
"eval_runtime": 733.7734,
"eval_samples_per_second": 21.861,
"eval_steps_per_second": 2.734,
"eval_wer": 0.19783303752779183,
"step": 2000
},
{
"epoch": 0.58,
"learning_rate": 5.8153078202995014e-05,
"loss": 0.2815,
"step": 2100
},
{
"epoch": 0.61,
"learning_rate": 6.092623405435386e-05,
"loss": 0.2866,
"step": 2200
},
{
"epoch": 0.64,
"learning_rate": 6.36993899057127e-05,
"loss": 0.285,
"step": 2300
},
{
"epoch": 0.67,
"learning_rate": 6.647254575707154e-05,
"loss": 0.2864,
"step": 2400
},
{
"epoch": 0.69,
"learning_rate": 6.92457016084304e-05,
"loss": 0.2795,
"step": 2500
},
{
"epoch": 0.69,
"eval_loss": 0.23286376893520355,
"eval_runtime": 745.9448,
"eval_samples_per_second": 21.504,
"eval_steps_per_second": 2.689,
"eval_wer": 0.19834562474771097,
"step": 2500
},
{
"epoch": 0.72,
"learning_rate": 7.201885745978925e-05,
"loss": 0.2801,
"step": 2600
},
{
"epoch": 0.75,
"learning_rate": 7.47920133111481e-05,
"loss": 0.2814,
"step": 2700
},
{
"epoch": 0.78,
"learning_rate": 7.756516916250694e-05,
"loss": 0.2809,
"step": 2800
},
{
"epoch": 0.8,
"learning_rate": 8.033832501386578e-05,
"loss": 0.2846,
"step": 2900
},
{
"epoch": 0.83,
"learning_rate": 8.311148086522463e-05,
"loss": 0.2863,
"step": 3000
},
{
"epoch": 0.83,
"eval_loss": 0.22894535958766937,
"eval_runtime": 746.0584,
"eval_samples_per_second": 21.501,
"eval_steps_per_second": 2.689,
"eval_wer": 0.19914013493858565,
"step": 3000
},
{
"epoch": 0.86,
"learning_rate": 8.588463671658348e-05,
"loss": 0.2899,
"step": 3100
},
{
"epoch": 0.89,
"learning_rate": 8.865779256794232e-05,
"loss": 0.2825,
"step": 3200
},
{
"epoch": 0.92,
"learning_rate": 9.143094841930117e-05,
"loss": 0.2826,
"step": 3300
},
{
"epoch": 0.94,
"learning_rate": 9.420410427066003e-05,
"loss": 0.2896,
"step": 3400
},
{
"epoch": 0.97,
"learning_rate": 9.697726012201886e-05,
"loss": 0.3063,
"step": 3500
},
{
"epoch": 0.97,
"eval_loss": 0.2369552105665207,
"eval_runtime": 741.3652,
"eval_samples_per_second": 21.637,
"eval_steps_per_second": 2.706,
"eval_wer": 0.20460559617097346,
"step": 3500
},
{
"epoch": 1.0,
"learning_rate": 9.97504159733777e-05,
"loss": 0.2928,
"step": 3600
},
{
"epoch": 1.03,
"learning_rate": 9.971960313058483e-05,
"loss": 0.2767,
"step": 3700
},
{
"epoch": 1.05,
"learning_rate": 9.941147470265608e-05,
"loss": 0.2819,
"step": 3800
},
{
"epoch": 1.08,
"learning_rate": 9.910334627472732e-05,
"loss": 0.2789,
"step": 3900
},
{
"epoch": 1.11,
"learning_rate": 9.879521784679855e-05,
"loss": 0.2766,
"step": 4000
},
{
"epoch": 1.11,
"eval_loss": 0.23217500746250153,
"eval_runtime": 739.5397,
"eval_samples_per_second": 21.691,
"eval_steps_per_second": 2.712,
"eval_wer": 0.20213877017511261,
"step": 4000
},
{
"epoch": 1.14,
"learning_rate": 9.848708941886979e-05,
"loss": 0.2784,
"step": 4100
},
{
"epoch": 1.16,
"learning_rate": 9.817896099094103e-05,
"loss": 0.2712,
"step": 4200
},
{
"epoch": 1.19,
"learning_rate": 9.787083256301228e-05,
"loss": 0.2757,
"step": 4300
},
{
"epoch": 1.22,
"learning_rate": 9.75627041350835e-05,
"loss": 0.2775,
"step": 4400
},
{
"epoch": 1.25,
"learning_rate": 9.725457570715475e-05,
"loss": 0.2749,
"step": 4500
},
{
"epoch": 1.25,
"eval_loss": 0.23323854804039001,
"eval_runtime": 741.5404,
"eval_samples_per_second": 21.632,
"eval_steps_per_second": 2.705,
"eval_wer": 0.20545136508384004,
"step": 4500
},
{
"epoch": 1.28,
"learning_rate": 9.694644727922599e-05,
"loss": 0.2716,
"step": 4600
},
{
"epoch": 1.3,
"learning_rate": 9.663831885129723e-05,
"loss": 0.2718,
"step": 4700
},
{
"epoch": 1.33,
"learning_rate": 9.633019042336846e-05,
"loss": 0.2749,
"step": 4800
},
{
"epoch": 1.36,
"learning_rate": 9.60220619954397e-05,
"loss": 0.2718,
"step": 4900
},
{
"epoch": 1.39,
"learning_rate": 9.571393356751093e-05,
"loss": 0.2769,
"step": 5000
},
{
"epoch": 1.39,
"eval_loss": 0.23219896852970123,
"eval_runtime": 739.3463,
"eval_samples_per_second": 21.696,
"eval_steps_per_second": 2.713,
"eval_wer": 0.20350353364814733,
"step": 5000
},
{
"epoch": 1.41,
"learning_rate": 9.540580513958219e-05,
"loss": 0.2659,
"step": 5100
},
{
"epoch": 1.44,
"learning_rate": 9.509767671165342e-05,
"loss": 0.2668,
"step": 5200
},
{
"epoch": 1.47,
"learning_rate": 9.478954828372466e-05,
"loss": 0.2611,
"step": 5300
},
{
"epoch": 1.5,
"learning_rate": 9.44814198557959e-05,
"loss": 0.2678,
"step": 5400
},
{
"epoch": 1.53,
"learning_rate": 9.417329142786714e-05,
"loss": 0.2628,
"step": 5500
},
{
"epoch": 1.53,
"eval_loss": 0.22423435747623444,
"eval_runtime": 735.686,
"eval_samples_per_second": 21.804,
"eval_steps_per_second": 2.727,
"eval_wer": 0.19482799495101588,
"step": 5500
},
{
"epoch": 1.55,
"learning_rate": 9.386516299993839e-05,
"loss": 0.2608,
"step": 5600
},
{
"epoch": 1.58,
"learning_rate": 9.355703457200961e-05,
"loss": 0.2609,
"step": 5700
},
{
"epoch": 1.61,
"learning_rate": 9.324890614408086e-05,
"loss": 0.2592,
"step": 5800
},
{
"epoch": 1.64,
"learning_rate": 9.29407777161521e-05,
"loss": 0.2544,
"step": 5900
},
{
"epoch": 1.66,
"learning_rate": 9.263264928822334e-05,
"loss": 0.2614,
"step": 6000
},
{
"epoch": 1.66,
"eval_loss": 0.23026546835899353,
"eval_runtime": 738.1222,
"eval_samples_per_second": 21.732,
"eval_steps_per_second": 2.718,
"eval_wer": 0.19623760980579352,
"step": 6000
},
{
"epoch": 1.69,
"learning_rate": 9.232452086029457e-05,
"loss": 0.2555,
"step": 6100
},
{
"epoch": 1.72,
"learning_rate": 9.201639243236581e-05,
"loss": 0.2649,
"step": 6200
},
{
"epoch": 1.75,
"learning_rate": 9.170826400443706e-05,
"loss": 0.2518,
"step": 6300
},
{
"epoch": 1.77,
"learning_rate": 9.14001355765083e-05,
"loss": 0.2548,
"step": 6400
},
{
"epoch": 1.8,
"learning_rate": 9.109200714857953e-05,
"loss": 0.2547,
"step": 6500
},
{
"epoch": 1.8,
"eval_loss": 0.22376440465450287,
"eval_runtime": 739.914,
"eval_samples_per_second": 21.68,
"eval_steps_per_second": 2.711,
"eval_wer": 0.19202798726220757,
"step": 6500
},
{
"epoch": 1.83,
"learning_rate": 9.078387872065077e-05,
"loss": 0.2498,
"step": 6600
},
{
"epoch": 1.86,
"learning_rate": 9.047575029272201e-05,
"loss": 0.2545,
"step": 6700
},
{
"epoch": 1.89,
"learning_rate": 9.016762186479325e-05,
"loss": 0.2545,
"step": 6800
},
{
"epoch": 1.91,
"learning_rate": 8.98594934368645e-05,
"loss": 0.2438,
"step": 6900
},
{
"epoch": 1.94,
"learning_rate": 8.955136500893573e-05,
"loss": 0.2458,
"step": 7000
},
{
"epoch": 1.94,
"eval_loss": 0.21862062811851501,
"eval_runtime": 742.7999,
"eval_samples_per_second": 21.595,
"eval_steps_per_second": 2.701,
"eval_wer": 0.18936253371862807,
"step": 7000
},
{
"epoch": 1.97,
"learning_rate": 8.924323658100697e-05,
"loss": 0.2495,
"step": 7100
},
{
"epoch": 2.0,
"learning_rate": 8.893510815307821e-05,
"loss": 0.2477,
"step": 7200
},
{
"epoch": 2.02,
"learning_rate": 8.862697972514945e-05,
"loss": 0.2383,
"step": 7300
},
{
"epoch": 2.05,
"learning_rate": 8.831885129722068e-05,
"loss": 0.2373,
"step": 7400
},
{
"epoch": 2.08,
"learning_rate": 8.801072286929192e-05,
"loss": 0.231,
"step": 7500
},
{
"epoch": 2.08,
"eval_loss": 0.21694478392601013,
"eval_runtime": 747.3244,
"eval_samples_per_second": 21.465,
"eval_steps_per_second": 2.684,
"eval_wer": 0.1895291245651018,
"step": 7500
},
{
"epoch": 2.11,
"learning_rate": 8.770259444136317e-05,
"loss": 0.2338,
"step": 7600
},
{
"epoch": 2.14,
"learning_rate": 8.739446601343441e-05,
"loss": 0.2307,
"step": 7700
},
{
"epoch": 2.16,
"learning_rate": 8.708633758550564e-05,
"loss": 0.2375,
"step": 7800
},
{
"epoch": 2.19,
"learning_rate": 8.677820915757688e-05,
"loss": 0.2359,
"step": 7900
},
{
"epoch": 2.22,
"learning_rate": 8.647008072964812e-05,
"loss": 0.2309,
"step": 8000
},
{
"epoch": 2.22,
"eval_loss": 0.21314306557178497,
"eval_runtime": 736.606,
"eval_samples_per_second": 21.777,
"eval_steps_per_second": 2.723,
"eval_wer": 0.187011039847249,
"step": 8000
},
{
"epoch": 2.25,
"learning_rate": 8.616195230171936e-05,
"loss": 0.2342,
"step": 8100
},
{
"epoch": 2.27,
"learning_rate": 8.58538238737906e-05,
"loss": 0.2313,
"step": 8200
},
{
"epoch": 2.3,
"learning_rate": 8.554569544586184e-05,
"loss": 0.2299,
"step": 8300
},
{
"epoch": 2.33,
"learning_rate": 8.523756701793308e-05,
"loss": 0.2323,
"step": 8400
},
{
"epoch": 2.36,
"learning_rate": 8.492943859000432e-05,
"loss": 0.2258,
"step": 8500
},
{
"epoch": 2.36,
"eval_loss": 0.21330955624580383,
"eval_runtime": 733.2181,
"eval_samples_per_second": 21.878,
"eval_steps_per_second": 2.736,
"eval_wer": 0.18179546488457177,
"step": 8500
},
{
"epoch": 2.38,
"learning_rate": 8.462131016207556e-05,
"loss": 0.2263,
"step": 8600
},
{
"epoch": 2.41,
"learning_rate": 8.431318173414679e-05,
"loss": 0.2253,
"step": 8700
},
{
"epoch": 2.44,
"learning_rate": 8.400505330621803e-05,
"loss": 0.2302,
"step": 8800
},
{
"epoch": 2.47,
"learning_rate": 8.369692487828928e-05,
"loss": 0.2266,
"step": 8900
},
{
"epoch": 2.5,
"learning_rate": 8.338879645036052e-05,
"loss": 0.2278,
"step": 9000
},
{
"epoch": 2.5,
"eval_loss": 0.21764406561851501,
"eval_runtime": 744.2016,
"eval_samples_per_second": 21.555,
"eval_steps_per_second": 2.696,
"eval_wer": 0.1877799206771277,
"step": 9000
},
{
"epoch": 2.52,
"learning_rate": 8.308066802243175e-05,
"loss": 0.2313,
"step": 9100
},
{
"epoch": 2.55,
"learning_rate": 8.277253959450299e-05,
"loss": 0.2319,
"step": 9200
},
{
"epoch": 2.58,
"learning_rate": 8.246441116657423e-05,
"loss": 0.2264,
"step": 9300
},
{
"epoch": 2.61,
"learning_rate": 8.215628273864548e-05,
"loss": 0.2301,
"step": 9400
},
{
"epoch": 2.63,
"learning_rate": 8.18481543107167e-05,
"loss": 0.2263,
"step": 9500
},
{
"epoch": 2.63,
"eval_loss": 0.2029789835214615,
"eval_runtime": 742.9206,
"eval_samples_per_second": 21.592,
"eval_steps_per_second": 2.7,
"eval_wer": 0.18131491436589758,
"step": 9500
},
{
"epoch": 2.66,
"learning_rate": 8.154002588278795e-05,
"loss": 0.2287,
"step": 9600
},
{
"epoch": 2.69,
"learning_rate": 8.123189745485919e-05,
"loss": 0.2285,
"step": 9700
},
{
"epoch": 2.72,
"learning_rate": 8.092376902693043e-05,
"loss": 0.2272,
"step": 9800
},
{
"epoch": 2.75,
"learning_rate": 8.061564059900166e-05,
"loss": 0.226,
"step": 9900
},
{
"epoch": 2.77,
"learning_rate": 8.03075121710729e-05,
"loss": 0.2262,
"step": 10000
},
{
"epoch": 2.77,
"eval_loss": 0.2076706886291504,
"eval_runtime": 744.0741,
"eval_samples_per_second": 21.558,
"eval_steps_per_second": 2.696,
"eval_wer": 0.1823785328472298,
"step": 10000
},
{
"epoch": 2.8,
"learning_rate": 7.999938374314416e-05,
"loss": 0.2232,
"step": 10100
},
{
"epoch": 2.83,
"learning_rate": 7.969433659949467e-05,
"loss": 0.2214,
"step": 10200
},
{
"epoch": 2.86,
"learning_rate": 7.938620817156591e-05,
"loss": 0.2257,
"step": 10300
},
{
"epoch": 2.88,
"learning_rate": 7.907807974363715e-05,
"loss": 0.2191,
"step": 10400
},
{
"epoch": 2.91,
"learning_rate": 7.87699513157084e-05,
"loss": 0.2228,
"step": 10500
},
{
"epoch": 2.91,
"eval_loss": 0.21150091290473938,
"eval_runtime": 744.436,
"eval_samples_per_second": 21.548,
"eval_steps_per_second": 2.695,
"eval_wer": 0.1839739605692281,
"step": 10500
},
{
"epoch": 2.94,
"learning_rate": 7.846182288777964e-05,
"loss": 0.2249,
"step": 10600
},
{
"epoch": 2.97,
"learning_rate": 7.815369445985087e-05,
"loss": 0.2181,
"step": 10700
},
{
"epoch": 2.99,
"learning_rate": 7.784556603192211e-05,
"loss": 0.2203,
"step": 10800
},
{
"epoch": 3.02,
"learning_rate": 7.753743760399335e-05,
"loss": 0.2174,
"step": 10900
},
{
"epoch": 3.05,
"learning_rate": 7.72293091760646e-05,
"loss": 0.2118,
"step": 11000
},
{
"epoch": 3.05,
"eval_loss": 0.20934706926345825,
"eval_runtime": 749.3869,
"eval_samples_per_second": 21.405,
"eval_steps_per_second": 2.677,
"eval_wer": 0.17822016902563576,
"step": 11000
},
{
"epoch": 3.08,
"learning_rate": 7.692118074813582e-05,
"loss": 0.2136,
"step": 11100
},
{
"epoch": 3.11,
"learning_rate": 7.661305232020707e-05,
"loss": 0.2042,
"step": 11200
},
{
"epoch": 3.13,
"learning_rate": 7.630492389227831e-05,
"loss": 0.2078,
"step": 11300
},
{
"epoch": 3.16,
"learning_rate": 7.599679546434955e-05,
"loss": 0.2066,
"step": 11400
},
{
"epoch": 3.19,
"learning_rate": 7.568866703642078e-05,
"loss": 0.2073,
"step": 11500
},
{
"epoch": 3.19,
"eval_loss": 0.20042090117931366,
"eval_runtime": 741.0274,
"eval_samples_per_second": 21.647,
"eval_steps_per_second": 2.707,
"eval_wer": 0.1756380109052931,
"step": 11500
},
{
"epoch": 3.22,
"learning_rate": 7.538053860849202e-05,
"loss": 0.2026,
"step": 11600
},
{
"epoch": 3.24,
"learning_rate": 7.507241018056326e-05,
"loss": 0.2057,
"step": 11700
},
{
"epoch": 3.27,
"learning_rate": 7.47642817526345e-05,
"loss": 0.2023,
"step": 11800
},
{
"epoch": 3.3,
"learning_rate": 7.445615332470575e-05,
"loss": 0.2023,
"step": 11900
},
{
"epoch": 3.33,
"learning_rate": 7.414802489677698e-05,
"loss": 0.2015,
"step": 12000
},
{
"epoch": 3.33,
"eval_loss": 0.19883444905281067,
"eval_runtime": 747.9432,
"eval_samples_per_second": 21.447,
"eval_steps_per_second": 2.682,
"eval_wer": 0.17481787135342247,
"step": 12000
},
{
"epoch": 3.36,
"learning_rate": 7.383989646884822e-05,
"loss": 0.209,
"step": 12100
},
{
"epoch": 3.38,
"learning_rate": 7.353176804091946e-05,
"loss": 0.2073,
"step": 12200
},
{
"epoch": 3.41,
"learning_rate": 7.32236396129907e-05,
"loss": 0.2113,
"step": 12300
},
{
"epoch": 3.44,
"learning_rate": 7.291551118506193e-05,
"loss": 0.2087,
"step": 12400
},
{
"epoch": 3.47,
"learning_rate": 7.261046404141246e-05,
"loss": 0.214,
"step": 12500
},
{
"epoch": 3.47,
"eval_loss": 0.20877334475517273,
"eval_runtime": 743.8468,
"eval_samples_per_second": 21.565,
"eval_steps_per_second": 2.697,
"eval_wer": 0.18157120797585713,
"step": 12500
},
{
"epoch": 3.49,
"learning_rate": 7.230233561348371e-05,
"loss": 0.2059,
"step": 12600
},
{
"epoch": 3.52,
"learning_rate": 7.199420718555494e-05,
"loss": 0.2027,
"step": 12700
},
{
"epoch": 3.55,
"learning_rate": 7.168607875762618e-05,
"loss": 0.2057,
"step": 12800
},
{
"epoch": 3.58,
"learning_rate": 7.137795032969741e-05,
"loss": 0.2074,
"step": 12900
},
{
"epoch": 3.61,
"learning_rate": 7.106982190176867e-05,
"loss": 0.2075,
"step": 13000
},
{
"epoch": 3.61,
"eval_loss": 0.19755592942237854,
"eval_runtime": 739.5406,
"eval_samples_per_second": 21.69,
"eval_steps_per_second": 2.712,
"eval_wer": 0.1746256511459528,
"step": 13000
},
{
"epoch": 3.63,
"learning_rate": 7.07616934738399e-05,
"loss": 0.2004,
"step": 13100
},
{
"epoch": 3.66,
"learning_rate": 7.045356504591114e-05,
"loss": 0.2007,
"step": 13200
},
{
"epoch": 3.69,
"learning_rate": 7.014543661798237e-05,
"loss": 0.2027,
"step": 13300
},
{
"epoch": 3.72,
"learning_rate": 6.983730819005361e-05,
"loss": 0.2021,
"step": 13400
},
{
"epoch": 3.74,
"learning_rate": 6.952917976212485e-05,
"loss": 0.2039,
"step": 13500
},
{
"epoch": 3.74,
"eval_loss": 0.19584038853645325,
"eval_runtime": 734.9317,
"eval_samples_per_second": 21.827,
"eval_steps_per_second": 2.73,
"eval_wer": 0.17436935753599322,
"step": 13500
},
{
"epoch": 3.77,
"learning_rate": 6.922413261847538e-05,
"loss": 0.2054,
"step": 13600
},
{
"epoch": 3.8,
"learning_rate": 6.891600419054662e-05,
"loss": 0.2017,
"step": 13700
},
{
"epoch": 3.83,
"learning_rate": 6.860787576261786e-05,
"loss": 0.2021,
"step": 13800
},
{
"epoch": 3.85,
"learning_rate": 6.82997473346891e-05,
"loss": 0.1961,
"step": 13900
},
{
"epoch": 3.88,
"learning_rate": 6.799161890676035e-05,
"loss": 0.2003,
"step": 14000
},
{
"epoch": 3.88,
"eval_loss": 0.19312596321105957,
"eval_runtime": 744.5794,
"eval_samples_per_second": 21.544,
"eval_steps_per_second": 2.694,
"eval_wer": 0.16931396607954072,
"step": 14000
},
{
"epoch": 3.91,
"learning_rate": 6.768349047883158e-05,
"loss": 0.1996,
"step": 14100
},
{
"epoch": 3.94,
"learning_rate": 6.737536205090282e-05,
"loss": 0.1966,
"step": 14200
},
{
"epoch": 3.97,
"learning_rate": 6.706723362297406e-05,
"loss": 0.1976,
"step": 14300
},
{
"epoch": 3.99,
"learning_rate": 6.67591051950453e-05,
"loss": 0.201,
"step": 14400
},
{
"epoch": 4.02,
"learning_rate": 6.645097676711653e-05,
"loss": 0.1886,
"step": 14500
},
{
"epoch": 4.02,
"eval_loss": 0.19637233018875122,
"eval_runtime": 744.2941,
"eval_samples_per_second": 21.552,
"eval_steps_per_second": 2.695,
"eval_wer": 0.1686091586521519,
"step": 14500
},
{
"epoch": 4.05,
"learning_rate": 6.614284833918778e-05,
"loss": 0.1867,
"step": 14600
},
{
"epoch": 4.08,
"learning_rate": 6.583471991125902e-05,
"loss": 0.1885,
"step": 14700
},
{
"epoch": 4.1,
"learning_rate": 6.552659148333026e-05,
"loss": 0.1909,
"step": 14800
},
{
"epoch": 4.13,
"learning_rate": 6.521846305540149e-05,
"loss": 0.189,
"step": 14900
},
{
"epoch": 4.16,
"learning_rate": 6.491033462747273e-05,
"loss": 0.1943,
"step": 15000
},
{
"epoch": 4.16,
"eval_loss": 0.19862689077854156,
"eval_runtime": 743.0072,
"eval_samples_per_second": 21.589,
"eval_steps_per_second": 2.7,
"eval_wer": 0.1745615777434629,
"step": 15000
},
{
"epoch": 4.19,
"learning_rate": 6.460220619954397e-05,
"loss": 0.1936,
"step": 15100
},
{
"epoch": 4.22,
"learning_rate": 6.429407777161522e-05,
"loss": 0.1916,
"step": 15200
},
{
"epoch": 4.24,
"learning_rate": 6.398594934368644e-05,
"loss": 0.1916,
"step": 15300
},
{
"epoch": 4.27,
"learning_rate": 6.367782091575769e-05,
"loss": 0.1871,
"step": 15400
},
{
"epoch": 4.3,
"learning_rate": 6.336969248782893e-05,
"loss": 0.1919,
"step": 15500
},
{
"epoch": 4.3,
"eval_loss": 0.19568254053592682,
"eval_runtime": 742.9429,
"eval_samples_per_second": 21.591,
"eval_steps_per_second": 2.7,
"eval_wer": 0.17001877350692954,
"step": 15500
},
{
"epoch": 4.33,
"learning_rate": 6.306156405990017e-05,
"loss": 0.1955,
"step": 15600
},
{
"epoch": 4.35,
"learning_rate": 6.275343563197141e-05,
"loss": 0.1907,
"step": 15700
},
{
"epoch": 4.38,
"learning_rate": 6.244530720404264e-05,
"loss": 0.1931,
"step": 15800
},
{
"epoch": 4.41,
"learning_rate": 6.213717877611389e-05,
"loss": 0.1889,
"step": 15900
},
{
"epoch": 4.44,
"learning_rate": 6.182905034818513e-05,
"loss": 0.1857,
"step": 16000
},
{
"epoch": 4.44,
"eval_loss": 0.19073382019996643,
"eval_runtime": 741.2082,
"eval_samples_per_second": 21.642,
"eval_steps_per_second": 2.706,
"eval_wer": 0.16714828507538235,
"step": 16000
},
{
"epoch": 4.46,
"learning_rate": 6.152092192025637e-05,
"loss": 0.1768,
"step": 16100
},
{
"epoch": 4.49,
"learning_rate": 6.12127934923276e-05,
"loss": 0.1841,
"step": 16200
},
{
"epoch": 4.52,
"learning_rate": 6.090466506439885e-05,
"loss": 0.1874,
"step": 16300
},
{
"epoch": 4.55,
"learning_rate": 6.059653663647008e-05,
"loss": 0.1845,
"step": 16400
},
{
"epoch": 4.58,
"learning_rate": 6.0288408208541326e-05,
"loss": 0.1834,
"step": 16500
},
{
"epoch": 4.58,
"eval_loss": 0.18768635392189026,
"eval_runtime": 727.4352,
"eval_samples_per_second": 22.051,
"eval_steps_per_second": 2.758,
"eval_wer": 0.16405994707536956,
"step": 16500
},
{
"epoch": 4.6,
"learning_rate": 5.9980279780612555e-05,
"loss": 0.1811,
"step": 16600
},
{
"epoch": 4.63,
"learning_rate": 5.9675232636963086e-05,
"loss": 0.1828,
"step": 16700
},
{
"epoch": 4.66,
"learning_rate": 5.936710420903433e-05,
"loss": 0.1811,
"step": 16800
},
{
"epoch": 4.69,
"learning_rate": 5.9058975781105564e-05,
"loss": 0.1788,
"step": 16900
},
{
"epoch": 4.71,
"learning_rate": 5.8750847353176806e-05,
"loss": 0.18,
"step": 17000
},
{
"epoch": 4.71,
"eval_loss": 0.18282969295978546,
"eval_runtime": 737.0087,
"eval_samples_per_second": 21.765,
"eval_steps_per_second": 2.722,
"eval_wer": 0.16002332271850633,
"step": 17000
},
{
"epoch": 4.74,
"learning_rate": 5.844271892524804e-05,
"loss": 0.1777,
"step": 17100
},
{
"epoch": 4.77,
"learning_rate": 5.8134590497319284e-05,
"loss": 0.1831,
"step": 17200
},
{
"epoch": 4.8,
"learning_rate": 5.782646206939053e-05,
"loss": 0.1811,
"step": 17300
},
{
"epoch": 4.83,
"learning_rate": 5.751833364146176e-05,
"loss": 0.1772,
"step": 17400
},
{
"epoch": 4.85,
"learning_rate": 5.7210205213533005e-05,
"loss": 0.1774,
"step": 17500
},
{
"epoch": 4.85,
"eval_loss": 0.1862887740135193,
"eval_runtime": 738.0056,
"eval_samples_per_second": 21.736,
"eval_steps_per_second": 2.718,
"eval_wer": 0.1604590218554376,
"step": 17500
},
{
"epoch": 4.88,
"learning_rate": 5.690207678560424e-05,
"loss": 0.1761,
"step": 17600
},
{
"epoch": 4.91,
"learning_rate": 5.659394835767548e-05,
"loss": 0.1764,
"step": 17700
},
{
"epoch": 4.94,
"learning_rate": 5.628581992974672e-05,
"loss": 0.1781,
"step": 17800
},
{
"epoch": 4.96,
"learning_rate": 5.597769150181796e-05,
"loss": 0.1781,
"step": 17900
},
{
"epoch": 4.99,
"learning_rate": 5.5669563073889196e-05,
"loss": 0.1755,
"step": 18000
},
{
"epoch": 4.99,
"eval_loss": 0.18325339257717133,
"eval_runtime": 728.9102,
"eval_samples_per_second": 22.007,
"eval_steps_per_second": 2.752,
"eval_wer": 0.15946588411684426,
"step": 18000
},
{
"epoch": 5.02,
"learning_rate": 5.536143464596044e-05,
"loss": 0.1758,
"step": 18100
},
{
"epoch": 5.05,
"learning_rate": 5.5053306218031675e-05,
"loss": 0.163,
"step": 18200
},
{
"epoch": 5.07,
"learning_rate": 5.474517779010292e-05,
"loss": 0.1671,
"step": 18300
},
{
"epoch": 5.1,
"learning_rate": 5.443704936217415e-05,
"loss": 0.1723,
"step": 18400
},
{
"epoch": 5.13,
"learning_rate": 5.4128920934245395e-05,
"loss": 0.1692,
"step": 18500
},
{
"epoch": 5.13,
"eval_loss": 0.18143832683563232,
"eval_runtime": 741.2319,
"eval_samples_per_second": 21.641,
"eval_steps_per_second": 2.706,
"eval_wer": 0.15686450397575463,
"step": 18500
},
{
"epoch": 5.16,
"learning_rate": 5.382079250631663e-05,
"loss": 0.1714,
"step": 18600
},
{
"epoch": 5.19,
"learning_rate": 5.351266407838787e-05,
"loss": 0.1638,
"step": 18700
},
{
"epoch": 5.21,
"learning_rate": 5.320453565045911e-05,
"loss": 0.1626,
"step": 18800
},
{
"epoch": 5.24,
"learning_rate": 5.289640722253035e-05,
"loss": 0.1657,
"step": 18900
},
{
"epoch": 5.27,
"learning_rate": 5.25882787946016e-05,
"loss": 0.1674,
"step": 19000
},
{
"epoch": 5.27,
"eval_loss": 0.18194520473480225,
"eval_runtime": 737.6255,
"eval_samples_per_second": 21.747,
"eval_steps_per_second": 2.72,
"eval_wer": 0.15655054430355414,
"step": 19000
},
{
"epoch": 5.3,
"learning_rate": 5.228015036667283e-05,
"loss": 0.1657,
"step": 19100
},
{
"epoch": 5.32,
"learning_rate": 5.197202193874408e-05,
"loss": 0.1663,
"step": 19200
},
{
"epoch": 5.35,
"learning_rate": 5.166389351081531e-05,
"loss": 0.1683,
"step": 19300
},
{
"epoch": 5.38,
"learning_rate": 5.135884636716584e-05,
"loss": 0.1716,
"step": 19400
},
{
"epoch": 5.41,
"learning_rate": 5.105071793923708e-05,
"loss": 0.1664,
"step": 19500
},
{
"epoch": 5.41,
"eval_loss": 0.18048684298992157,
"eval_runtime": 745.2746,
"eval_samples_per_second": 21.524,
"eval_steps_per_second": 2.692,
"eval_wer": 0.15724894439069398,
"step": 19500
},
{
"epoch": 5.44,
"learning_rate": 5.0742589511308316e-05,
"loss": 0.1714,
"step": 19600
},
{
"epoch": 5.46,
"learning_rate": 5.043446108337956e-05,
"loss": 0.1686,
"step": 19700
},
{
"epoch": 5.49,
"learning_rate": 5.0126332655450794e-05,
"loss": 0.1672,
"step": 19800
},
{
"epoch": 5.52,
"learning_rate": 4.9818204227522036e-05,
"loss": 0.1657,
"step": 19900
},
{
"epoch": 5.55,
"learning_rate": 4.951007579959328e-05,
"loss": 0.1677,
"step": 20000
},
{
"epoch": 5.55,
"eval_loss": 0.1802615374326706,
"eval_runtime": 735.367,
"eval_samples_per_second": 21.814,
"eval_steps_per_second": 2.728,
"eval_wer": 0.15595466166039815,
"step": 20000
},
{
"epoch": 5.57,
"learning_rate": 4.9201947371664514e-05,
"loss": 0.1659,
"step": 20100
},
{
"epoch": 5.6,
"learning_rate": 4.889381894373575e-05,
"loss": 0.1663,
"step": 20200
},
{
"epoch": 5.63,
"learning_rate": 4.858569051580699e-05,
"loss": 0.167,
"step": 20300
},
{
"epoch": 5.66,
"learning_rate": 4.827756208787823e-05,
"loss": 0.1667,
"step": 20400
},
{
"epoch": 5.68,
"learning_rate": 4.796943365994947e-05,
"loss": 0.1637,
"step": 20500
},
{
"epoch": 5.68,
"eval_loss": 0.17502419650554657,
"eval_runtime": 733.6051,
"eval_samples_per_second": 21.866,
"eval_steps_per_second": 2.734,
"eval_wer": 0.15248188324544598,
"step": 20500
},
{
"epoch": 5.71,
"learning_rate": 4.7661305232020706e-05,
"loss": 0.1609,
"step": 20600
},
{
"epoch": 5.74,
"learning_rate": 4.735317680409195e-05,
"loss": 0.1658,
"step": 20700
},
{
"epoch": 5.77,
"learning_rate": 4.7045048376163184e-05,
"loss": 0.1671,
"step": 20800
},
{
"epoch": 5.8,
"learning_rate": 4.6736919948234426e-05,
"loss": 0.1631,
"step": 20900
},
{
"epoch": 5.82,
"learning_rate": 4.643187280458495e-05,
"loss": 0.1628,
"step": 21000
},
{
"epoch": 5.82,
"eval_loss": 0.17739933729171753,
"eval_runtime": 734.3058,
"eval_samples_per_second": 21.845,
"eval_steps_per_second": 2.732,
"eval_wer": 0.1531866906728348,
"step": 21000
},
{
"epoch": 5.85,
"learning_rate": 4.612374437665619e-05,
"loss": 0.166,
"step": 21100
},
{
"epoch": 5.88,
"learning_rate": 4.581561594872743e-05,
"loss": 0.1666,
"step": 21200
},
{
"epoch": 5.91,
"learning_rate": 4.550748752079867e-05,
"loss": 0.1623,
"step": 21300
},
{
"epoch": 5.93,
"learning_rate": 4.5199359092869906e-05,
"loss": 0.166,
"step": 21400
},
{
"epoch": 5.96,
"learning_rate": 4.489123066494115e-05,
"loss": 0.1645,
"step": 21500
},
{
"epoch": 5.96,
"eval_loss": 0.1743806153535843,
"eval_runtime": 735.7033,
"eval_samples_per_second": 21.804,
"eval_steps_per_second": 2.727,
"eval_wer": 0.15269332547366263,
"step": 21500
},
{
"epoch": 5.99,
"learning_rate": 4.4583102237012384e-05,
"loss": 0.1625,
"step": 21600
},
{
"epoch": 6.02,
"learning_rate": 4.427497380908363e-05,
"loss": 0.1587,
"step": 21700
},
{
"epoch": 6.05,
"learning_rate": 4.396684538115487e-05,
"loss": 0.1545,
"step": 21800
},
{
"epoch": 6.07,
"learning_rate": 4.365871695322611e-05,
"loss": 0.1524,
"step": 21900
},
{
"epoch": 6.1,
"learning_rate": 4.335058852529735e-05,
"loss": 0.1551,
"step": 22000
},
{
"epoch": 6.1,
"eval_loss": 0.17782124876976013,
"eval_runtime": 736.3789,
"eval_samples_per_second": 21.784,
"eval_steps_per_second": 2.724,
"eval_wer": 0.15429516053590994,
"step": 22000
},
{
"epoch": 6.13,
"learning_rate": 4.304246009736859e-05,
"loss": 0.1528,
"step": 22100
},
{
"epoch": 6.16,
"learning_rate": 4.2734331669439825e-05,
"loss": 0.1513,
"step": 22200
},
{
"epoch": 6.18,
"learning_rate": 4.242620324151107e-05,
"loss": 0.1527,
"step": 22300
},
{
"epoch": 6.21,
"learning_rate": 4.21180748135823e-05,
"loss": 0.1522,
"step": 22400
},
{
"epoch": 6.24,
"learning_rate": 4.1809946385653545e-05,
"loss": 0.1505,
"step": 22500
},
{
"epoch": 6.24,
"eval_loss": 0.1753922700881958,
"eval_runtime": 732.6709,
"eval_samples_per_second": 21.894,
"eval_steps_per_second": 2.738,
"eval_wer": 0.15279584291764645,
"step": 22500
},
{
"epoch": 6.27,
"learning_rate": 4.150181795772478e-05,
"loss": 0.1528,
"step": 22600
},
{
"epoch": 6.3,
"learning_rate": 4.119368952979602e-05,
"loss": 0.1533,
"step": 22700
},
{
"epoch": 6.32,
"learning_rate": 4.088556110186726e-05,
"loss": 0.1529,
"step": 22800
},
{
"epoch": 6.35,
"learning_rate": 4.05774326739385e-05,
"loss": 0.1516,
"step": 22900
},
{
"epoch": 6.38,
"learning_rate": 4.026930424600974e-05,
"loss": 0.1499,
"step": 23000
},
{
"epoch": 6.38,
"eval_loss": 0.17432022094726562,
"eval_runtime": 727.4564,
"eval_samples_per_second": 22.051,
"eval_steps_per_second": 2.758,
"eval_wer": 0.14998302054834017,
"step": 23000
},
{
"epoch": 6.41,
"learning_rate": 3.996117581808097e-05,
"loss": 0.1494,
"step": 23100
},
{
"epoch": 6.43,
"learning_rate": 3.9653047390152215e-05,
"loss": 0.1517,
"step": 23200
},
{
"epoch": 6.46,
"learning_rate": 3.934491896222346e-05,
"loss": 0.1485,
"step": 23300
},
{
"epoch": 6.49,
"learning_rate": 3.90367905342947e-05,
"loss": 0.1472,
"step": 23400
},
{
"epoch": 6.52,
"learning_rate": 3.8728662106365935e-05,
"loss": 0.1491,
"step": 23500
},
{
"epoch": 6.52,
"eval_loss": 0.1684291511774063,
"eval_runtime": 725.7122,
"eval_samples_per_second": 22.104,
"eval_steps_per_second": 2.764,
"eval_wer": 0.1472855303035157,
"step": 23500
},
{
"epoch": 6.54,
"learning_rate": 3.842053367843718e-05,
"loss": 0.1466,
"step": 23600
},
{
"epoch": 6.57,
"learning_rate": 3.8112405250508413e-05,
"loss": 0.1454,
"step": 23700
},
{
"epoch": 6.6,
"learning_rate": 3.7804276822579656e-05,
"loss": 0.1473,
"step": 23800
},
{
"epoch": 6.63,
"learning_rate": 3.749614839465089e-05,
"loss": 0.1447,
"step": 23900
},
{
"epoch": 6.66,
"learning_rate": 3.7188019966722134e-05,
"loss": 0.1477,
"step": 24000
},
{
"epoch": 6.66,
"eval_loss": 0.16609960794448853,
"eval_runtime": 737.8035,
"eval_samples_per_second": 21.742,
"eval_steps_per_second": 2.719,
"eval_wer": 0.14721504956077683,
"step": 24000
},
{
"epoch": 6.68,
"learning_rate": 3.687989153879337e-05,
"loss": 0.1499,
"step": 24100
},
{
"epoch": 6.71,
"learning_rate": 3.657176311086461e-05,
"loss": 0.1468,
"step": 24200
},
{
"epoch": 6.74,
"learning_rate": 3.626363468293585e-05,
"loss": 0.1481,
"step": 24300
},
{
"epoch": 6.77,
"learning_rate": 3.595550625500709e-05,
"loss": 0.1485,
"step": 24400
},
{
"epoch": 6.79,
"learning_rate": 3.5647377827078326e-05,
"loss": 0.1456,
"step": 24500
},
{
"epoch": 6.79,
"eval_loss": 0.1653786450624466,
"eval_runtime": 730.3018,
"eval_samples_per_second": 21.965,
"eval_steps_per_second": 2.747,
"eval_wer": 0.14399856475578424,
"step": 24500
},
{
"epoch": 6.82,
"learning_rate": 3.533924939914957e-05,
"loss": 0.1442,
"step": 24600
},
{
"epoch": 6.85,
"learning_rate": 3.5031120971220804e-05,
"loss": 0.1434,
"step": 24700
},
{
"epoch": 6.88,
"learning_rate": 3.4722992543292046e-05,
"loss": 0.1494,
"step": 24800
},
{
"epoch": 6.91,
"learning_rate": 3.441486411536329e-05,
"loss": 0.1463,
"step": 24900
},
{
"epoch": 6.93,
"learning_rate": 3.4106735687434524e-05,
"loss": 0.1415,
"step": 25000
},
{
"epoch": 6.93,
"eval_loss": 0.16542479395866394,
"eval_runtime": 729.304,
"eval_samples_per_second": 21.995,
"eval_steps_per_second": 2.751,
"eval_wer": 0.14476744558566293,
"step": 25000
},
{
"epoch": 6.96,
"learning_rate": 3.3798607259505766e-05,
"loss": 0.1413,
"step": 25100
},
{
"epoch": 6.99,
"learning_rate": 3.3490478831577e-05,
"loss": 0.1461,
"step": 25200
},
{
"epoch": 7.02,
"learning_rate": 3.3182350403648244e-05,
"loss": 0.1392,
"step": 25300
},
{
"epoch": 7.04,
"learning_rate": 3.287422197571948e-05,
"loss": 0.1311,
"step": 25400
},
{
"epoch": 7.07,
"learning_rate": 3.256609354779072e-05,
"loss": 0.136,
"step": 25500
},
{
"epoch": 7.07,
"eval_loss": 0.1615738570690155,
"eval_runtime": 742.2272,
"eval_samples_per_second": 21.612,
"eval_steps_per_second": 2.703,
"eval_wer": 0.1406667478263098,
"step": 25500
},
{
"epoch": 7.1,
"learning_rate": 3.225796511986196e-05,
"loss": 0.1328,
"step": 25600
},
{
"epoch": 7.13,
"learning_rate": 3.19498366919332e-05,
"loss": 0.1355,
"step": 25700
},
{
"epoch": 7.15,
"learning_rate": 3.164787083256301e-05,
"loss": 0.1378,
"step": 25800
},
{
"epoch": 7.18,
"learning_rate": 3.1339742404634255e-05,
"loss": 0.1321,
"step": 25900
},
{
"epoch": 7.21,
"learning_rate": 3.103161397670549e-05,
"loss": 0.132,
"step": 26000
},
{
"epoch": 7.21,
"eval_loss": 0.16245120763778687,
"eval_runtime": 782.6075,
"eval_samples_per_second": 20.497,
"eval_steps_per_second": 2.563,
"eval_wer": 0.14099992951925727,
"step": 26000
},
{
"epoch": 7.24,
"learning_rate": 3.072348554877673e-05,
"loss": 0.133,
"step": 26100
},
{
"epoch": 7.27,
"learning_rate": 3.0415357120847972e-05,
"loss": 0.1325,
"step": 26200
},
{
"epoch": 7.29,
"learning_rate": 3.010722869291921e-05,
"loss": 0.1323,
"step": 26300
},
{
"epoch": 7.32,
"learning_rate": 2.9799100264990447e-05,
"loss": 0.1347,
"step": 26400
},
{
"epoch": 7.35,
"learning_rate": 2.9490971837061686e-05,
"loss": 0.1323,
"step": 26500
},
{
"epoch": 7.35,
"eval_loss": 0.16042262315750122,
"eval_runtime": 776.612,
"eval_samples_per_second": 20.655,
"eval_steps_per_second": 2.583,
"eval_wer": 0.14037201017485632,
"step": 26500
},
{
"epoch": 7.38,
"learning_rate": 2.9182843409132925e-05,
"loss": 0.1321,
"step": 26600
},
{
"epoch": 7.4,
"learning_rate": 2.8874714981204164e-05,
"loss": 0.1328,
"step": 26700
},
{
"epoch": 7.43,
"learning_rate": 2.8566586553275403e-05,
"loss": 0.1312,
"step": 26800
},
{
"epoch": 7.46,
"learning_rate": 2.825845812534665e-05,
"loss": 0.1328,
"step": 26900
},
{
"epoch": 7.49,
"learning_rate": 2.7950329697417887e-05,
"loss": 0.1338,
"step": 27000
},
{
"epoch": 7.49,
"eval_loss": 0.1574241816997528,
"eval_runtime": 761.9403,
"eval_samples_per_second": 21.053,
"eval_steps_per_second": 2.633,
"eval_wer": 0.1386484356478782,
"step": 27000
},
{
"epoch": 7.52,
"learning_rate": 2.7642201269489126e-05,
"loss": 0.1318,
"step": 27100
},
{
"epoch": 7.54,
"learning_rate": 2.7334072841560365e-05,
"loss": 0.1319,
"step": 27200
},
{
"epoch": 7.57,
"learning_rate": 2.7025944413631604e-05,
"loss": 0.1315,
"step": 27300
},
{
"epoch": 7.6,
"learning_rate": 2.6717815985702843e-05,
"loss": 0.1328,
"step": 27400
},
{
"epoch": 7.63,
"learning_rate": 2.6409687557774082e-05,
"loss": 0.13,
"step": 27500
},
{
"epoch": 7.63,
"eval_loss": 0.15763409435749054,
"eval_runtime": 758.2506,
"eval_samples_per_second": 21.155,
"eval_steps_per_second": 2.646,
"eval_wer": 0.13843058607941258,
"step": 27500
},
{
"epoch": 7.65,
"learning_rate": 2.610155912984532e-05,
"loss": 0.1278,
"step": 27600
},
{
"epoch": 7.68,
"learning_rate": 2.579343070191656e-05,
"loss": 0.1299,
"step": 27700
},
{
"epoch": 7.71,
"learning_rate": 2.54853022739878e-05,
"loss": 0.13,
"step": 27800
},
{
"epoch": 7.74,
"learning_rate": 2.517717384605904e-05,
"loss": 0.1306,
"step": 27900
},
{
"epoch": 7.76,
"learning_rate": 2.4869045418130278e-05,
"loss": 0.1291,
"step": 28000
},
{
"epoch": 7.76,
"eval_loss": 0.15506793558597565,
"eval_runtime": 748.8913,
"eval_samples_per_second": 21.42,
"eval_steps_per_second": 2.679,
"eval_wer": 0.1365660500669567,
"step": 28000
},
{
"epoch": 7.79,
"learning_rate": 2.456091699020152e-05,
"loss": 0.1277,
"step": 28100
},
{
"epoch": 7.82,
"learning_rate": 2.425278856227276e-05,
"loss": 0.1292,
"step": 28200
},
{
"epoch": 7.85,
"learning_rate": 2.3944660134343998e-05,
"loss": 0.1304,
"step": 28300
},
{
"epoch": 7.88,
"learning_rate": 2.3636531706415237e-05,
"loss": 0.1306,
"step": 28400
},
{
"epoch": 7.9,
"learning_rate": 2.3328403278486473e-05,
"loss": 0.1277,
"step": 28500
},
{
"epoch": 7.9,
"eval_loss": 0.15418410301208496,
"eval_runtime": 753.0273,
"eval_samples_per_second": 21.302,
"eval_steps_per_second": 2.664,
"eval_wer": 0.1355536903076164,
"step": 28500
},
{
"epoch": 7.93,
"learning_rate": 2.302027485055771e-05,
"loss": 0.127,
"step": 28600
},
{
"epoch": 7.96,
"learning_rate": 2.271214642262895e-05,
"loss": 0.1283,
"step": 28700
},
{
"epoch": 7.99,
"learning_rate": 2.240401799470019e-05,
"loss": 0.1316,
"step": 28800
},
{
"epoch": 8.01,
"learning_rate": 2.2095889566771432e-05,
"loss": 0.1246,
"step": 28900
},
{
"epoch": 8.04,
"learning_rate": 2.178776113884267e-05,
"loss": 0.1241,
"step": 29000
},
{
"epoch": 8.04,
"eval_loss": 0.15454024076461792,
"eval_runtime": 764.5389,
"eval_samples_per_second": 20.981,
"eval_steps_per_second": 2.624,
"eval_wer": 0.13500906638645233,
"step": 29000
},
{
"epoch": 8.07,
"learning_rate": 2.147963271091391e-05,
"loss": 0.1229,
"step": 29100
},
{
"epoch": 8.1,
"learning_rate": 2.117150428298515e-05,
"loss": 0.1252,
"step": 29200
},
{
"epoch": 8.13,
"learning_rate": 2.0863375855056388e-05,
"loss": 0.123,
"step": 29300
},
{
"epoch": 8.15,
"learning_rate": 2.0555247427127627e-05,
"loss": 0.1198,
"step": 29400
},
{
"epoch": 8.18,
"learning_rate": 2.0247118999198866e-05,
"loss": 0.1198,
"step": 29500
},
{
"epoch": 8.18,
"eval_loss": 0.15356162190437317,
"eval_runtime": 730.0324,
"eval_samples_per_second": 21.973,
"eval_steps_per_second": 2.748,
"eval_wer": 0.13224109539888898,
"step": 29500
},
{
"epoch": 8.21,
"learning_rate": 1.9938990571270105e-05,
"loss": 0.1203,
"step": 29600
},
{
"epoch": 8.24,
"learning_rate": 1.9630862143341347e-05,
"loss": 0.1225,
"step": 29700
},
{
"epoch": 8.26,
"learning_rate": 1.9322733715412586e-05,
"loss": 0.1192,
"step": 29800
},
{
"epoch": 8.29,
"learning_rate": 1.9014605287483825e-05,
"loss": 0.1218,
"step": 29900
},
{
"epoch": 8.32,
"learning_rate": 1.8706476859555064e-05,
"loss": 0.1204,
"step": 30000
},
{
"epoch": 8.32,
"eval_loss": 0.15469121932983398,
"eval_runtime": 731.8162,
"eval_samples_per_second": 21.919,
"eval_steps_per_second": 2.741,
"eval_wer": 0.13368915429516054,
"step": 30000
},
{
"epoch": 8.35,
"learning_rate": 1.8398348431626303e-05,
"loss": 0.1202,
"step": 30100
},
{
"epoch": 8.37,
"learning_rate": 1.8090220003697542e-05,
"loss": 0.1198,
"step": 30200
},
{
"epoch": 8.4,
"learning_rate": 1.778209157576878e-05,
"loss": 0.1159,
"step": 30300
},
{
"epoch": 8.43,
"learning_rate": 1.747396314784002e-05,
"loss": 0.1193,
"step": 30400
},
{
"epoch": 8.46,
"learning_rate": 1.716583471991126e-05,
"loss": 0.1195,
"step": 30500
},
{
"epoch": 8.46,
"eval_loss": 0.14937089383602142,
"eval_runtime": 730.1876,
"eval_samples_per_second": 21.968,
"eval_steps_per_second": 2.747,
"eval_wer": 0.13088273926610325,
"step": 30500
},
{
"epoch": 8.49,
"learning_rate": 1.68577062919825e-05,
"loss": 0.1176,
"step": 30600
},
{
"epoch": 8.51,
"learning_rate": 1.6549577864053738e-05,
"loss": 0.1162,
"step": 30700
},
{
"epoch": 8.54,
"learning_rate": 1.6241449436124977e-05,
"loss": 0.1185,
"step": 30800
},
{
"epoch": 8.57,
"learning_rate": 1.5936402292475504e-05,
"loss": 0.1164,
"step": 30900
},
{
"epoch": 8.6,
"learning_rate": 1.5628273864546743e-05,
"loss": 0.1169,
"step": 31000
},
{
"epoch": 8.6,
"eval_loss": 0.14900121092796326,
"eval_runtime": 740.5566,
"eval_samples_per_second": 21.661,
"eval_steps_per_second": 2.709,
"eval_wer": 0.12999852631174275,
"step": 31000
},
{
"epoch": 8.62,
"learning_rate": 1.5320145436617982e-05,
"loss": 0.1173,
"step": 31100
},
{
"epoch": 8.65,
"learning_rate": 1.5012017008689223e-05,
"loss": 0.1163,
"step": 31200
},
{
"epoch": 8.68,
"learning_rate": 1.4703888580760462e-05,
"loss": 0.1169,
"step": 31300
},
{
"epoch": 8.71,
"learning_rate": 1.43957601528317e-05,
"loss": 0.1172,
"step": 31400
},
{
"epoch": 8.74,
"learning_rate": 1.4087631724902941e-05,
"loss": 0.1159,
"step": 31500
},
{
"epoch": 8.74,
"eval_loss": 0.14852623641490936,
"eval_runtime": 733.0221,
"eval_samples_per_second": 21.883,
"eval_steps_per_second": 2.737,
"eval_wer": 0.13053033555240884,
"step": 31500
},
{
"epoch": 8.76,
"learning_rate": 1.377950329697418e-05,
"loss": 0.1147,
"step": 31600
},
{
"epoch": 8.79,
"learning_rate": 1.347137486904542e-05,
"loss": 0.1161,
"step": 31700
},
{
"epoch": 8.82,
"learning_rate": 1.3163246441116658e-05,
"loss": 0.1145,
"step": 31800
},
{
"epoch": 8.85,
"learning_rate": 1.2855118013187897e-05,
"loss": 0.1156,
"step": 31900
},
{
"epoch": 8.87,
"learning_rate": 1.2546989585259136e-05,
"loss": 0.1142,
"step": 32000
},
{
"epoch": 8.87,
"eval_loss": 0.1478671133518219,
"eval_runtime": 734.6914,
"eval_samples_per_second": 21.834,
"eval_steps_per_second": 2.73,
"eval_wer": 0.12915275739887616,
"step": 32000
},
{
"epoch": 8.9,
"learning_rate": 1.2238861157330375e-05,
"loss": 0.116,
"step": 32100
},
{
"epoch": 8.93,
"learning_rate": 1.1930732729401616e-05,
"loss": 0.1132,
"step": 32200
},
{
"epoch": 8.96,
"learning_rate": 1.1622604301472855e-05,
"loss": 0.1141,
"step": 32300
},
{
"epoch": 8.98,
"learning_rate": 1.1314475873544094e-05,
"loss": 0.1142,
"step": 32400
},
{
"epoch": 9.01,
"learning_rate": 1.1006347445615333e-05,
"loss": 0.1087,
"step": 32500
},
{
"epoch": 9.01,
"eval_loss": 0.14710813760757446,
"eval_runtime": 730.6434,
"eval_samples_per_second": 21.955,
"eval_steps_per_second": 2.746,
"eval_wer": 0.12841591327024238,
"step": 32500
},
{
"epoch": 9.04,
"learning_rate": 1.0698219017686572e-05,
"loss": 0.1094,
"step": 32600
},
{
"epoch": 9.07,
"learning_rate": 1.0390090589757811e-05,
"loss": 0.1072,
"step": 32700
},
{
"epoch": 9.1,
"learning_rate": 1.008196216182905e-05,
"loss": 0.1082,
"step": 32800
},
{
"epoch": 9.12,
"learning_rate": 9.773833733900289e-06,
"loss": 0.1097,
"step": 32900
},
{
"epoch": 9.15,
"learning_rate": 9.46570530597153e-06,
"loss": 0.1076,
"step": 33000
},
{
"epoch": 9.15,
"eval_loss": 0.14665587246418,
"eval_runtime": 789.1119,
"eval_samples_per_second": 20.328,
"eval_steps_per_second": 2.542,
"eval_wer": 0.12696144703372184,
"step": 33000
},
{
"epoch": 9.18,
"learning_rate": 9.157576878042769e-06,
"loss": 0.111,
"step": 33100
},
{
"epoch": 9.21,
"learning_rate": 8.849448450114008e-06,
"loss": 0.1092,
"step": 33200
},
{
"epoch": 9.23,
"learning_rate": 8.541320022185247e-06,
"loss": 0.1103,
"step": 33300
},
{
"epoch": 9.26,
"learning_rate": 8.233191594256488e-06,
"loss": 0.1057,
"step": 33400
},
{
"epoch": 9.29,
"learning_rate": 7.928144450607015e-06,
"loss": 0.1078,
"step": 33500
},
{
"epoch": 9.29,
"eval_loss": 0.14669346809387207,
"eval_runtime": 776.8801,
"eval_samples_per_second": 20.648,
"eval_steps_per_second": 2.582,
"eval_wer": 0.12701911309596273,
"step": 33500
},
{
"epoch": 9.32,
"learning_rate": 7.620016022678253e-06,
"loss": 0.1106,
"step": 33600
},
{
"epoch": 9.35,
"learning_rate": 7.311887594749492e-06,
"loss": 0.1057,
"step": 33700
},
{
"epoch": 9.37,
"learning_rate": 7.003759166820731e-06,
"loss": 0.1069,
"step": 33800
},
{
"epoch": 9.4,
"learning_rate": 6.695630738891971e-06,
"loss": 0.1089,
"step": 33900
},
{
"epoch": 9.43,
"learning_rate": 6.38750231096321e-06,
"loss": 0.1073,
"step": 34000
},
{
"epoch": 9.43,
"eval_loss": 0.14469479024410248,
"eval_runtime": 770.0295,
"eval_samples_per_second": 20.832,
"eval_steps_per_second": 2.605,
"eval_wer": 0.1256159055814341,
"step": 34000
},
{
"epoch": 9.46,
"learning_rate": 6.079373883034449e-06,
"loss": 0.1056,
"step": 34100
},
{
"epoch": 9.48,
"learning_rate": 5.771245455105688e-06,
"loss": 0.105,
"step": 34200
},
{
"epoch": 9.51,
"learning_rate": 5.463117027176928e-06,
"loss": 0.1078,
"step": 34300
},
{
"epoch": 9.54,
"learning_rate": 5.154988599248167e-06,
"loss": 0.1061,
"step": 34400
},
{
"epoch": 9.57,
"learning_rate": 4.8468601713194066e-06,
"loss": 0.108,
"step": 34500
},
{
"epoch": 9.57,
"eval_loss": 0.14469197392463684,
"eval_runtime": 768.5913,
"eval_samples_per_second": 20.871,
"eval_steps_per_second": 2.61,
"eval_wer": 0.1257248303656669,
"step": 34500
},
{
"epoch": 9.6,
"learning_rate": 4.538731743390645e-06,
"loss": 0.106,
"step": 34600
},
{
"epoch": 9.62,
"learning_rate": 4.230603315461885e-06,
"loss": 0.1076,
"step": 34700
},
{
"epoch": 9.65,
"learning_rate": 3.922474887533124e-06,
"loss": 0.1065,
"step": 34800
},
{
"epoch": 9.68,
"learning_rate": 3.6143464596043634e-06,
"loss": 0.1045,
"step": 34900
},
{
"epoch": 9.71,
"learning_rate": 3.306218031675602e-06,
"loss": 0.106,
"step": 35000
},
{
"epoch": 9.71,
"eval_loss": 0.14382557570934296,
"eval_runtime": 768.3649,
"eval_samples_per_second": 20.877,
"eval_steps_per_second": 2.611,
"eval_wer": 0.1254813514362053,
"step": 35000
},
{
"epoch": 9.73,
"learning_rate": 2.998089603746842e-06,
"loss": 0.1051,
"step": 35100
},
{
"epoch": 9.76,
"learning_rate": 2.6899611758180813e-06,
"loss": 0.1116,
"step": 35200
},
{
"epoch": 9.79,
"learning_rate": 2.3818327478893203e-06,
"loss": 0.1048,
"step": 35300
},
{
"epoch": 9.82,
"learning_rate": 2.0737043199605598e-06,
"loss": 0.1057,
"step": 35400
},
{
"epoch": 9.84,
"learning_rate": 1.771738460590374e-06,
"loss": 0.1052,
"step": 35500
},
{
"epoch": 9.84,
"eval_loss": 0.14279937744140625,
"eval_runtime": 740.2589,
"eval_samples_per_second": 21.669,
"eval_steps_per_second": 2.71,
"eval_wer": 0.1247124706063266,
"step": 35500
},
{
"epoch": 9.87,
"learning_rate": 1.4636100326616134e-06,
"loss": 0.1012,
"step": 35600
},
{
"epoch": 9.9,
"learning_rate": 1.1554816047328529e-06,
"loss": 0.1051,
"step": 35700
},
{
"epoch": 9.93,
"learning_rate": 8.473531768040921e-07,
"loss": 0.1043,
"step": 35800
},
{
"epoch": 9.96,
"learning_rate": 5.392247488753312e-07,
"loss": 0.1038,
"step": 35900
},
{
"epoch": 9.98,
"learning_rate": 2.3109632094657053e-07,
"loss": 0.1044,
"step": 36000
},
{
"epoch": 9.98,
"eval_loss": 0.1430039405822754,
"eval_runtime": 779.4591,
"eval_samples_per_second": 20.58,
"eval_steps_per_second": 2.574,
"eval_wer": 0.12453306507935491,
"step": 36000
},
{
"epoch": 10.0,
"step": 36060,
"total_flos": 2.2265672303557702e+21,
"train_loss": 0.23386146696950752,
"train_runtime": 329994.9794,
"train_samples_per_second": 13.987,
"train_steps_per_second": 0.109
}
],
"max_steps": 36060,
"num_train_epochs": 10,
"total_flos": 2.2265672303557702e+21,
"trial_name": null,
"trial_params": null
}