boumehdi's picture
Upload 10 files
d5b4061
raw
history blame
No virus
79.8 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 35.986119743111665,
"global_step": 43400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.17,
"learning_rate": 9.95e-05,
"loss": 0.6982,
"step": 200
},
{
"epoch": 0.17,
"eval_loss": 0.25508013367652893,
"eval_runtime": 247.2382,
"eval_samples_per_second": 20.907,
"eval_steps_per_second": 2.617,
"eval_wer": 0.24512755506258913,
"step": 200
},
{
"epoch": 0.33,
"learning_rate": 9.972560975609757e-05,
"loss": 0.5209,
"step": 400
},
{
"epoch": 0.33,
"eval_loss": 0.21009531617164612,
"eval_runtime": 249.2779,
"eval_samples_per_second": 20.736,
"eval_steps_per_second": 2.595,
"eval_wer": 0.21507420905297628,
"step": 400
},
{
"epoch": 0.5,
"learning_rate": 9.944844789356985e-05,
"loss": 0.4885,
"step": 600
},
{
"epoch": 0.5,
"eval_loss": 0.20174096524715424,
"eval_runtime": 247.285,
"eval_samples_per_second": 20.903,
"eval_steps_per_second": 2.616,
"eval_wer": 0.20297892568531137,
"step": 600
},
{
"epoch": 0.66,
"learning_rate": 9.917128603104213e-05,
"loss": 0.474,
"step": 800
},
{
"epoch": 0.66,
"eval_loss": 0.18579010665416718,
"eval_runtime": 250.2088,
"eval_samples_per_second": 20.659,
"eval_steps_per_second": 2.586,
"eval_wer": 0.1948977974964348,
"step": 800
},
{
"epoch": 0.83,
"learning_rate": 9.889412416851441e-05,
"loss": 0.4683,
"step": 1000
},
{
"epoch": 0.83,
"eval_loss": 0.17479585111141205,
"eval_runtime": 251.8549,
"eval_samples_per_second": 20.524,
"eval_steps_per_second": 2.569,
"eval_wer": 0.17192204088100144,
"step": 1000
},
{
"epoch": 0.99,
"learning_rate": 9.86169623059867e-05,
"loss": 0.4497,
"step": 1200
},
{
"epoch": 0.99,
"eval_loss": 0.15883031487464905,
"eval_runtime": 251.9945,
"eval_samples_per_second": 20.512,
"eval_steps_per_second": 2.568,
"eval_wer": 0.17171076955580203,
"step": 1200
},
{
"epoch": 1.16,
"learning_rate": 9.833980044345899e-05,
"loss": 0.4037,
"step": 1400
},
{
"epoch": 1.16,
"eval_loss": 0.15540002286434174,
"eval_runtime": 253.8837,
"eval_samples_per_second": 20.36,
"eval_steps_per_second": 2.548,
"eval_wer": 0.15987957534463634,
"step": 1400
},
{
"epoch": 1.33,
"learning_rate": 9.806263858093127e-05,
"loss": 0.3999,
"step": 1600
},
{
"epoch": 1.33,
"eval_loss": 0.1569492369890213,
"eval_runtime": 253.8314,
"eval_samples_per_second": 20.364,
"eval_steps_per_second": 2.549,
"eval_wer": 0.1581365869117414,
"step": 1600
},
{
"epoch": 1.49,
"learning_rate": 9.778547671840356e-05,
"loss": 0.4014,
"step": 1800
},
{
"epoch": 1.49,
"eval_loss": 0.14257089793682098,
"eval_runtime": 253.5715,
"eval_samples_per_second": 20.385,
"eval_steps_per_second": 2.552,
"eval_wer": 0.1482068346273702,
"step": 1800
},
{
"epoch": 1.66,
"learning_rate": 9.750831485587584e-05,
"loss": 0.3887,
"step": 2000
},
{
"epoch": 1.66,
"eval_loss": 0.14761227369308472,
"eval_runtime": 262.7757,
"eval_samples_per_second": 19.671,
"eval_steps_per_second": 2.462,
"eval_wer": 0.14361168330428353,
"step": 2000
},
{
"epoch": 1.82,
"learning_rate": 9.723115299334812e-05,
"loss": 0.3861,
"step": 2200
},
{
"epoch": 1.82,
"eval_loss": 0.14095284044742584,
"eval_runtime": 253.9647,
"eval_samples_per_second": 20.353,
"eval_steps_per_second": 2.548,
"eval_wer": 0.14815401679607035,
"step": 2200
},
{
"epoch": 1.99,
"learning_rate": 9.695399113082039e-05,
"loss": 0.3881,
"step": 2400
},
{
"epoch": 1.99,
"eval_loss": 0.13986040651798248,
"eval_runtime": 253.8881,
"eval_samples_per_second": 20.359,
"eval_steps_per_second": 2.548,
"eval_wer": 0.14012570643849365,
"step": 2400
},
{
"epoch": 2.16,
"learning_rate": 9.667682926829269e-05,
"loss": 0.3397,
"step": 2600
},
{
"epoch": 2.16,
"eval_loss": 0.1451854407787323,
"eval_runtime": 255.702,
"eval_samples_per_second": 20.215,
"eval_steps_per_second": 2.53,
"eval_wer": 0.13178048909311785,
"step": 2600
},
{
"epoch": 2.32,
"learning_rate": 9.639966740576497e-05,
"loss": 0.3383,
"step": 2800
},
{
"epoch": 2.32,
"eval_loss": 0.13278624415397644,
"eval_runtime": 254.5924,
"eval_samples_per_second": 20.303,
"eval_steps_per_second": 2.541,
"eval_wer": 0.13019595415412244,
"step": 2800
},
{
"epoch": 2.49,
"learning_rate": 9.612250554323725e-05,
"loss": 0.3366,
"step": 3000
},
{
"epoch": 2.49,
"eval_loss": 0.1430414617061615,
"eval_runtime": 253.9896,
"eval_samples_per_second": 20.351,
"eval_steps_per_second": 2.547,
"eval_wer": 0.13251993873131568,
"step": 3000
},
{
"epoch": 2.65,
"learning_rate": 9.584534368070954e-05,
"loss": 0.3481,
"step": 3200
},
{
"epoch": 2.65,
"eval_loss": 0.1356772631406784,
"eval_runtime": 253.702,
"eval_samples_per_second": 20.374,
"eval_steps_per_second": 2.55,
"eval_wer": 0.12829451222732793,
"step": 3200
},
{
"epoch": 2.82,
"learning_rate": 9.556956762749447e-05,
"loss": 0.337,
"step": 3400
},
{
"epoch": 2.82,
"eval_loss": 0.1254938244819641,
"eval_runtime": 254.1064,
"eval_samples_per_second": 20.342,
"eval_steps_per_second": 2.546,
"eval_wer": 0.1273437912639307,
"step": 3400
},
{
"epoch": 2.98,
"learning_rate": 9.529240576496675e-05,
"loss": 0.3346,
"step": 3600
},
{
"epoch": 2.98,
"eval_loss": 0.13027481734752655,
"eval_runtime": 254.6218,
"eval_samples_per_second": 20.301,
"eval_steps_per_second": 2.541,
"eval_wer": 0.1280304230708287,
"step": 3600
},
{
"epoch": 3.15,
"learning_rate": 9.501524390243903e-05,
"loss": 0.3192,
"step": 3800
},
{
"epoch": 3.15,
"eval_loss": 0.13303972780704498,
"eval_runtime": 254.7219,
"eval_samples_per_second": 20.293,
"eval_steps_per_second": 2.54,
"eval_wer": 0.12280145777214388,
"step": 3800
},
{
"epoch": 3.32,
"learning_rate": 9.473808203991131e-05,
"loss": 0.3093,
"step": 4000
},
{
"epoch": 3.32,
"eval_loss": 0.13668616116046906,
"eval_runtime": 254.6369,
"eval_samples_per_second": 20.299,
"eval_steps_per_second": 2.541,
"eval_wer": 0.12206200813394602,
"step": 4000
},
{
"epoch": 3.48,
"learning_rate": 9.446092017738359e-05,
"loss": 0.3119,
"step": 4200
},
{
"epoch": 3.48,
"eval_loss": 0.1260731816291809,
"eval_runtime": 255.6853,
"eval_samples_per_second": 20.216,
"eval_steps_per_second": 2.53,
"eval_wer": 0.1149316009084667,
"step": 4200
},
{
"epoch": 3.65,
"learning_rate": 9.418375831485588e-05,
"loss": 0.3115,
"step": 4400
},
{
"epoch": 3.65,
"eval_loss": 0.11900634318590164,
"eval_runtime": 255.3718,
"eval_samples_per_second": 20.241,
"eval_steps_per_second": 2.534,
"eval_wer": 0.11514287223366608,
"step": 4400
},
{
"epoch": 3.81,
"learning_rate": 9.390659645232817e-05,
"loss": 0.3104,
"step": 4600
},
{
"epoch": 3.81,
"eval_loss": 0.11844547092914581,
"eval_runtime": 253.3424,
"eval_samples_per_second": 20.403,
"eval_steps_per_second": 2.554,
"eval_wer": 0.11994929488195215,
"step": 4600
},
{
"epoch": 3.98,
"learning_rate": 9.362943458980045e-05,
"loss": 0.3084,
"step": 4800
},
{
"epoch": 3.98,
"eval_loss": 0.12033428996801376,
"eval_runtime": 253.1313,
"eval_samples_per_second": 20.42,
"eval_steps_per_second": 2.556,
"eval_wer": 0.114139333438969,
"step": 4800
},
{
"epoch": 4.15,
"learning_rate": 9.335227272727273e-05,
"loss": 0.2879,
"step": 5000
},
{
"epoch": 4.15,
"eval_loss": 0.1269288957118988,
"eval_runtime": 252.0701,
"eval_samples_per_second": 20.506,
"eval_steps_per_second": 2.567,
"eval_wer": 0.11239634500607405,
"step": 5000
},
{
"epoch": 4.31,
"learning_rate": 9.307511086474502e-05,
"loss": 0.2865,
"step": 5200
},
{
"epoch": 4.31,
"eval_loss": 0.13235774636268616,
"eval_runtime": 253.6428,
"eval_samples_per_second": 20.379,
"eval_steps_per_second": 2.551,
"eval_wer": 0.11118153488617757,
"step": 5200
},
{
"epoch": 4.48,
"learning_rate": 9.27979490022173e-05,
"loss": 0.2845,
"step": 5400
},
{
"epoch": 4.48,
"eval_loss": 0.12866514921188354,
"eval_runtime": 257.2798,
"eval_samples_per_second": 20.091,
"eval_steps_per_second": 2.515,
"eval_wer": 0.11424496910156869,
"step": 5400
},
{
"epoch": 4.64,
"learning_rate": 9.252078713968959e-05,
"loss": 0.2856,
"step": 5600
},
{
"epoch": 4.64,
"eval_loss": 0.12589029967784882,
"eval_runtime": 254.2212,
"eval_samples_per_second": 20.333,
"eval_steps_per_second": 2.545,
"eval_wer": 0.11012517826018063,
"step": 5600
},
{
"epoch": 4.81,
"learning_rate": 9.224362527716187e-05,
"loss": 0.2801,
"step": 5800
},
{
"epoch": 4.81,
"eval_loss": 0.12850765883922577,
"eval_runtime": 252.9838,
"eval_samples_per_second": 20.432,
"eval_steps_per_second": 2.557,
"eval_wer": 0.11023081392278034,
"step": 5800
},
{
"epoch": 4.97,
"learning_rate": 9.196646341463415e-05,
"loss": 0.2882,
"step": 6000
},
{
"epoch": 4.97,
"eval_loss": 0.13433855772018433,
"eval_runtime": 253.6459,
"eval_samples_per_second": 20.379,
"eval_steps_per_second": 2.551,
"eval_wer": 0.10880473247768446,
"step": 6000
},
{
"epoch": 5.14,
"learning_rate": 9.168930155210643e-05,
"loss": 0.2701,
"step": 6200
},
{
"epoch": 5.14,
"eval_loss": 0.14238382875919342,
"eval_runtime": 253.374,
"eval_samples_per_second": 20.401,
"eval_steps_per_second": 2.554,
"eval_wer": 0.10531875561189458,
"step": 6200
},
{
"epoch": 5.31,
"learning_rate": 9.141213968957871e-05,
"loss": 0.2688,
"step": 6400
},
{
"epoch": 5.31,
"eval_loss": 0.1337863802909851,
"eval_runtime": 253.8454,
"eval_samples_per_second": 20.363,
"eval_steps_per_second": 2.549,
"eval_wer": 0.10288913537210162,
"step": 6400
},
{
"epoch": 5.47,
"learning_rate": 9.1134977827051e-05,
"loss": 0.2683,
"step": 6600
},
{
"epoch": 5.47,
"eval_loss": 0.14259789884090424,
"eval_runtime": 252.7728,
"eval_samples_per_second": 20.449,
"eval_steps_per_second": 2.56,
"eval_wer": 0.10732583320128876,
"step": 6600
},
{
"epoch": 5.64,
"learning_rate": 9.085781596452329e-05,
"loss": 0.2609,
"step": 6800
},
{
"epoch": 5.64,
"eval_loss": 0.13099780678749084,
"eval_runtime": 252.7442,
"eval_samples_per_second": 20.452,
"eval_steps_per_second": 2.56,
"eval_wer": 0.10257222838430254,
"step": 6800
},
{
"epoch": 5.8,
"learning_rate": 9.058065410199557e-05,
"loss": 0.267,
"step": 7000
},
{
"epoch": 5.8,
"eval_loss": 0.14180444180965424,
"eval_runtime": 254.0779,
"eval_samples_per_second": 20.344,
"eval_steps_per_second": 2.546,
"eval_wer": 0.10119896477050652,
"step": 7000
},
{
"epoch": 5.97,
"learning_rate": 9.030487804878049e-05,
"loss": 0.2638,
"step": 7200
},
{
"epoch": 5.97,
"eval_loss": 0.13856083154678345,
"eval_runtime": 253.6851,
"eval_samples_per_second": 20.376,
"eval_steps_per_second": 2.55,
"eval_wer": 0.1007236042888079,
"step": 7200
},
{
"epoch": 6.14,
"learning_rate": 9.002771618625277e-05,
"loss": 0.2604,
"step": 7400
},
{
"epoch": 6.14,
"eval_loss": 0.14975795149803162,
"eval_runtime": 255.6414,
"eval_samples_per_second": 20.22,
"eval_steps_per_second": 2.531,
"eval_wer": 0.10389267416679872,
"step": 7400
},
{
"epoch": 6.3,
"learning_rate": 8.975055432372505e-05,
"loss": 0.2484,
"step": 7600
},
{
"epoch": 6.3,
"eval_loss": 0.1300615817308426,
"eval_runtime": 256.8835,
"eval_samples_per_second": 20.122,
"eval_steps_per_second": 2.519,
"eval_wer": 0.10230813922780331,
"step": 7600
},
{
"epoch": 6.47,
"learning_rate": 8.947339246119735e-05,
"loss": 0.2515,
"step": 7800
},
{
"epoch": 6.47,
"eval_loss": 0.13480910658836365,
"eval_runtime": 254.0211,
"eval_samples_per_second": 20.349,
"eval_steps_per_second": 2.547,
"eval_wer": 0.10310040669730101,
"step": 7800
},
{
"epoch": 6.63,
"learning_rate": 8.919623059866963e-05,
"loss": 0.2529,
"step": 8000
},
{
"epoch": 6.63,
"eval_loss": 0.12069129198789597,
"eval_runtime": 254.8765,
"eval_samples_per_second": 20.28,
"eval_steps_per_second": 2.538,
"eval_wer": 0.10146305392700576,
"step": 8000
},
{
"epoch": 6.8,
"learning_rate": 8.891906873614191e-05,
"loss": 0.2498,
"step": 8200
},
{
"epoch": 6.8,
"eval_loss": 0.14146772027015686,
"eval_runtime": 254.7381,
"eval_samples_per_second": 20.291,
"eval_steps_per_second": 2.54,
"eval_wer": 0.1016215074209053,
"step": 8200
},
{
"epoch": 6.96,
"learning_rate": 8.86419068736142e-05,
"loss": 0.2502,
"step": 8400
},
{
"epoch": 6.96,
"eval_loss": 0.12623198330402374,
"eval_runtime": 254.5919,
"eval_samples_per_second": 20.303,
"eval_steps_per_second": 2.541,
"eval_wer": 0.09760735224211693,
"step": 8400
},
{
"epoch": 7.13,
"learning_rate": 8.836474501108648e-05,
"loss": 0.2404,
"step": 8600
},
{
"epoch": 7.13,
"eval_loss": 0.13511496782302856,
"eval_runtime": 254.4607,
"eval_samples_per_second": 20.314,
"eval_steps_per_second": 2.543,
"eval_wer": 0.09929752284371204,
"step": 8600
},
{
"epoch": 7.3,
"learning_rate": 8.808758314855876e-05,
"loss": 0.2337,
"step": 8800
},
{
"epoch": 7.3,
"eval_loss": 0.13152754306793213,
"eval_runtime": 254.1423,
"eval_samples_per_second": 20.339,
"eval_steps_per_second": 2.546,
"eval_wer": 0.09876934453071357,
"step": 8800
},
{
"epoch": 7.46,
"learning_rate": 8.781042128603105e-05,
"loss": 0.2396,
"step": 9000
},
{
"epoch": 7.46,
"eval_loss": 0.135118767619133,
"eval_runtime": 255.0124,
"eval_samples_per_second": 20.27,
"eval_steps_per_second": 2.537,
"eval_wer": 0.09834680188031479,
"step": 9000
},
{
"epoch": 7.63,
"learning_rate": 8.753325942350333e-05,
"loss": 0.2431,
"step": 9200
},
{
"epoch": 7.63,
"eval_loss": 0.13074836134910583,
"eval_runtime": 255.0093,
"eval_samples_per_second": 20.27,
"eval_steps_per_second": 2.537,
"eval_wer": 0.09707917392911847,
"step": 9200
},
{
"epoch": 7.79,
"learning_rate": 8.725609756097561e-05,
"loss": 0.2379,
"step": 9400
},
{
"epoch": 7.79,
"eval_loss": 0.13186238706111908,
"eval_runtime": 255.2219,
"eval_samples_per_second": 20.253,
"eval_steps_per_second": 2.535,
"eval_wer": 0.09950879416891142,
"step": 9400
},
{
"epoch": 7.96,
"learning_rate": 8.697893569844789e-05,
"loss": 0.2421,
"step": 9600
},
{
"epoch": 7.96,
"eval_loss": 0.1254909485578537,
"eval_runtime": 255.0666,
"eval_samples_per_second": 20.265,
"eval_steps_per_second": 2.537,
"eval_wer": 0.09882216236201341,
"step": 9600
},
{
"epoch": 8.13,
"learning_rate": 8.670177383592018e-05,
"loss": 0.2324,
"step": 9800
},
{
"epoch": 8.13,
"eval_loss": 0.13816988468170166,
"eval_runtime": 257.5755,
"eval_samples_per_second": 20.068,
"eval_steps_per_second": 2.512,
"eval_wer": 0.09628690645962076,
"step": 9800
},
{
"epoch": 8.29,
"learning_rate": 8.642461197339246e-05,
"loss": 0.2258,
"step": 10000
},
{
"epoch": 8.29,
"eval_loss": 0.15982431173324585,
"eval_runtime": 257.1975,
"eval_samples_per_second": 20.097,
"eval_steps_per_second": 2.516,
"eval_wer": 0.09750171657951724,
"step": 10000
},
{
"epoch": 8.46,
"learning_rate": 8.614745011086475e-05,
"loss": 0.2253,
"step": 10200
},
{
"epoch": 8.46,
"eval_loss": 0.15032005310058594,
"eval_runtime": 256.9993,
"eval_samples_per_second": 20.113,
"eval_steps_per_second": 2.518,
"eval_wer": 0.09422701103892674,
"step": 10200
},
{
"epoch": 8.62,
"learning_rate": 8.587028824833703e-05,
"loss": 0.2228,
"step": 10400
},
{
"epoch": 8.62,
"eval_loss": 0.12655803561210632,
"eval_runtime": 258.0019,
"eval_samples_per_second": 20.035,
"eval_steps_per_second": 2.508,
"eval_wer": 0.09581154597792214,
"step": 10400
},
{
"epoch": 8.79,
"learning_rate": 8.559312638580932e-05,
"loss": 0.2255,
"step": 10600
},
{
"epoch": 8.79,
"eval_loss": 0.14087137579917908,
"eval_runtime": 252.7692,
"eval_samples_per_second": 20.449,
"eval_steps_per_second": 2.56,
"eval_wer": 0.09623408862832092,
"step": 10600
},
{
"epoch": 8.95,
"learning_rate": 8.53159645232816e-05,
"loss": 0.2307,
"step": 10800
},
{
"epoch": 8.95,
"eval_loss": 0.13605473935604095,
"eval_runtime": 255.7465,
"eval_samples_per_second": 20.211,
"eval_steps_per_second": 2.53,
"eval_wer": 0.0974488987482174,
"step": 10800
},
{
"epoch": 9.12,
"learning_rate": 8.503880266075388e-05,
"loss": 0.2149,
"step": 11000
},
{
"epoch": 9.12,
"eval_loss": 0.13241790235042572,
"eval_runtime": 254.7831,
"eval_samples_per_second": 20.288,
"eval_steps_per_second": 2.539,
"eval_wer": 0.09338192573812919,
"step": 11000
},
{
"epoch": 9.29,
"learning_rate": 8.476164079822618e-05,
"loss": 0.2168,
"step": 11200
},
{
"epoch": 9.29,
"eval_loss": 0.1478220671415329,
"eval_runtime": 255.9893,
"eval_samples_per_second": 20.192,
"eval_steps_per_second": 2.527,
"eval_wer": 0.09792425922991602,
"step": 11200
},
{
"epoch": 9.45,
"learning_rate": 8.448447893569845e-05,
"loss": 0.2152,
"step": 11400
},
{
"epoch": 9.45,
"eval_loss": 0.13686269521713257,
"eval_runtime": 254.4314,
"eval_samples_per_second": 20.316,
"eval_steps_per_second": 2.543,
"eval_wer": 0.09306501875033012,
"step": 11400
},
{
"epoch": 9.62,
"learning_rate": 8.420731707317073e-05,
"loss": 0.2155,
"step": 11600
},
{
"epoch": 9.62,
"eval_loss": 0.13407327234745026,
"eval_runtime": 254.6769,
"eval_samples_per_second": 20.296,
"eval_steps_per_second": 2.54,
"eval_wer": 0.09449110019542598,
"step": 11600
},
{
"epoch": 9.78,
"learning_rate": 8.393154101995566e-05,
"loss": 0.2108,
"step": 11800
},
{
"epoch": 9.78,
"eval_loss": 0.13564249873161316,
"eval_runtime": 254.2947,
"eval_samples_per_second": 20.327,
"eval_steps_per_second": 2.544,
"eval_wer": 0.0948608250145249,
"step": 11800
},
{
"epoch": 9.95,
"learning_rate": 8.365437915742794e-05,
"loss": 0.2179,
"step": 12000
},
{
"epoch": 9.95,
"eval_loss": 0.15698903799057007,
"eval_runtime": 254.2869,
"eval_samples_per_second": 20.327,
"eval_steps_per_second": 2.544,
"eval_wer": 0.08994876670363915,
"step": 12000
},
{
"epoch": 10.12,
"learning_rate": 8.337721729490022e-05,
"loss": 0.1988,
"step": 12200
},
{
"epoch": 10.12,
"eval_loss": 0.14923857152462006,
"eval_runtime": 254.962,
"eval_samples_per_second": 20.274,
"eval_steps_per_second": 2.538,
"eval_wer": 0.09132203031743516,
"step": 12200
},
{
"epoch": 10.28,
"learning_rate": 8.310005543237252e-05,
"loss": 0.2051,
"step": 12400
},
{
"epoch": 10.28,
"eval_loss": 0.1382753700017929,
"eval_runtime": 254.97,
"eval_samples_per_second": 20.273,
"eval_steps_per_second": 2.538,
"eval_wer": 0.08973749537843977,
"step": 12400
},
{
"epoch": 10.45,
"learning_rate": 8.28228935698448e-05,
"loss": 0.2079,
"step": 12600
},
{
"epoch": 10.45,
"eval_loss": 0.14029560983181,
"eval_runtime": 255.2219,
"eval_samples_per_second": 20.253,
"eval_steps_per_second": 2.535,
"eval_wer": 0.09132203031743516,
"step": 12600
},
{
"epoch": 10.61,
"learning_rate": 8.254573170731708e-05,
"loss": 0.2056,
"step": 12800
},
{
"epoch": 10.61,
"eval_loss": 0.13067609071731567,
"eval_runtime": 255.0916,
"eval_samples_per_second": 20.263,
"eval_steps_per_second": 2.536,
"eval_wer": 0.08994876670363915,
"step": 12800
},
{
"epoch": 10.78,
"learning_rate": 8.226856984478936e-05,
"loss": 0.2053,
"step": 13000
},
{
"epoch": 10.78,
"eval_loss": 0.13401809334754944,
"eval_runtime": 255.8654,
"eval_samples_per_second": 20.202,
"eval_steps_per_second": 2.529,
"eval_wer": 0.09031849152273808,
"step": 13000
},
{
"epoch": 10.94,
"learning_rate": 8.199140798226164e-05,
"loss": 0.2015,
"step": 13200
},
{
"epoch": 10.94,
"eval_loss": 0.12882278859615326,
"eval_runtime": 263.8909,
"eval_samples_per_second": 19.588,
"eval_steps_per_second": 2.452,
"eval_wer": 0.0923783869434321,
"step": 13200
},
{
"epoch": 11.11,
"learning_rate": 8.171424611973392e-05,
"loss": 0.2,
"step": 13400
},
{
"epoch": 11.11,
"eval_loss": 0.12576742470264435,
"eval_runtime": 255.4818,
"eval_samples_per_second": 20.232,
"eval_steps_per_second": 2.532,
"eval_wer": 0.08683251465694819,
"step": 13400
},
{
"epoch": 11.28,
"learning_rate": 8.14370842572062e-05,
"loss": 0.2029,
"step": 13600
},
{
"epoch": 11.28,
"eval_loss": 0.13859006762504578,
"eval_runtime": 254.423,
"eval_samples_per_second": 20.317,
"eval_steps_per_second": 2.543,
"eval_wer": 0.09000158453493899,
"step": 13600
},
{
"epoch": 11.44,
"learning_rate": 8.11599223946785e-05,
"loss": 0.2044,
"step": 13800
},
{
"epoch": 11.44,
"eval_loss": 0.138057678937912,
"eval_runtime": 255.1183,
"eval_samples_per_second": 20.261,
"eval_steps_per_second": 2.536,
"eval_wer": 0.09185020863043364,
"step": 13800
},
{
"epoch": 11.61,
"learning_rate": 8.088414634146342e-05,
"loss": 0.1943,
"step": 14000
},
{
"epoch": 11.61,
"eval_loss": 0.1461963802576065,
"eval_runtime": 255.5721,
"eval_samples_per_second": 20.225,
"eval_steps_per_second": 2.532,
"eval_wer": 0.09206147995563302,
"step": 14000
},
{
"epoch": 11.77,
"learning_rate": 8.06069844789357e-05,
"loss": 0.2072,
"step": 14200
},
{
"epoch": 11.77,
"eval_loss": 0.14551697671413422,
"eval_runtime": 256.1094,
"eval_samples_per_second": 20.183,
"eval_steps_per_second": 2.526,
"eval_wer": 0.08846986742724344,
"step": 14200
},
{
"epoch": 11.94,
"learning_rate": 8.032982261640798e-05,
"loss": 0.1998,
"step": 14400
},
{
"epoch": 11.94,
"eval_loss": 0.13519984483718872,
"eval_runtime": 255.2141,
"eval_samples_per_second": 20.254,
"eval_steps_per_second": 2.535,
"eval_wer": 0.09190302646173348,
"step": 14400
},
{
"epoch": 12.11,
"learning_rate": 8.00540465631929e-05,
"loss": 0.1952,
"step": 14600
},
{
"epoch": 12.11,
"eval_loss": 0.1399640440940857,
"eval_runtime": 254.8364,
"eval_samples_per_second": 20.284,
"eval_steps_per_second": 2.539,
"eval_wer": 0.090688216341837,
"step": 14600
},
{
"epoch": 12.27,
"learning_rate": 7.977688470066519e-05,
"loss": 0.1932,
"step": 14800
},
{
"epoch": 12.27,
"eval_loss": 0.13122260570526123,
"eval_runtime": 255.4641,
"eval_samples_per_second": 20.234,
"eval_steps_per_second": 2.533,
"eval_wer": 0.09084666983573654,
"step": 14800
},
{
"epoch": 12.44,
"learning_rate": 7.949972283813748e-05,
"loss": 0.1885,
"step": 15000
},
{
"epoch": 12.44,
"eval_loss": 0.14805012941360474,
"eval_runtime": 255.9292,
"eval_samples_per_second": 20.197,
"eval_steps_per_second": 2.528,
"eval_wer": 0.08883959224634237,
"step": 15000
},
{
"epoch": 12.6,
"learning_rate": 7.922256097560976e-05,
"loss": 0.1904,
"step": 15200
},
{
"epoch": 12.6,
"eval_loss": 0.13773396611213684,
"eval_runtime": 254.593,
"eval_samples_per_second": 20.303,
"eval_steps_per_second": 2.541,
"eval_wer": 0.08825859610204405,
"step": 15200
},
{
"epoch": 12.77,
"learning_rate": 7.894539911308204e-05,
"loss": 0.1924,
"step": 15400
},
{
"epoch": 12.77,
"eval_loss": 0.14221470057964325,
"eval_runtime": 254.58,
"eval_samples_per_second": 20.304,
"eval_steps_per_second": 2.541,
"eval_wer": 0.09026567369143823,
"step": 15400
},
{
"epoch": 12.93,
"learning_rate": 7.866823725055434e-05,
"loss": 0.188,
"step": 15600
},
{
"epoch": 12.93,
"eval_loss": 0.14350585639476776,
"eval_runtime": 258.9085,
"eval_samples_per_second": 19.965,
"eval_steps_per_second": 2.499,
"eval_wer": 0.08540643321185232,
"step": 15600
},
{
"epoch": 13.1,
"learning_rate": 7.839107538802661e-05,
"loss": 0.1877,
"step": 15800
},
{
"epoch": 13.1,
"eval_loss": 0.1520785242319107,
"eval_runtime": 255.8963,
"eval_samples_per_second": 20.2,
"eval_steps_per_second": 2.528,
"eval_wer": 0.08899804574024191,
"step": 15800
},
{
"epoch": 13.27,
"learning_rate": 7.811391352549889e-05,
"loss": 0.1825,
"step": 16000
},
{
"epoch": 13.27,
"eval_loss": 0.13483111560344696,
"eval_runtime": 256.5689,
"eval_samples_per_second": 20.147,
"eval_steps_per_second": 2.522,
"eval_wer": 0.08905086357154175,
"step": 16000
},
{
"epoch": 13.43,
"learning_rate": 7.783675166297117e-05,
"loss": 0.185,
"step": 16200
},
{
"epoch": 13.43,
"eval_loss": 0.13759800791740417,
"eval_runtime": 258.0191,
"eval_samples_per_second": 20.033,
"eval_steps_per_second": 2.508,
"eval_wer": 0.08672687899434849,
"step": 16200
},
{
"epoch": 13.6,
"learning_rate": 7.755958980044346e-05,
"loss": 0.1805,
"step": 16400
},
{
"epoch": 13.6,
"eval_loss": 0.14212605357170105,
"eval_runtime": 258.5566,
"eval_samples_per_second": 19.992,
"eval_steps_per_second": 2.502,
"eval_wer": 0.0883114139333439,
"step": 16400
},
{
"epoch": 13.76,
"learning_rate": 7.728242793791574e-05,
"loss": 0.186,
"step": 16600
},
{
"epoch": 13.76,
"eval_loss": 0.1396447867155075,
"eval_runtime": 257.807,
"eval_samples_per_second": 20.05,
"eval_steps_per_second": 2.51,
"eval_wer": 0.08514234405535309,
"step": 16600
},
{
"epoch": 13.93,
"learning_rate": 7.700526607538803e-05,
"loss": 0.1869,
"step": 16800
},
{
"epoch": 13.93,
"eval_loss": 0.14811939001083374,
"eval_runtime": 257.7698,
"eval_samples_per_second": 20.053,
"eval_steps_per_second": 2.51,
"eval_wer": 0.08456134791105477,
"step": 16800
},
{
"epoch": 14.1,
"learning_rate": 7.672949002217296e-05,
"loss": 0.1808,
"step": 17000
},
{
"epoch": 14.1,
"eval_loss": 0.15346239507198334,
"eval_runtime": 259.8127,
"eval_samples_per_second": 19.895,
"eval_steps_per_second": 2.49,
"eval_wer": 0.08503670839275339,
"step": 17000
},
{
"epoch": 14.26,
"learning_rate": 7.645232815964524e-05,
"loss": 0.1775,
"step": 17200
},
{
"epoch": 14.26,
"eval_loss": 0.14250528812408447,
"eval_runtime": 257.4388,
"eval_samples_per_second": 20.079,
"eval_steps_per_second": 2.513,
"eval_wer": 0.0876247821264459,
"step": 17200
},
{
"epoch": 14.43,
"learning_rate": 7.617516629711752e-05,
"loss": 0.1773,
"step": 17400
},
{
"epoch": 14.43,
"eval_loss": 0.14766837656497955,
"eval_runtime": 258.0221,
"eval_samples_per_second": 20.033,
"eval_steps_per_second": 2.508,
"eval_wer": 0.08471980140495432,
"step": 17400
},
{
"epoch": 14.59,
"learning_rate": 7.58980044345898e-05,
"loss": 0.1851,
"step": 17600
},
{
"epoch": 14.59,
"eval_loss": 0.15123723447322845,
"eval_runtime": 262.1208,
"eval_samples_per_second": 19.72,
"eval_steps_per_second": 2.468,
"eval_wer": 0.08667406116304864,
"step": 17600
},
{
"epoch": 14.76,
"learning_rate": 7.562084257206209e-05,
"loss": 0.1775,
"step": 17800
},
{
"epoch": 14.76,
"eval_loss": 0.14902031421661377,
"eval_runtime": 257.8432,
"eval_samples_per_second": 20.047,
"eval_steps_per_second": 2.509,
"eval_wer": 0.08329371995985844,
"step": 17800
},
{
"epoch": 14.92,
"learning_rate": 7.534368070953437e-05,
"loss": 0.1802,
"step": 18000
},
{
"epoch": 14.92,
"eval_loss": 0.15108011662960052,
"eval_runtime": 257.3237,
"eval_samples_per_second": 20.088,
"eval_steps_per_second": 2.514,
"eval_wer": 0.08709660381344742,
"step": 18000
},
{
"epoch": 15.09,
"learning_rate": 7.50679046563193e-05,
"loss": 0.1829,
"step": 18200
},
{
"epoch": 15.09,
"eval_loss": 0.14215655624866486,
"eval_runtime": 258.1845,
"eval_samples_per_second": 20.021,
"eval_steps_per_second": 2.506,
"eval_wer": 0.0859346115248508,
"step": 18200
},
{
"epoch": 15.26,
"learning_rate": 7.479074279379158e-05,
"loss": 0.1704,
"step": 18400
},
{
"epoch": 15.26,
"eval_loss": 0.1536380648612976,
"eval_runtime": 258.2175,
"eval_samples_per_second": 20.018,
"eval_steps_per_second": 2.506,
"eval_wer": 0.08535361538055247,
"step": 18400
},
{
"epoch": 15.42,
"learning_rate": 7.451358093126386e-05,
"loss": 0.1707,
"step": 18600
},
{
"epoch": 15.42,
"eval_loss": 0.15412335097789764,
"eval_runtime": 259.6526,
"eval_samples_per_second": 19.907,
"eval_steps_per_second": 2.492,
"eval_wer": 0.08366344477895737,
"step": 18600
},
{
"epoch": 15.59,
"learning_rate": 7.423641906873615e-05,
"loss": 0.1716,
"step": 18800
},
{
"epoch": 15.59,
"eval_loss": 0.15734080970287323,
"eval_runtime": 256.5213,
"eval_samples_per_second": 20.15,
"eval_steps_per_second": 2.522,
"eval_wer": 0.08419162309195584,
"step": 18800
},
{
"epoch": 15.75,
"learning_rate": 7.395925720620843e-05,
"loss": 0.1755,
"step": 19000
},
{
"epoch": 15.75,
"eval_loss": 0.1497374176979065,
"eval_runtime": 255.8623,
"eval_samples_per_second": 20.202,
"eval_steps_per_second": 2.529,
"eval_wer": 0.08408598742935615,
"step": 19000
},
{
"epoch": 15.92,
"learning_rate": 7.368209534368071e-05,
"loss": 0.1695,
"step": 19200
},
{
"epoch": 15.92,
"eval_loss": 0.14581099152565002,
"eval_runtime": 256.4224,
"eval_samples_per_second": 20.158,
"eval_steps_per_second": 2.523,
"eval_wer": 0.08371626261025722,
"step": 19200
},
{
"epoch": 16.09,
"learning_rate": 7.340493348115299e-05,
"loss": 0.1761,
"step": 19400
},
{
"epoch": 16.09,
"eval_loss": 0.14683474600315094,
"eval_runtime": 271.7581,
"eval_samples_per_second": 19.021,
"eval_steps_per_second": 2.381,
"eval_wer": 0.08545925104315216,
"step": 19400
},
{
"epoch": 16.25,
"learning_rate": 7.312777161862528e-05,
"loss": 0.1667,
"step": 19600
},
{
"epoch": 16.25,
"eval_loss": 0.1606747955083847,
"eval_runtime": 271.8508,
"eval_samples_per_second": 19.014,
"eval_steps_per_second": 2.38,
"eval_wer": 0.08751914646384619,
"step": 19600
},
{
"epoch": 16.42,
"learning_rate": 7.285060975609756e-05,
"loss": 0.1667,
"step": 19800
},
{
"epoch": 16.42,
"eval_loss": 0.14115694165229797,
"eval_runtime": 271.6689,
"eval_samples_per_second": 19.027,
"eval_steps_per_second": 2.382,
"eval_wer": 0.08524797971795278,
"step": 19800
},
{
"epoch": 16.58,
"learning_rate": 7.257344789356985e-05,
"loss": 0.1653,
"step": 20000
},
{
"epoch": 16.58,
"eval_loss": 0.13544563949108124,
"eval_runtime": 271.5302,
"eval_samples_per_second": 19.037,
"eval_steps_per_second": 2.383,
"eval_wer": 0.08477261923625416,
"step": 20000
},
{
"epoch": 16.75,
"learning_rate": 7.229628603104214e-05,
"loss": 0.1695,
"step": 20200
},
{
"epoch": 16.75,
"eval_loss": 0.1354389786720276,
"eval_runtime": 271.5697,
"eval_samples_per_second": 19.034,
"eval_steps_per_second": 2.382,
"eval_wer": 0.08350499128505784,
"step": 20200
},
{
"epoch": 16.91,
"learning_rate": 7.201912416851442e-05,
"loss": 0.171,
"step": 20400
},
{
"epoch": 16.91,
"eval_loss": 0.14289897680282593,
"eval_runtime": 258.0663,
"eval_samples_per_second": 20.03,
"eval_steps_per_second": 2.507,
"eval_wer": 0.08435007658585539,
"step": 20400
},
{
"epoch": 17.08,
"learning_rate": 7.17419623059867e-05,
"loss": 0.167,
"step": 20600
},
{
"epoch": 17.08,
"eval_loss": 0.13994231820106506,
"eval_runtime": 256.5044,
"eval_samples_per_second": 20.152,
"eval_steps_per_second": 2.522,
"eval_wer": 0.08207890983996197,
"step": 20600
},
{
"epoch": 17.25,
"learning_rate": 7.146480044345898e-05,
"loss": 0.1595,
"step": 20800
},
{
"epoch": 17.25,
"eval_loss": 0.16428013145923615,
"eval_runtime": 256.5622,
"eval_samples_per_second": 20.147,
"eval_steps_per_second": 2.522,
"eval_wer": 0.08192045634606243,
"step": 20800
},
{
"epoch": 17.41,
"learning_rate": 7.118763858093127e-05,
"loss": 0.1565,
"step": 21000
},
{
"epoch": 17.41,
"eval_loss": 0.1530633270740509,
"eval_runtime": 258.23,
"eval_samples_per_second": 20.017,
"eval_steps_per_second": 2.506,
"eval_wer": 0.08456134791105477,
"step": 21000
},
{
"epoch": 17.58,
"learning_rate": 7.091047671840355e-05,
"loss": 0.1589,
"step": 21200
},
{
"epoch": 17.58,
"eval_loss": 0.1481485366821289,
"eval_runtime": 257.1667,
"eval_samples_per_second": 20.1,
"eval_steps_per_second": 2.516,
"eval_wer": 0.08102255321396504,
"step": 21200
},
{
"epoch": 17.74,
"learning_rate": 7.063331485587583e-05,
"loss": 0.1602,
"step": 21400
},
{
"epoch": 17.74,
"eval_loss": 0.16114427149295807,
"eval_runtime": 257.6644,
"eval_samples_per_second": 20.061,
"eval_steps_per_second": 2.511,
"eval_wer": 0.07838166164897269,
"step": 21400
},
{
"epoch": 17.91,
"learning_rate": 7.035615299334812e-05,
"loss": 0.1622,
"step": 21600
},
{
"epoch": 17.91,
"eval_loss": 0.14328357577323914,
"eval_runtime": 258.6193,
"eval_samples_per_second": 19.987,
"eval_steps_per_second": 2.502,
"eval_wer": 0.0832409021285586,
"step": 21600
},
{
"epoch": 18.08,
"learning_rate": 7.00789911308204e-05,
"loss": 0.1629,
"step": 21800
},
{
"epoch": 18.08,
"eval_loss": 0.14952301979064941,
"eval_runtime": 253.7518,
"eval_samples_per_second": 20.37,
"eval_steps_per_second": 2.55,
"eval_wer": 0.08202609200866212,
"step": 21800
},
{
"epoch": 18.24,
"learning_rate": 6.980182926829268e-05,
"loss": 0.1542,
"step": 22000
},
{
"epoch": 18.24,
"eval_loss": 0.1603306531906128,
"eval_runtime": 252.9767,
"eval_samples_per_second": 20.433,
"eval_steps_per_second": 2.558,
"eval_wer": 0.07864575080547193,
"step": 22000
},
{
"epoch": 18.41,
"learning_rate": 6.952466740576497e-05,
"loss": 0.1577,
"step": 22200
},
{
"epoch": 18.41,
"eval_loss": 0.15311960875988007,
"eval_runtime": 253.1091,
"eval_samples_per_second": 20.422,
"eval_steps_per_second": 2.556,
"eval_wer": 0.08123382453916442,
"step": 22200
},
{
"epoch": 18.57,
"learning_rate": 6.924750554323726e-05,
"loss": 0.1592,
"step": 22400
},
{
"epoch": 18.57,
"eval_loss": 0.15086284279823303,
"eval_runtime": 257.495,
"eval_samples_per_second": 20.074,
"eval_steps_per_second": 2.513,
"eval_wer": 0.08170918502086304,
"step": 22400
},
{
"epoch": 18.74,
"learning_rate": 6.897172949002217e-05,
"loss": 0.1608,
"step": 22600
},
{
"epoch": 18.74,
"eval_loss": 0.14557667076587677,
"eval_runtime": 255.6435,
"eval_samples_per_second": 20.22,
"eval_steps_per_second": 2.531,
"eval_wer": 0.0799661965879681,
"step": 22600
},
{
"epoch": 18.9,
"learning_rate": 6.869456762749445e-05,
"loss": 0.1573,
"step": 22800
},
{
"epoch": 18.9,
"eval_loss": 0.15521085262298584,
"eval_runtime": 254.7778,
"eval_samples_per_second": 20.288,
"eval_steps_per_second": 2.539,
"eval_wer": 0.08081128188876564,
"step": 22800
},
{
"epoch": 19.07,
"learning_rate": 6.841740576496674e-05,
"loss": 0.1559,
"step": 23000
},
{
"epoch": 19.07,
"eval_loss": 0.1598125696182251,
"eval_runtime": 255.4991,
"eval_samples_per_second": 20.231,
"eval_steps_per_second": 2.532,
"eval_wer": 0.08123382453916442,
"step": 23000
},
{
"epoch": 19.24,
"learning_rate": 6.814024390243903e-05,
"loss": 0.1518,
"step": 23200
},
{
"epoch": 19.24,
"eval_loss": 0.15756739675998688,
"eval_runtime": 255.2152,
"eval_samples_per_second": 20.253,
"eval_steps_per_second": 2.535,
"eval_wer": 0.08229018116516136,
"step": 23200
},
{
"epoch": 19.4,
"learning_rate": 6.78630820399113e-05,
"loss": 0.1583,
"step": 23400
},
{
"epoch": 19.4,
"eval_loss": 0.1478932946920395,
"eval_runtime": 254.8478,
"eval_samples_per_second": 20.283,
"eval_steps_per_second": 2.539,
"eval_wer": 0.0790682934558707,
"step": 23400
},
{
"epoch": 19.57,
"learning_rate": 6.75859201773836e-05,
"loss": 0.1521,
"step": 23600
},
{
"epoch": 19.57,
"eval_loss": 0.15390987694263458,
"eval_runtime": 255.3412,
"eval_samples_per_second": 20.244,
"eval_steps_per_second": 2.534,
"eval_wer": 0.08144509586436381,
"step": 23600
},
{
"epoch": 19.73,
"learning_rate": 6.730875831485588e-05,
"loss": 0.1504,
"step": 23800
},
{
"epoch": 19.73,
"eval_loss": 0.15799568593502045,
"eval_runtime": 255.2877,
"eval_samples_per_second": 20.248,
"eval_steps_per_second": 2.534,
"eval_wer": 0.07980774309406856,
"step": 23800
},
{
"epoch": 19.9,
"learning_rate": 6.703159645232816e-05,
"loss": 0.1591,
"step": 24000
},
{
"epoch": 19.9,
"eval_loss": 0.14647792279720306,
"eval_runtime": 255.0201,
"eval_samples_per_second": 20.269,
"eval_steps_per_second": 2.537,
"eval_wer": 0.07700839803517667,
"step": 24000
},
{
"epoch": 20.07,
"learning_rate": 6.675443458980046e-05,
"loss": 0.1535,
"step": 24200
},
{
"epoch": 20.07,
"eval_loss": 0.1589883714914322,
"eval_runtime": 255.7034,
"eval_samples_per_second": 20.215,
"eval_steps_per_second": 2.53,
"eval_wer": 0.07669149104737759,
"step": 24200
},
{
"epoch": 20.23,
"learning_rate": 6.647727272727274e-05,
"loss": 0.146,
"step": 24400
},
{
"epoch": 20.23,
"eval_loss": 0.14599309861660004,
"eval_runtime": 254.7694,
"eval_samples_per_second": 20.289,
"eval_steps_per_second": 2.54,
"eval_wer": 0.07875138646807162,
"step": 24400
},
{
"epoch": 20.4,
"learning_rate": 6.6200110864745e-05,
"loss": 0.1492,
"step": 24600
},
{
"epoch": 20.4,
"eval_loss": 0.14993605017662048,
"eval_runtime": 254.9593,
"eval_samples_per_second": 20.274,
"eval_steps_per_second": 2.538,
"eval_wer": 0.07706121586647652,
"step": 24600
},
{
"epoch": 20.56,
"learning_rate": 6.592294900221729e-05,
"loss": 0.1508,
"step": 24800
},
{
"epoch": 20.56,
"eval_loss": 0.1447875052690506,
"eval_runtime": 255.7358,
"eval_samples_per_second": 20.212,
"eval_steps_per_second": 2.53,
"eval_wer": 0.07975492526276871,
"step": 24800
},
{
"epoch": 20.73,
"learning_rate": 6.564578713968958e-05,
"loss": 0.1525,
"step": 25000
},
{
"epoch": 20.73,
"eval_loss": 0.14607439935207367,
"eval_runtime": 255.9294,
"eval_samples_per_second": 20.197,
"eval_steps_per_second": 2.528,
"eval_wer": 0.07838166164897269,
"step": 25000
},
{
"epoch": 20.89,
"learning_rate": 6.53700110864745e-05,
"loss": 0.1503,
"step": 25200
},
{
"epoch": 20.89,
"eval_loss": 0.1411682814359665,
"eval_runtime": 255.8366,
"eval_samples_per_second": 20.204,
"eval_steps_per_second": 2.529,
"eval_wer": 0.07970210743146887,
"step": 25200
},
{
"epoch": 21.06,
"learning_rate": 6.509284922394679e-05,
"loss": 0.1497,
"step": 25400
},
{
"epoch": 21.06,
"eval_loss": 0.14832888543605804,
"eval_runtime": 255.5517,
"eval_samples_per_second": 20.227,
"eval_steps_per_second": 2.532,
"eval_wer": 0.07943801827496963,
"step": 25400
},
{
"epoch": 21.23,
"learning_rate": 6.481568736141908e-05,
"loss": 0.1444,
"step": 25600
},
{
"epoch": 21.23,
"eval_loss": 0.16129909455776215,
"eval_runtime": 255.967,
"eval_samples_per_second": 20.194,
"eval_steps_per_second": 2.528,
"eval_wer": 0.07864575080547193,
"step": 25600
},
{
"epoch": 21.39,
"learning_rate": 6.453852549889136e-05,
"loss": 0.1438,
"step": 25800
},
{
"epoch": 21.39,
"eval_loss": 0.1477702409029007,
"eval_runtime": 255.4815,
"eval_samples_per_second": 20.232,
"eval_steps_per_second": 2.532,
"eval_wer": 0.07890983996197116,
"step": 25800
},
{
"epoch": 21.56,
"learning_rate": 6.426136363636364e-05,
"loss": 0.1439,
"step": 26000
},
{
"epoch": 21.56,
"eval_loss": 0.15728013217449188,
"eval_runtime": 255.4616,
"eval_samples_per_second": 20.234,
"eval_steps_per_second": 2.533,
"eval_wer": 0.07774784767337453,
"step": 26000
},
{
"epoch": 21.72,
"learning_rate": 6.398420177383592e-05,
"loss": 0.1455,
"step": 26200
},
{
"epoch": 21.72,
"eval_loss": 0.14868445694446564,
"eval_runtime": 255.9049,
"eval_samples_per_second": 20.199,
"eval_steps_per_second": 2.528,
"eval_wer": 0.0790682934558707,
"step": 26200
},
{
"epoch": 21.89,
"learning_rate": 6.37070399113082e-05,
"loss": 0.1395,
"step": 26400
},
{
"epoch": 21.89,
"eval_loss": 0.16429665684700012,
"eval_runtime": 262.3659,
"eval_samples_per_second": 19.701,
"eval_steps_per_second": 2.466,
"eval_wer": 0.07600485924047959,
"step": 26400
},
{
"epoch": 22.06,
"learning_rate": 6.342987804878049e-05,
"loss": 0.1428,
"step": 26600
},
{
"epoch": 22.06,
"eval_loss": 0.1581258475780487,
"eval_runtime": 255.8292,
"eval_samples_per_second": 20.205,
"eval_steps_per_second": 2.529,
"eval_wer": 0.0781703903237733,
"step": 26600
},
{
"epoch": 22.22,
"learning_rate": 6.315271618625277e-05,
"loss": 0.1342,
"step": 26800
},
{
"epoch": 22.22,
"eval_loss": 0.16277597844600677,
"eval_runtime": 259.5604,
"eval_samples_per_second": 19.914,
"eval_steps_per_second": 2.493,
"eval_wer": 0.0773781228542756,
"step": 26800
},
{
"epoch": 22.39,
"learning_rate": 6.28769401330377e-05,
"loss": 0.1401,
"step": 27000
},
{
"epoch": 22.39,
"eval_loss": 0.1531515270471573,
"eval_runtime": 260.5139,
"eval_samples_per_second": 19.842,
"eval_steps_per_second": 2.484,
"eval_wer": 0.07859293297417208,
"step": 27000
},
{
"epoch": 22.55,
"learning_rate": 6.259977827050998e-05,
"loss": 0.1401,
"step": 27200
},
{
"epoch": 22.55,
"eval_loss": 0.15395356714725494,
"eval_runtime": 257.8197,
"eval_samples_per_second": 20.049,
"eval_steps_per_second": 2.51,
"eval_wer": 0.07727248719167591,
"step": 27200
},
{
"epoch": 22.72,
"learning_rate": 6.232261640798226e-05,
"loss": 0.1397,
"step": 27400
},
{
"epoch": 22.72,
"eval_loss": 0.1657487452030182,
"eval_runtime": 258.5849,
"eval_samples_per_second": 19.99,
"eval_steps_per_second": 2.502,
"eval_wer": 0.07774784767337453,
"step": 27400
},
{
"epoch": 22.89,
"learning_rate": 6.204545454545455e-05,
"loss": 0.1396,
"step": 27600
},
{
"epoch": 22.89,
"eval_loss": 0.1595001220703125,
"eval_runtime": 258.8028,
"eval_samples_per_second": 19.973,
"eval_steps_per_second": 2.5,
"eval_wer": 0.07695558020387683,
"step": 27600
},
{
"epoch": 23.05,
"learning_rate": 6.176829268292683e-05,
"loss": 0.1425,
"step": 27800
},
{
"epoch": 23.05,
"eval_loss": 0.14454737305641174,
"eval_runtime": 257.5774,
"eval_samples_per_second": 20.068,
"eval_steps_per_second": 2.512,
"eval_wer": 0.07695558020387683,
"step": 27800
},
{
"epoch": 23.22,
"learning_rate": 6.149113082039911e-05,
"loss": 0.1343,
"step": 28000
},
{
"epoch": 23.22,
"eval_loss": 0.15258438885211945,
"eval_runtime": 257.4198,
"eval_samples_per_second": 20.08,
"eval_steps_per_second": 2.513,
"eval_wer": 0.07700839803517667,
"step": 28000
},
{
"epoch": 23.38,
"learning_rate": 6.12139689578714e-05,
"loss": 0.1388,
"step": 28200
},
{
"epoch": 23.38,
"eval_loss": 0.15189868211746216,
"eval_runtime": 261.1531,
"eval_samples_per_second": 19.793,
"eval_steps_per_second": 2.477,
"eval_wer": 0.07447314213278403,
"step": 28200
},
{
"epoch": 23.55,
"learning_rate": 6.0936807095343684e-05,
"loss": 0.1364,
"step": 28400
},
{
"epoch": 23.55,
"eval_loss": 0.15030239522457123,
"eval_runtime": 259.6413,
"eval_samples_per_second": 19.908,
"eval_steps_per_second": 2.492,
"eval_wer": 0.07415623514498494,
"step": 28400
},
{
"epoch": 23.71,
"learning_rate": 6.0659645232815965e-05,
"loss": 0.1444,
"step": 28600
},
{
"epoch": 23.71,
"eval_loss": 0.16646933555603027,
"eval_runtime": 260.1679,
"eval_samples_per_second": 19.868,
"eval_steps_per_second": 2.487,
"eval_wer": 0.07875138646807162,
"step": 28600
},
{
"epoch": 23.88,
"learning_rate": 6.038248337028826e-05,
"loss": 0.1361,
"step": 28800
},
{
"epoch": 23.88,
"eval_loss": 0.15915772318840027,
"eval_runtime": 259.5414,
"eval_samples_per_second": 19.916,
"eval_steps_per_second": 2.493,
"eval_wer": 0.0757935879152802,
"step": 28800
},
{
"epoch": 24.05,
"learning_rate": 6.0105321507760534e-05,
"loss": 0.1398,
"step": 29000
},
{
"epoch": 24.05,
"eval_loss": 0.1606004387140274,
"eval_runtime": 259.8476,
"eval_samples_per_second": 19.892,
"eval_steps_per_second": 2.49,
"eval_wer": 0.07632176622827867,
"step": 29000
},
{
"epoch": 24.21,
"learning_rate": 5.9828159645232815e-05,
"loss": 0.1322,
"step": 29200
},
{
"epoch": 24.21,
"eval_loss": 0.1486821323633194,
"eval_runtime": 259.5122,
"eval_samples_per_second": 19.918,
"eval_steps_per_second": 2.493,
"eval_wer": 0.07848729731157239,
"step": 29200
},
{
"epoch": 24.38,
"learning_rate": 5.9550997782705096e-05,
"loss": 0.1309,
"step": 29400
},
{
"epoch": 24.38,
"eval_loss": 0.16220000386238098,
"eval_runtime": 259.2803,
"eval_samples_per_second": 19.936,
"eval_steps_per_second": 2.495,
"eval_wer": 0.07626894839697881,
"step": 29400
},
{
"epoch": 24.54,
"learning_rate": 5.927383592017739e-05,
"loss": 0.1351,
"step": 29600
},
{
"epoch": 24.54,
"eval_loss": 0.17341530323028564,
"eval_runtime": 262.8143,
"eval_samples_per_second": 19.668,
"eval_steps_per_second": 2.462,
"eval_wer": 0.07795911899857391,
"step": 29600
},
{
"epoch": 24.71,
"learning_rate": 5.899667405764967e-05,
"loss": 0.1298,
"step": 29800
},
{
"epoch": 24.71,
"eval_loss": 0.1510027050971985,
"eval_runtime": 263.1767,
"eval_samples_per_second": 19.641,
"eval_steps_per_second": 2.458,
"eval_wer": 0.07563513442138066,
"step": 29800
},
{
"epoch": 24.88,
"learning_rate": 5.871951219512195e-05,
"loss": 0.1369,
"step": 30000
},
{
"epoch": 24.88,
"eval_loss": 0.13624520599842072,
"eval_runtime": 263.8718,
"eval_samples_per_second": 19.589,
"eval_steps_per_second": 2.452,
"eval_wer": 0.07626894839697881,
"step": 30000
},
{
"epoch": 25.04,
"learning_rate": 5.844235033259424e-05,
"loss": 0.1341,
"step": 30200
},
{
"epoch": 25.04,
"eval_loss": 0.15082810819149017,
"eval_runtime": 261.0919,
"eval_samples_per_second": 19.798,
"eval_steps_per_second": 2.478,
"eval_wer": 0.07854011514287224,
"step": 30200
},
{
"epoch": 25.21,
"learning_rate": 5.816518847006652e-05,
"loss": 0.1249,
"step": 30400
},
{
"epoch": 25.21,
"eval_loss": 0.16026806831359863,
"eval_runtime": 260.2227,
"eval_samples_per_second": 19.864,
"eval_steps_per_second": 2.486,
"eval_wer": 0.07558231659008081,
"step": 30400
},
{
"epoch": 25.37,
"learning_rate": 5.78880266075388e-05,
"loss": 0.129,
"step": 30600
},
{
"epoch": 25.37,
"eval_loss": 0.16147717833518982,
"eval_runtime": 258.8644,
"eval_samples_per_second": 19.968,
"eval_steps_per_second": 2.499,
"eval_wer": 0.07457877779538372,
"step": 30600
},
{
"epoch": 25.54,
"learning_rate": 5.7610864745011084e-05,
"loss": 0.1336,
"step": 30800
},
{
"epoch": 25.54,
"eval_loss": 0.15992993116378784,
"eval_runtime": 258.9913,
"eval_samples_per_second": 19.958,
"eval_steps_per_second": 2.498,
"eval_wer": 0.07505413827708235,
"step": 30800
},
{
"epoch": 25.7,
"learning_rate": 5.733370288248338e-05,
"loss": 0.127,
"step": 31000
},
{
"epoch": 25.7,
"eval_loss": 0.17056865990161896,
"eval_runtime": 259.4613,
"eval_samples_per_second": 19.922,
"eval_steps_per_second": 2.494,
"eval_wer": 0.07484286695188296,
"step": 31000
},
{
"epoch": 25.87,
"learning_rate": 5.705654101995565e-05,
"loss": 0.126,
"step": 31200
},
{
"epoch": 25.87,
"eval_loss": 0.1541663110256195,
"eval_runtime": 258.8605,
"eval_samples_per_second": 19.968,
"eval_steps_per_second": 2.499,
"eval_wer": 0.07442032430148418,
"step": 31200
},
{
"epoch": 26.04,
"learning_rate": 5.6780764966740575e-05,
"loss": 0.124,
"step": 31400
},
{
"epoch": 26.04,
"eval_loss": 0.16358500719070435,
"eval_runtime": 258.6242,
"eval_samples_per_second": 19.987,
"eval_steps_per_second": 2.502,
"eval_wer": 0.07531822743358157,
"step": 31400
},
{
"epoch": 26.2,
"learning_rate": 5.650360310421286e-05,
"loss": 0.1268,
"step": 31600
},
{
"epoch": 26.2,
"eval_loss": 0.16622310876846313,
"eval_runtime": 258.7306,
"eval_samples_per_second": 19.978,
"eval_steps_per_second": 2.501,
"eval_wer": 0.07220197538689062,
"step": 31600
},
{
"epoch": 26.37,
"learning_rate": 5.6227827050997785e-05,
"loss": 0.1286,
"step": 31800
},
{
"epoch": 26.37,
"eval_loss": 0.16970515251159668,
"eval_runtime": 258.9239,
"eval_samples_per_second": 19.963,
"eval_steps_per_second": 2.499,
"eval_wer": 0.07257170020598955,
"step": 31800
},
{
"epoch": 26.53,
"learning_rate": 5.5950665188470066e-05,
"loss": 0.1299,
"step": 32000
},
{
"epoch": 26.53,
"eval_loss": 0.17085173726081848,
"eval_runtime": 259.6854,
"eval_samples_per_second": 19.905,
"eval_steps_per_second": 2.491,
"eval_wer": 0.07167379707389214,
"step": 32000
},
{
"epoch": 26.7,
"learning_rate": 5.5673503325942354e-05,
"loss": 0.1303,
"step": 32200
},
{
"epoch": 26.7,
"eval_loss": 0.16575023531913757,
"eval_runtime": 259.4515,
"eval_samples_per_second": 19.923,
"eval_steps_per_second": 2.494,
"eval_wer": 0.07352242116938679,
"step": 32200
},
{
"epoch": 26.87,
"learning_rate": 5.5396341463414635e-05,
"loss": 0.1246,
"step": 32400
},
{
"epoch": 26.87,
"eval_loss": 0.16010864078998566,
"eval_runtime": 259.7317,
"eval_samples_per_second": 19.901,
"eval_steps_per_second": 2.491,
"eval_wer": 0.07204352189299107,
"step": 32400
},
{
"epoch": 27.03,
"learning_rate": 5.5119179600886916e-05,
"loss": 0.1234,
"step": 32600
},
{
"epoch": 27.03,
"eval_loss": 0.1471298187971115,
"eval_runtime": 259.2276,
"eval_samples_per_second": 19.94,
"eval_steps_per_second": 2.496,
"eval_wer": 0.07214915755559077,
"step": 32600
},
{
"epoch": 27.2,
"learning_rate": 5.484201773835921e-05,
"loss": 0.1179,
"step": 32800
},
{
"epoch": 27.2,
"eval_loss": 0.16308201849460602,
"eval_runtime": 259.2656,
"eval_samples_per_second": 19.937,
"eval_steps_per_second": 2.496,
"eval_wer": 0.07114561876089368,
"step": 32800
},
{
"epoch": 27.36,
"learning_rate": 5.456485587583149e-05,
"loss": 0.1218,
"step": 33000
},
{
"epoch": 27.36,
"eval_loss": 0.1502005010843277,
"eval_runtime": 259.8271,
"eval_samples_per_second": 19.894,
"eval_steps_per_second": 2.49,
"eval_wer": 0.07199070406169122,
"step": 33000
},
{
"epoch": 27.53,
"learning_rate": 5.4287694013303766e-05,
"loss": 0.1249,
"step": 33200
},
{
"epoch": 27.53,
"eval_loss": 0.15461181104183197,
"eval_runtime": 271.8472,
"eval_samples_per_second": 19.014,
"eval_steps_per_second": 2.38,
"eval_wer": 0.07214915755559077,
"step": 33200
},
{
"epoch": 27.69,
"learning_rate": 5.401053215077606e-05,
"loss": 0.1199,
"step": 33400
},
{
"epoch": 27.69,
"eval_loss": 0.14347407221794128,
"eval_runtime": 271.4782,
"eval_samples_per_second": 19.04,
"eval_steps_per_second": 2.383,
"eval_wer": 0.07304706068768817,
"step": 33400
},
{
"epoch": 27.86,
"learning_rate": 5.373337028824834e-05,
"loss": 0.1199,
"step": 33600
},
{
"epoch": 27.86,
"eval_loss": 0.16159255802631378,
"eval_runtime": 272.7821,
"eval_samples_per_second": 18.949,
"eval_steps_per_second": 2.372,
"eval_wer": 0.07262451803728939,
"step": 33600
},
{
"epoch": 28.03,
"learning_rate": 5.345620842572062e-05,
"loss": 0.1213,
"step": 33800
},
{
"epoch": 28.03,
"eval_loss": 0.1633623242378235,
"eval_runtime": 267.8584,
"eval_samples_per_second": 19.298,
"eval_steps_per_second": 2.415,
"eval_wer": 0.07188506839909153,
"step": 33800
},
{
"epoch": 28.19,
"learning_rate": 5.3179046563192904e-05,
"loss": 0.1166,
"step": 34000
},
{
"epoch": 28.19,
"eval_loss": 0.15763157606124878,
"eval_runtime": 258.2022,
"eval_samples_per_second": 20.019,
"eval_steps_per_second": 2.506,
"eval_wer": 0.07278297153118893,
"step": 34000
},
{
"epoch": 28.36,
"learning_rate": 5.290188470066519e-05,
"loss": 0.1123,
"step": 34200
},
{
"epoch": 28.36,
"eval_loss": 0.16512486338615417,
"eval_runtime": 256.1777,
"eval_samples_per_second": 20.177,
"eval_steps_per_second": 2.526,
"eval_wer": 0.07500132044578249,
"step": 34200
},
{
"epoch": 28.52,
"learning_rate": 5.262472283813747e-05,
"loss": 0.121,
"step": 34400
},
{
"epoch": 28.52,
"eval_loss": 0.15457598865032196,
"eval_runtime": 278.1382,
"eval_samples_per_second": 18.584,
"eval_steps_per_second": 2.326,
"eval_wer": 0.07452595996408387,
"step": 34400
},
{
"epoch": 28.69,
"learning_rate": 5.2347560975609754e-05,
"loss": 0.1197,
"step": 34600
},
{
"epoch": 28.69,
"eval_loss": 0.1601417064666748,
"eval_runtime": 278.0073,
"eval_samples_per_second": 18.593,
"eval_steps_per_second": 2.327,
"eval_wer": 0.07315269635028786,
"step": 34600
},
{
"epoch": 28.86,
"learning_rate": 5.207039911308205e-05,
"loss": 0.1168,
"step": 34800
},
{
"epoch": 28.86,
"eval_loss": 0.16127680242061615,
"eval_runtime": 278.2559,
"eval_samples_per_second": 18.576,
"eval_steps_per_second": 2.325,
"eval_wer": 0.07468441345798342,
"step": 34800
},
{
"epoch": 29.02,
"learning_rate": 5.179323725055433e-05,
"loss": 0.1205,
"step": 35000
},
{
"epoch": 29.02,
"eval_loss": 0.15306903421878815,
"eval_runtime": 276.9929,
"eval_samples_per_second": 18.661,
"eval_steps_per_second": 2.336,
"eval_wer": 0.07346960333808694,
"step": 35000
},
{
"epoch": 29.19,
"learning_rate": 5.151607538802661e-05,
"loss": 0.1165,
"step": 35200
},
{
"epoch": 29.19,
"eval_loss": 0.15544754266738892,
"eval_runtime": 276.1997,
"eval_samples_per_second": 18.715,
"eval_steps_per_second": 2.343,
"eval_wer": 0.07431468863888449,
"step": 35200
},
{
"epoch": 29.35,
"learning_rate": 5.1238913525498885e-05,
"loss": 0.1198,
"step": 35400
},
{
"epoch": 29.35,
"eval_loss": 0.15731526911258698,
"eval_runtime": 276.5622,
"eval_samples_per_second": 18.69,
"eval_steps_per_second": 2.339,
"eval_wer": 0.07288860719378862,
"step": 35400
},
{
"epoch": 29.52,
"learning_rate": 5.0963137472283814e-05,
"loss": 0.1192,
"step": 35600
},
{
"epoch": 29.52,
"eval_loss": 0.1620793640613556,
"eval_runtime": 278.1544,
"eval_samples_per_second": 18.583,
"eval_steps_per_second": 2.326,
"eval_wer": 0.07209633972429091,
"step": 35600
},
{
"epoch": 29.68,
"learning_rate": 5.0685975609756095e-05,
"loss": 0.1184,
"step": 35800
},
{
"epoch": 29.68,
"eval_loss": 0.15125353634357452,
"eval_runtime": 279.7716,
"eval_samples_per_second": 18.476,
"eval_steps_per_second": 2.313,
"eval_wer": 0.07177943273649184,
"step": 35800
},
{
"epoch": 29.85,
"learning_rate": 5.0408813747228376e-05,
"loss": 0.1141,
"step": 36000
},
{
"epoch": 29.85,
"eval_loss": 0.15804697573184967,
"eval_runtime": 279.7652,
"eval_samples_per_second": 18.476,
"eval_steps_per_second": 2.313,
"eval_wer": 0.07109280092959383,
"step": 36000
},
{
"epoch": 30.02,
"learning_rate": 5.013165188470067e-05,
"loss": 0.1147,
"step": 36200
},
{
"epoch": 30.02,
"eval_loss": 0.15915371477603912,
"eval_runtime": 260.2704,
"eval_samples_per_second": 19.86,
"eval_steps_per_second": 2.486,
"eval_wer": 0.0700364443035969,
"step": 36200
},
{
"epoch": 30.18,
"learning_rate": 4.985449002217295e-05,
"loss": 0.1124,
"step": 36400
},
{
"epoch": 30.18,
"eval_loss": 0.17016097903251648,
"eval_runtime": 265.3722,
"eval_samples_per_second": 19.478,
"eval_steps_per_second": 2.438,
"eval_wer": 0.07214915755559077,
"step": 36400
},
{
"epoch": 30.35,
"learning_rate": 4.957732815964524e-05,
"loss": 0.1128,
"step": 36600
},
{
"epoch": 30.35,
"eval_loss": 0.16143444180488586,
"eval_runtime": 255.9611,
"eval_samples_per_second": 20.194,
"eval_steps_per_second": 2.528,
"eval_wer": 0.07193788623039138,
"step": 36600
},
{
"epoch": 30.51,
"learning_rate": 4.9300166297117514e-05,
"loss": 0.1082,
"step": 36800
},
{
"epoch": 30.51,
"eval_loss": 0.16003426909446716,
"eval_runtime": 255.199,
"eval_samples_per_second": 20.255,
"eval_steps_per_second": 2.535,
"eval_wer": 0.07220197538689062,
"step": 36800
},
{
"epoch": 30.68,
"learning_rate": 4.90230044345898e-05,
"loss": 0.1159,
"step": 37000
},
{
"epoch": 30.68,
"eval_loss": 0.15168212354183197,
"eval_runtime": 255.5835,
"eval_samples_per_second": 20.224,
"eval_steps_per_second": 2.531,
"eval_wer": 0.0748956847831828,
"step": 37000
},
{
"epoch": 30.85,
"learning_rate": 4.874584257206209e-05,
"loss": 0.1124,
"step": 37200
},
{
"epoch": 30.85,
"eval_loss": 0.1633358746767044,
"eval_runtime": 254.9468,
"eval_samples_per_second": 20.275,
"eval_steps_per_second": 2.538,
"eval_wer": 0.07135689008609307,
"step": 37200
},
{
"epoch": 31.01,
"learning_rate": 4.846868070953437e-05,
"loss": 0.1153,
"step": 37400
},
{
"epoch": 31.01,
"eval_loss": 0.14990398287773132,
"eval_runtime": 255.5087,
"eval_samples_per_second": 20.23,
"eval_steps_per_second": 2.532,
"eval_wer": 0.07294142502508846,
"step": 37400
},
{
"epoch": 31.18,
"learning_rate": 4.819151884700666e-05,
"loss": 0.1083,
"step": 37600
},
{
"epoch": 31.18,
"eval_loss": 0.15318718552589417,
"eval_runtime": 255.4906,
"eval_samples_per_second": 20.232,
"eval_steps_per_second": 2.532,
"eval_wer": 0.07146252574869276,
"step": 37600
},
{
"epoch": 31.34,
"learning_rate": 4.791435698447893e-05,
"loss": 0.1082,
"step": 37800
},
{
"epoch": 31.34,
"eval_loss": 0.15611271560192108,
"eval_runtime": 255.2065,
"eval_samples_per_second": 20.254,
"eval_steps_per_second": 2.535,
"eval_wer": 0.07183225056779169,
"step": 37800
},
{
"epoch": 31.51,
"learning_rate": 4.763719512195122e-05,
"loss": 0.1114,
"step": 38000
},
{
"epoch": 31.51,
"eval_loss": 0.15616507828235626,
"eval_runtime": 255.2918,
"eval_samples_per_second": 20.247,
"eval_steps_per_second": 2.534,
"eval_wer": 0.07204352189299107,
"step": 38000
},
{
"epoch": 31.67,
"learning_rate": 4.73600332594235e-05,
"loss": 0.1103,
"step": 38200
},
{
"epoch": 31.67,
"eval_loss": 0.1566246598958969,
"eval_runtime": 255.37,
"eval_samples_per_second": 20.241,
"eval_steps_per_second": 2.534,
"eval_wer": 0.07146252574869276,
"step": 38200
},
{
"epoch": 31.84,
"learning_rate": 4.708287139689579e-05,
"loss": 0.1091,
"step": 38400
},
{
"epoch": 31.84,
"eval_loss": 0.1507750004529953,
"eval_runtime": 255.5097,
"eval_samples_per_second": 20.23,
"eval_steps_per_second": 2.532,
"eval_wer": 0.07030053346009613,
"step": 38400
},
{
"epoch": 32.01,
"learning_rate": 4.680570953436808e-05,
"loss": 0.1111,
"step": 38600
},
{
"epoch": 32.01,
"eval_loss": 0.145137757062912,
"eval_runtime": 254.9212,
"eval_samples_per_second": 20.277,
"eval_steps_per_second": 2.538,
"eval_wer": 0.07336396767548724,
"step": 38600
},
{
"epoch": 32.17,
"learning_rate": 4.652854767184035e-05,
"loss": 0.1113,
"step": 38800
},
{
"epoch": 32.17,
"eval_loss": 0.15428981184959412,
"eval_runtime": 255.1259,
"eval_samples_per_second": 20.261,
"eval_steps_per_second": 2.536,
"eval_wer": 0.07415623514498494,
"step": 38800
},
{
"epoch": 32.34,
"learning_rate": 4.625138580931264e-05,
"loss": 0.1072,
"step": 39000
},
{
"epoch": 32.34,
"eval_loss": 0.14538711309432983,
"eval_runtime": 255.0771,
"eval_samples_per_second": 20.264,
"eval_steps_per_second": 2.536,
"eval_wer": 0.07299424285638832,
"step": 39000
},
{
"epoch": 32.5,
"learning_rate": 4.597422394678492e-05,
"loss": 0.1033,
"step": 39200
},
{
"epoch": 32.5,
"eval_loss": 0.16375206410884857,
"eval_runtime": 255.084,
"eval_samples_per_second": 20.264,
"eval_steps_per_second": 2.536,
"eval_wer": 0.07135689008609307,
"step": 39200
},
{
"epoch": 32.67,
"learning_rate": 4.569706208425721e-05,
"loss": 0.1019,
"step": 39400
},
{
"epoch": 32.67,
"eval_loss": 0.16679570078849792,
"eval_runtime": 254.9797,
"eval_samples_per_second": 20.272,
"eval_steps_per_second": 2.537,
"eval_wer": 0.07183225056779169,
"step": 39400
},
{
"epoch": 32.84,
"learning_rate": 4.54199002217295e-05,
"loss": 0.1053,
"step": 39600
},
{
"epoch": 32.84,
"eval_loss": 0.16691266000270844,
"eval_runtime": 257.5588,
"eval_samples_per_second": 20.069,
"eval_steps_per_second": 2.512,
"eval_wer": 0.07082871177309459,
"step": 39600
},
{
"epoch": 33.0,
"learning_rate": 4.514273835920178e-05,
"loss": 0.1097,
"step": 39800
},
{
"epoch": 33.0,
"eval_loss": 0.17189669609069824,
"eval_runtime": 258.3507,
"eval_samples_per_second": 20.008,
"eval_steps_per_second": 2.504,
"eval_wer": 0.07288860719378862,
"step": 39800
},
{
"epoch": 33.17,
"learning_rate": 4.486557649667406e-05,
"loss": 0.1021,
"step": 40000
},
{
"epoch": 33.17,
"eval_loss": 0.16738824546337128,
"eval_runtime": 257.6603,
"eval_samples_per_second": 20.061,
"eval_steps_per_second": 2.511,
"eval_wer": 0.07177943273649184,
"step": 40000
},
{
"epoch": 33.33,
"learning_rate": 4.458980044345898e-05,
"loss": 0.1056,
"step": 40200
},
{
"epoch": 33.33,
"eval_loss": 0.15968775749206543,
"eval_runtime": 257.6821,
"eval_samples_per_second": 20.06,
"eval_steps_per_second": 2.511,
"eval_wer": 0.07098716526699414,
"step": 40200
},
{
"epoch": 33.5,
"learning_rate": 4.431263858093126e-05,
"loss": 0.1043,
"step": 40400
},
{
"epoch": 33.5,
"eval_loss": 0.16819486021995544,
"eval_runtime": 258.1617,
"eval_samples_per_second": 20.022,
"eval_steps_per_second": 2.506,
"eval_wer": 0.07294142502508846,
"step": 40400
},
{
"epoch": 33.66,
"learning_rate": 4.403547671840355e-05,
"loss": 0.1015,
"step": 40600
},
{
"epoch": 33.66,
"eval_loss": 0.17912797629833221,
"eval_runtime": 257.4928,
"eval_samples_per_second": 20.074,
"eval_steps_per_second": 2.513,
"eval_wer": 0.07389214598848572,
"step": 40600
},
{
"epoch": 33.83,
"learning_rate": 4.375831485587583e-05,
"loss": 0.1038,
"step": 40800
},
{
"epoch": 33.83,
"eval_loss": 0.16278141736984253,
"eval_runtime": 258.2425,
"eval_samples_per_second": 20.016,
"eval_steps_per_second": 2.505,
"eval_wer": 0.07299424285638832,
"step": 40800
},
{
"epoch": 34.0,
"learning_rate": 4.348115299334812e-05,
"loss": 0.1018,
"step": 41000
},
{
"epoch": 34.0,
"eval_loss": 0.17246678471565247,
"eval_runtime": 257.824,
"eval_samples_per_second": 20.049,
"eval_steps_per_second": 2.509,
"eval_wer": 0.07431468863888449,
"step": 41000
},
{
"epoch": 34.16,
"learning_rate": 4.32039911308204e-05,
"loss": 0.1002,
"step": 41200
},
{
"epoch": 34.16,
"eval_loss": 0.17683491110801697,
"eval_runtime": 259.2472,
"eval_samples_per_second": 19.938,
"eval_steps_per_second": 2.496,
"eval_wer": 0.06998362647229704,
"step": 41200
},
{
"epoch": 34.33,
"learning_rate": 4.292682926829268e-05,
"loss": 0.1004,
"step": 41400
},
{
"epoch": 34.33,
"eval_loss": 0.1728859543800354,
"eval_runtime": 258.3657,
"eval_samples_per_second": 20.007,
"eval_steps_per_second": 2.504,
"eval_wer": 0.0709343474356943,
"step": 41400
},
{
"epoch": 34.49,
"learning_rate": 4.264966740576497e-05,
"loss": 0.1023,
"step": 41600
},
{
"epoch": 34.49,
"eval_loss": 0.1567125767469406,
"eval_runtime": 258.2421,
"eval_samples_per_second": 20.016,
"eval_steps_per_second": 2.505,
"eval_wer": 0.07378651032588601,
"step": 41600
},
{
"epoch": 34.66,
"learning_rate": 4.237250554323725e-05,
"loss": 0.1003,
"step": 41800
},
{
"epoch": 34.66,
"eval_loss": 0.16443106532096863,
"eval_runtime": 258.2982,
"eval_samples_per_second": 20.012,
"eval_steps_per_second": 2.505,
"eval_wer": 0.07251888237468969,
"step": 41800
},
{
"epoch": 34.83,
"learning_rate": 4.209534368070954e-05,
"loss": 0.103,
"step": 42000
},
{
"epoch": 34.83,
"eval_loss": 0.17008621990680695,
"eval_runtime": 257.8252,
"eval_samples_per_second": 20.048,
"eval_steps_per_second": 2.509,
"eval_wer": 0.0716209792425923,
"step": 42000
},
{
"epoch": 34.99,
"learning_rate": 4.181818181818182e-05,
"loss": 0.1056,
"step": 42200
},
{
"epoch": 34.99,
"eval_loss": 0.16209852695465088,
"eval_runtime": 258.245,
"eval_samples_per_second": 20.016,
"eval_steps_per_second": 2.505,
"eval_wer": 0.06956108382189827,
"step": 42200
},
{
"epoch": 35.16,
"learning_rate": 4.15410199556541e-05,
"loss": 0.102,
"step": 42400
},
{
"epoch": 35.16,
"eval_loss": 0.1503116935491562,
"eval_runtime": 258.2089,
"eval_samples_per_second": 20.019,
"eval_steps_per_second": 2.506,
"eval_wer": 0.07024771562879628,
"step": 42400
},
{
"epoch": 35.32,
"learning_rate": 4.126385809312639e-05,
"loss": 0.0979,
"step": 42600
},
{
"epoch": 35.32,
"eval_loss": 0.15129025280475616,
"eval_runtime": 258.9706,
"eval_samples_per_second": 19.96,
"eval_steps_per_second": 2.498,
"eval_wer": 0.06977235514709766,
"step": 42600
},
{
"epoch": 35.49,
"learning_rate": 4.098808203991131e-05,
"loss": 0.0969,
"step": 42800
},
{
"epoch": 35.49,
"eval_loss": 0.16101005673408508,
"eval_runtime": 258.464,
"eval_samples_per_second": 19.999,
"eval_steps_per_second": 2.503,
"eval_wer": 0.07082871177309459,
"step": 42800
},
{
"epoch": 35.65,
"learning_rate": 4.071092017738359e-05,
"loss": 0.1016,
"step": 43000
},
{
"epoch": 35.65,
"eval_loss": 0.17464140057563782,
"eval_runtime": 258.5693,
"eval_samples_per_second": 19.991,
"eval_steps_per_second": 2.502,
"eval_wer": 0.07140970791739291,
"step": 43000
},
{
"epoch": 35.82,
"learning_rate": 4.043375831485588e-05,
"loss": 0.0994,
"step": 43200
},
{
"epoch": 35.82,
"eval_loss": 0.16432413458824158,
"eval_runtime": 259.177,
"eval_samples_per_second": 19.944,
"eval_steps_per_second": 2.496,
"eval_wer": 0.07045898695399568,
"step": 43200
},
{
"epoch": 35.99,
"learning_rate": 4.015659645232816e-05,
"loss": 0.0966,
"step": 43400
},
{
"epoch": 35.99,
"eval_loss": 0.1695939600467682,
"eval_runtime": 258.2906,
"eval_samples_per_second": 20.012,
"eval_steps_per_second": 2.505,
"eval_wer": 0.0707230761104949,
"step": 43400
}
],
"max_steps": 72360,
"num_train_epochs": 60,
"total_flos": 1.9733994835008543e+20,
"trial_name": null,
"trial_params": null
}