panjiariputra's picture
Upload trainer_state.json
c7e1027
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 9.312782393237137,
"global_step": 102910,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.02,
"learning_rate": 0.0001188,
"loss": 6.3637,
"step": 200
},
{
"epoch": 0.02,
"eval_loss": 2.970613718032837,
"eval_runtime": 1204.8934,
"eval_samples_per_second": 9.49,
"eval_steps_per_second": 1.187,
"eval_wer": 1.0,
"step": 200
},
{
"epoch": 0.04,
"learning_rate": 0.0002388,
"loss": 2.9537,
"step": 400
},
{
"epoch": 0.04,
"eval_loss": 2.926468849182129,
"eval_runtime": 1196.9703,
"eval_samples_per_second": 9.553,
"eval_steps_per_second": 1.195,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 0.06,
"learning_rate": 0.00029971291866028705,
"loss": 2.322,
"step": 600
},
{
"epoch": 0.06,
"eval_loss": 0.9299482107162476,
"eval_runtime": 1200.9258,
"eval_samples_per_second": 9.522,
"eval_steps_per_second": 1.191,
"eval_wer": 0.7969234236772412,
"step": 600
},
{
"epoch": 0.08,
"learning_rate": 0.0002991270383751586,
"loss": 1.1527,
"step": 800
},
{
"epoch": 0.08,
"eval_loss": 0.6302356719970703,
"eval_runtime": 1200.2547,
"eval_samples_per_second": 9.527,
"eval_steps_per_second": 1.191,
"eval_wer": 0.6488195187919085,
"step": 800
},
{
"epoch": 0.1,
"learning_rate": 0.00029854115809003026,
"loss": 0.9892,
"step": 1000
},
{
"epoch": 0.1,
"eval_loss": 0.5595320463180542,
"eval_runtime": 1199.9051,
"eval_samples_per_second": 9.53,
"eval_steps_per_second": 1.192,
"eval_wer": 0.6062207697075562,
"step": 1000
},
{
"epoch": 0.12,
"learning_rate": 0.00029795527780490183,
"loss": 0.8919,
"step": 1200
},
{
"epoch": 0.12,
"eval_loss": 0.5005972981452942,
"eval_runtime": 1200.1109,
"eval_samples_per_second": 9.528,
"eval_steps_per_second": 1.192,
"eval_wer": 0.5602411675212712,
"step": 1200
},
{
"epoch": 0.02,
"learning_rate": 0.0002973693975197734,
"loss": 0.8609,
"step": 1400
},
{
"epoch": 0.02,
"eval_loss": 0.4540606439113617,
"eval_runtime": 1277.6037,
"eval_samples_per_second": 8.95,
"eval_steps_per_second": 1.119,
"eval_wer": 0.5377472248830788,
"step": 1400
},
{
"epoch": 0.04,
"learning_rate": 0.00029678351723464504,
"loss": 0.8229,
"step": 1600
},
{
"epoch": 0.04,
"eval_loss": 0.42465054988861084,
"eval_runtime": 1258.3012,
"eval_samples_per_second": 9.088,
"eval_steps_per_second": 1.136,
"eval_wer": 0.5064968727108807,
"step": 1600
},
{
"epoch": 0.06,
"learning_rate": 0.0002961976369495166,
"loss": 0.7813,
"step": 1800
},
{
"epoch": 0.06,
"eval_loss": 0.4217381477355957,
"eval_runtime": 1266.2898,
"eval_samples_per_second": 9.03,
"eval_steps_per_second": 1.129,
"eval_wer": 0.5103735842677636,
"step": 1800
},
{
"epoch": 0.08,
"learning_rate": 0.0002956117566643882,
"loss": 0.7586,
"step": 2000
},
{
"epoch": 0.08,
"eval_loss": 0.3938300311565399,
"eval_runtime": 1264.268,
"eval_samples_per_second": 9.045,
"eval_steps_per_second": 1.131,
"eval_wer": 0.48733870513326194,
"step": 2000
},
{
"epoch": 0.1,
"learning_rate": 0.0002950258763792598,
"loss": 0.7416,
"step": 2200
},
{
"epoch": 0.1,
"eval_loss": 0.3816222548484802,
"eval_runtime": 1263.3113,
"eval_samples_per_second": 9.052,
"eval_steps_per_second": 1.132,
"eval_wer": 0.46917225446554345,
"step": 2200
},
{
"epoch": 0.12,
"learning_rate": 0.0002944399960941314,
"loss": 0.7077,
"step": 2400
},
{
"epoch": 0.12,
"eval_loss": 0.4034684896469116,
"eval_runtime": 1262.8373,
"eval_samples_per_second": 9.055,
"eval_steps_per_second": 1.132,
"eval_wer": 0.4645404857158956,
"step": 2400
},
{
"epoch": 0.14,
"learning_rate": 0.000293854115809003,
"loss": 0.7359,
"step": 2600
},
{
"epoch": 0.14,
"eval_loss": 0.3767629861831665,
"eval_runtime": 1266.8299,
"eval_samples_per_second": 9.026,
"eval_steps_per_second": 1.129,
"eval_wer": 0.46494618808812754,
"step": 2600
},
{
"epoch": 0.16,
"learning_rate": 0.0002932682355238746,
"loss": 0.7335,
"step": 2800
},
{
"epoch": 0.16,
"eval_loss": 0.37543314695358276,
"eval_runtime": 1278.5608,
"eval_samples_per_second": 8.944,
"eval_steps_per_second": 1.118,
"eval_wer": 0.4669296219079281,
"step": 2800
},
{
"epoch": 0.17,
"learning_rate": 0.0002926823552387462,
"loss": 0.7204,
"step": 3000
},
{
"epoch": 0.17,
"eval_loss": 0.3659396171569824,
"eval_runtime": 1288.786,
"eval_samples_per_second": 8.873,
"eval_steps_per_second": 1.11,
"eval_wer": 0.4529103510452471,
"step": 3000
},
{
"epoch": 0.19,
"learning_rate": 0.00029209647495361777,
"loss": 0.7003,
"step": 3200
},
{
"epoch": 0.19,
"eval_loss": 0.3635198473930359,
"eval_runtime": 1309.43,
"eval_samples_per_second": 8.733,
"eval_steps_per_second": 1.092,
"eval_wer": 0.43374091395728853,
"step": 3200
},
{
"epoch": 0.21,
"learning_rate": 0.0002915105946684894,
"loss": 0.7048,
"step": 3400
},
{
"epoch": 0.21,
"eval_loss": 0.33965152502059937,
"eval_runtime": 1308.7374,
"eval_samples_per_second": 8.737,
"eval_steps_per_second": 1.093,
"eval_wer": 0.4208824026596044,
"step": 3400
},
{
"epoch": 0.23,
"learning_rate": 0.000290924714383361,
"loss": 0.6782,
"step": 3600
},
{
"epoch": 0.23,
"eval_loss": 0.34997662901878357,
"eval_runtime": 1307.483,
"eval_samples_per_second": 8.746,
"eval_steps_per_second": 1.094,
"eval_wer": 0.43742604383839523,
"step": 3600
},
{
"epoch": 0.25,
"learning_rate": 0.00029033883409823255,
"loss": 0.6748,
"step": 3800
},
{
"epoch": 0.25,
"eval_loss": 0.328862726688385,
"eval_runtime": 1308.3222,
"eval_samples_per_second": 8.74,
"eval_steps_per_second": 1.093,
"eval_wer": 0.4091283033752183,
"step": 3800
},
{
"epoch": 0.27,
"learning_rate": 0.0002897558832145298,
"loss": 0.6673,
"step": 4000
},
{
"epoch": 0.27,
"eval_loss": 0.328796923160553,
"eval_runtime": 1280.3163,
"eval_samples_per_second": 8.931,
"eval_steps_per_second": 1.117,
"eval_wer": 0.42204316222460136,
"step": 4000
},
{
"epoch": 0.29,
"learning_rate": 0.0002891700029294014,
"loss": 0.682,
"step": 4200
},
{
"epoch": 0.29,
"eval_loss": 0.32723408937454224,
"eval_runtime": 1263.2249,
"eval_samples_per_second": 9.052,
"eval_steps_per_second": 1.132,
"eval_wer": 0.40732518172085425,
"step": 4200
},
{
"epoch": 0.31,
"learning_rate": 0.000288584122644273,
"loss": 0.6484,
"step": 4400
},
{
"epoch": 0.31,
"eval_loss": 0.3117896616458893,
"eval_runtime": 1263.1269,
"eval_samples_per_second": 9.053,
"eval_steps_per_second": 1.132,
"eval_wer": 0.39746436017355047,
"step": 4400
},
{
"epoch": 0.33,
"learning_rate": 0.0002879982423591446,
"loss": 0.6614,
"step": 4600
},
{
"epoch": 0.33,
"eval_loss": 0.3179396390914917,
"eval_runtime": 1264.4151,
"eval_samples_per_second": 9.044,
"eval_steps_per_second": 1.131,
"eval_wer": 0.3975094382149096,
"step": 4600
},
{
"epoch": 0.35,
"learning_rate": 0.0002874123620740162,
"loss": 0.6557,
"step": 4800
},
{
"epoch": 0.35,
"eval_loss": 0.31483808159828186,
"eval_runtime": 1264.2237,
"eval_samples_per_second": 9.045,
"eval_steps_per_second": 1.131,
"eval_wer": 0.39069138445934526,
"step": 4800
},
{
"epoch": 0.37,
"learning_rate": 0.00028682648178888776,
"loss": 0.6501,
"step": 5000
},
{
"epoch": 0.37,
"eval_loss": 0.32537421584129333,
"eval_runtime": 1269.162,
"eval_samples_per_second": 9.01,
"eval_steps_per_second": 1.127,
"eval_wer": 0.3900828309009974,
"step": 5000
},
{
"epoch": 0.39,
"learning_rate": 0.00028624060150375934,
"loss": 0.6487,
"step": 5200
},
{
"epoch": 0.39,
"eval_loss": 0.29997891187667847,
"eval_runtime": 1266.7543,
"eval_samples_per_second": 9.027,
"eval_steps_per_second": 1.129,
"eval_wer": 0.3837042880486843,
"step": 5200
},
{
"epoch": 0.41,
"learning_rate": 0.00028565472121863097,
"loss": 0.6493,
"step": 5400
},
{
"epoch": 0.41,
"eval_loss": 0.2948152720928192,
"eval_runtime": 1259.7136,
"eval_samples_per_second": 9.077,
"eval_steps_per_second": 1.135,
"eval_wer": 0.3774271707894292,
"step": 5400
},
{
"epoch": 0.43,
"learning_rate": 0.00028506884093350255,
"loss": 0.6302,
"step": 5600
},
{
"epoch": 0.43,
"eval_loss": 0.29879939556121826,
"eval_runtime": 1259.867,
"eval_samples_per_second": 9.076,
"eval_steps_per_second": 1.135,
"eval_wer": 0.3797824984504423,
"step": 5600
},
{
"epoch": 0.45,
"learning_rate": 0.0002844829606483741,
"loss": 0.6508,
"step": 5800
},
{
"epoch": 0.45,
"eval_loss": 0.29643869400024414,
"eval_runtime": 1261.7676,
"eval_samples_per_second": 9.063,
"eval_steps_per_second": 1.133,
"eval_wer": 0.3807742153603426,
"step": 5800
},
{
"epoch": 0.47,
"learning_rate": 0.00028389708036324576,
"loss": 0.6188,
"step": 6000
},
{
"epoch": 0.47,
"eval_loss": 0.29014137387275696,
"eval_runtime": 1270.9486,
"eval_samples_per_second": 8.997,
"eval_steps_per_second": 1.125,
"eval_wer": 0.3699554854341579,
"step": 6000
},
{
"epoch": 0.49,
"learning_rate": 0.0002833112000781174,
"loss": 0.6215,
"step": 6200
},
{
"epoch": 0.49,
"eval_loss": 0.29307612776756287,
"eval_runtime": 1276.8284,
"eval_samples_per_second": 8.956,
"eval_steps_per_second": 1.12,
"eval_wer": 0.3614244661069477,
"step": 6200
},
{
"epoch": 0.51,
"learning_rate": 0.0002827253197929889,
"loss": 0.6035,
"step": 6400
},
{
"epoch": 0.51,
"eval_loss": 0.2853919267654419,
"eval_runtime": 1270.8617,
"eval_samples_per_second": 8.998,
"eval_steps_per_second": 1.125,
"eval_wer": 0.3639150278920381,
"step": 6400
},
{
"epoch": 0.52,
"learning_rate": 0.00028213943950786054,
"loss": 0.613,
"step": 6600
},
{
"epoch": 0.52,
"eval_loss": 0.2793109714984894,
"eval_runtime": 1273.0596,
"eval_samples_per_second": 8.982,
"eval_steps_per_second": 1.123,
"eval_wer": 0.3593170676734096,
"step": 6600
},
{
"epoch": 0.54,
"learning_rate": 0.0002815535592227321,
"loss": 0.5967,
"step": 6800
},
{
"epoch": 0.54,
"eval_loss": 0.2713634669780731,
"eval_runtime": 1279.2102,
"eval_samples_per_second": 8.939,
"eval_steps_per_second": 1.118,
"eval_wer": 0.35412182340677295,
"step": 6800
},
{
"epoch": 0.56,
"learning_rate": 0.00028096767893760375,
"loss": 0.6118,
"step": 7000
},
{
"epoch": 0.56,
"eval_loss": 0.27592843770980835,
"eval_runtime": 1269.9249,
"eval_samples_per_second": 9.004,
"eval_steps_per_second": 1.126,
"eval_wer": 0.34716853552713134,
"step": 7000
},
{
"epoch": 0.58,
"learning_rate": 0.00028038179865247533,
"loss": 0.6016,
"step": 7200
},
{
"epoch": 0.58,
"eval_loss": 0.27817872166633606,
"eval_runtime": 1278.4857,
"eval_samples_per_second": 8.944,
"eval_steps_per_second": 1.119,
"eval_wer": 0.35648842057812585,
"step": 7200
},
{
"epoch": 0.6,
"learning_rate": 0.0002797959183673469,
"loss": 0.5965,
"step": 7400
},
{
"epoch": 0.6,
"eval_loss": 0.2640519440174103,
"eval_runtime": 1280.4206,
"eval_samples_per_second": 8.931,
"eval_steps_per_second": 1.117,
"eval_wer": 0.3394714599650645,
"step": 7400
},
{
"epoch": 0.62,
"learning_rate": 0.00027921003808221854,
"loss": 0.596,
"step": 7600
},
{
"epoch": 0.62,
"eval_loss": 0.2649860978126526,
"eval_runtime": 1278.933,
"eval_samples_per_second": 8.941,
"eval_steps_per_second": 1.118,
"eval_wer": 0.3421197948949118,
"step": 7600
},
{
"epoch": 0.64,
"learning_rate": 0.0002786241577970901,
"loss": 0.6075,
"step": 7800
},
{
"epoch": 0.64,
"eval_loss": 0.26620569825172424,
"eval_runtime": 1277.4585,
"eval_samples_per_second": 8.951,
"eval_steps_per_second": 1.119,
"eval_wer": 0.3415225108469037,
"step": 7800
},
{
"epoch": 0.66,
"learning_rate": 0.0002780382775119617,
"loss": 0.5988,
"step": 8000
},
{
"epoch": 0.66,
"eval_loss": 0.2684703469276428,
"eval_runtime": 1278.0005,
"eval_samples_per_second": 8.948,
"eval_steps_per_second": 1.119,
"eval_wer": 0.336383614131966,
"step": 8000
},
{
"epoch": 0.68,
"learning_rate": 0.0002774523972268333,
"loss": 0.5973,
"step": 8200
},
{
"epoch": 0.68,
"eval_loss": 0.25252845883369446,
"eval_runtime": 1274.619,
"eval_samples_per_second": 8.971,
"eval_steps_per_second": 1.122,
"eval_wer": 0.33392686087789486,
"step": 8200
},
{
"epoch": 0.7,
"learning_rate": 0.0002768665169417049,
"loss": 0.5809,
"step": 8400
},
{
"epoch": 0.7,
"eval_loss": 0.2525635361671448,
"eval_runtime": 1273.2438,
"eval_samples_per_second": 8.981,
"eval_steps_per_second": 1.123,
"eval_wer": 0.322713698089818,
"step": 8400
},
{
"epoch": 0.72,
"learning_rate": 0.0002762806366565765,
"loss": 0.574,
"step": 8600
},
{
"epoch": 0.72,
"eval_loss": 0.25077855587005615,
"eval_runtime": 1281.2675,
"eval_samples_per_second": 8.925,
"eval_steps_per_second": 1.116,
"eval_wer": 0.32358145038598074,
"step": 8600
},
{
"epoch": 0.74,
"learning_rate": 0.0002756947563714481,
"loss": 0.5893,
"step": 8800
},
{
"epoch": 0.74,
"eval_loss": 0.25881966948509216,
"eval_runtime": 1276.5376,
"eval_samples_per_second": 8.958,
"eval_steps_per_second": 1.12,
"eval_wer": 0.3342649461880881,
"step": 8800
},
{
"epoch": 0.76,
"learning_rate": 0.0002751088760863197,
"loss": 0.5876,
"step": 9000
},
{
"epoch": 0.76,
"eval_loss": 0.25579118728637695,
"eval_runtime": 1273.8923,
"eval_samples_per_second": 8.976,
"eval_steps_per_second": 1.123,
"eval_wer": 0.3283709922803854,
"step": 9000
},
{
"epoch": 0.78,
"learning_rate": 0.00027452299580119126,
"loss": 0.5686,
"step": 9200
},
{
"epoch": 0.78,
"eval_loss": 0.24226322770118713,
"eval_runtime": 1284.5776,
"eval_samples_per_second": 8.902,
"eval_steps_per_second": 1.113,
"eval_wer": 0.311004676846791,
"step": 9200
},
{
"epoch": 0.8,
"learning_rate": 0.00027393711551606284,
"loss": 0.5798,
"step": 9400
},
{
"epoch": 0.8,
"eval_loss": 0.24731135368347168,
"eval_runtime": 1276.3349,
"eval_samples_per_second": 8.959,
"eval_steps_per_second": 1.12,
"eval_wer": 0.3168648222234744,
"step": 9400
},
{
"epoch": 0.82,
"learning_rate": 0.00027335123523093447,
"loss": 0.5758,
"step": 9600
},
{
"epoch": 0.82,
"eval_loss": 0.2408532351255417,
"eval_runtime": 1298.8974,
"eval_samples_per_second": 8.804,
"eval_steps_per_second": 1.101,
"eval_wer": 0.3150053530174114,
"step": 9600
},
{
"epoch": 0.84,
"learning_rate": 0.00027276535494580605,
"loss": 0.5717,
"step": 9800
},
{
"epoch": 0.84,
"eval_loss": 0.24253633618354797,
"eval_runtime": 1290.9724,
"eval_samples_per_second": 8.858,
"eval_steps_per_second": 1.108,
"eval_wer": 0.30879585282019495,
"step": 9800
},
{
"epoch": 0.86,
"learning_rate": 0.0002721794746606776,
"loss": 0.5515,
"step": 10000
},
{
"epoch": 0.86,
"eval_loss": 0.24737118184566498,
"eval_runtime": 1307.8378,
"eval_samples_per_second": 8.743,
"eval_steps_per_second": 1.093,
"eval_wer": 0.31223305347382657,
"step": 10000
},
{
"epoch": 0.87,
"learning_rate": 0.00027159359437554925,
"loss": 0.5719,
"step": 10200
},
{
"epoch": 0.87,
"eval_loss": 0.23542268574237823,
"eval_runtime": 1311.0297,
"eval_samples_per_second": 8.722,
"eval_steps_per_second": 1.091,
"eval_wer": 0.30239477094720235,
"step": 10200
},
{
"epoch": 0.89,
"learning_rate": 0.00027100771409042083,
"loss": 0.5614,
"step": 10400
},
{
"epoch": 0.89,
"eval_loss": 0.247614324092865,
"eval_runtime": 1303.8784,
"eval_samples_per_second": 8.77,
"eval_steps_per_second": 1.097,
"eval_wer": 0.3179579647264326,
"step": 10400
},
{
"epoch": 0.91,
"learning_rate": 0.00027042476320671805,
"loss": 0.5593,
"step": 10600
},
{
"epoch": 0.91,
"eval_loss": 0.23083819448947906,
"eval_runtime": 1300.6119,
"eval_samples_per_second": 8.792,
"eval_steps_per_second": 1.099,
"eval_wer": 0.2990251873556094,
"step": 10600
},
{
"epoch": 0.93,
"learning_rate": 0.0002698388829215897,
"loss": 0.5617,
"step": 10800
},
{
"epoch": 0.93,
"eval_loss": 0.235725536942482,
"eval_runtime": 1286.8437,
"eval_samples_per_second": 8.886,
"eval_steps_per_second": 1.111,
"eval_wer": 0.29992674818279147,
"step": 10800
},
{
"epoch": 0.95,
"learning_rate": 0.00026925300263646126,
"loss": 0.5596,
"step": 11000
},
{
"epoch": 0.95,
"eval_loss": 0.24363787472248077,
"eval_runtime": 1282.1875,
"eval_samples_per_second": 8.918,
"eval_steps_per_second": 1.115,
"eval_wer": 0.30588831915253284,
"step": 11000
},
{
"epoch": 1.02,
"learning_rate": 0.00026866712235133284,
"loss": 0.5505,
"step": 11200
},
{
"epoch": 1.02,
"eval_loss": 0.2367905229330063,
"eval_runtime": 1272.677,
"eval_samples_per_second": 8.985,
"eval_steps_per_second": 1.124,
"eval_wer": 0.30030991153434383,
"step": 11200
},
{
"epoch": 1.04,
"learning_rate": 0.00026808124206620447,
"loss": 0.5445,
"step": 11400
},
{
"epoch": 1.04,
"eval_loss": 0.2314738780260086,
"eval_runtime": 1260.4441,
"eval_samples_per_second": 9.072,
"eval_steps_per_second": 1.135,
"eval_wer": 0.2962866963430439,
"step": 11400
},
{
"epoch": 1.06,
"learning_rate": 0.00026749536178107604,
"loss": 0.5259,
"step": 11600
},
{
"epoch": 1.06,
"eval_loss": 0.2309747040271759,
"eval_runtime": 1241.2773,
"eval_samples_per_second": 9.212,
"eval_steps_per_second": 1.152,
"eval_wer": 0.2933002761030033,
"step": 11600
},
{
"epoch": 1.08,
"learning_rate": 0.0002669094814959476,
"loss": 0.5268,
"step": 11800
},
{
"epoch": 1.08,
"eval_loss": 0.22442255914211273,
"eval_runtime": 1246.8773,
"eval_samples_per_second": 9.171,
"eval_steps_per_second": 1.147,
"eval_wer": 0.2917788922071336,
"step": 11800
},
{
"epoch": 1.1,
"learning_rate": 0.00026632360121081925,
"loss": 0.5479,
"step": 12000
},
{
"epoch": 1.1,
"eval_loss": 0.22898849844932556,
"eval_runtime": 1248.9274,
"eval_samples_per_second": 9.156,
"eval_steps_per_second": 1.145,
"eval_wer": 0.2952048233504254,
"step": 12000
},
{
"epoch": 1.12,
"learning_rate": 0.00026573772092569083,
"loss": 0.5308,
"step": 12200
},
{
"epoch": 1.12,
"eval_loss": 0.2276710867881775,
"eval_runtime": 1248.0355,
"eval_samples_per_second": 9.162,
"eval_steps_per_second": 1.146,
"eval_wer": 0.28650476136811853,
"step": 12200
},
{
"epoch": 1.14,
"learning_rate": 0.0002651518406405624,
"loss": 0.5345,
"step": 12400
},
{
"epoch": 1.14,
"eval_loss": 0.22329020500183105,
"eval_runtime": 1258.1958,
"eval_samples_per_second": 9.088,
"eval_steps_per_second": 1.137,
"eval_wer": 0.29397644672338985,
"step": 12400
},
{
"epoch": 1.16,
"learning_rate": 0.00026456596035543404,
"loss": 0.5324,
"step": 12600
},
{
"epoch": 1.16,
"eval_loss": 0.23222756385803223,
"eval_runtime": 1257.7533,
"eval_samples_per_second": 9.092,
"eval_steps_per_second": 1.137,
"eval_wer": 0.2929734603031498,
"step": 12600
},
{
"epoch": 1.17,
"learning_rate": 0.00026398300947173126,
"loss": 0.5374,
"step": 12800
},
{
"epoch": 1.17,
"eval_loss": 0.21313965320587158,
"eval_runtime": 1251.7467,
"eval_samples_per_second": 9.135,
"eval_steps_per_second": 1.142,
"eval_wer": 0.27523525102834284,
"step": 12800
},
{
"epoch": 1.19,
"learning_rate": 0.00026339712918660283,
"loss": 0.5177,
"step": 13000
},
{
"epoch": 1.19,
"eval_loss": 0.2149176001548767,
"eval_runtime": 1254.8601,
"eval_samples_per_second": 9.113,
"eval_steps_per_second": 1.14,
"eval_wer": 0.2795063954471178,
"step": 13000
},
{
"epoch": 1.21,
"learning_rate": 0.00026281124890147447,
"loss": 0.5234,
"step": 13200
},
{
"epoch": 1.21,
"eval_loss": 0.21338462829589844,
"eval_runtime": 1267.9076,
"eval_samples_per_second": 9.019,
"eval_steps_per_second": 1.128,
"eval_wer": 0.2745478108976165,
"step": 13200
},
{
"epoch": 1.23,
"learning_rate": 0.00026222536861634604,
"loss": 0.5208,
"step": 13400
},
{
"epoch": 1.23,
"eval_loss": 0.21556991338729858,
"eval_runtime": 1278.0567,
"eval_samples_per_second": 8.947,
"eval_steps_per_second": 1.119,
"eval_wer": 0.27523525102834284,
"step": 13400
},
{
"epoch": 1.25,
"learning_rate": 0.0002616394883312176,
"loss": 0.5139,
"step": 13600
},
{
"epoch": 1.25,
"eval_loss": 0.21141602098941803,
"eval_runtime": 1279.0428,
"eval_samples_per_second": 8.94,
"eval_steps_per_second": 1.118,
"eval_wer": 0.2733307037809207,
"step": 13600
},
{
"epoch": 1.27,
"learning_rate": 0.00026105360804608925,
"loss": 0.5034,
"step": 13800
},
{
"epoch": 1.27,
"eval_loss": 0.21080410480499268,
"eval_runtime": 1283.2325,
"eval_samples_per_second": 8.911,
"eval_steps_per_second": 1.114,
"eval_wer": 0.2685524313968558,
"step": 13800
},
{
"epoch": 1.29,
"learning_rate": 0.00026046772776096083,
"loss": 0.5283,
"step": 14000
},
{
"epoch": 1.29,
"eval_loss": 0.21575190126895905,
"eval_runtime": 1258.3659,
"eval_samples_per_second": 9.087,
"eval_steps_per_second": 1.136,
"eval_wer": 0.2740406829323266,
"step": 14000
},
{
"epoch": 1.31,
"learning_rate": 0.0002598818474758324,
"loss": 0.5166,
"step": 14200
},
{
"epoch": 1.31,
"eval_loss": 0.20629876852035522,
"eval_runtime": 1254.3394,
"eval_samples_per_second": 9.116,
"eval_steps_per_second": 1.14,
"eval_wer": 0.2717980503747112,
"step": 14200
},
{
"epoch": 1.33,
"learning_rate": 0.00025929596719070404,
"loss": 0.5214,
"step": 14400
},
{
"epoch": 1.33,
"eval_loss": 0.20648950338363647,
"eval_runtime": 1257.7224,
"eval_samples_per_second": 9.092,
"eval_steps_per_second": 1.137,
"eval_wer": 0.2600552206006649,
"step": 14400
},
{
"epoch": 1.35,
"learning_rate": 0.0002587100869055756,
"loss": 0.511,
"step": 14600
},
{
"epoch": 1.35,
"eval_loss": 0.21166543662548065,
"eval_runtime": 1257.0914,
"eval_samples_per_second": 9.096,
"eval_steps_per_second": 1.138,
"eval_wer": 0.2707837944441314,
"step": 14600
},
{
"epoch": 1.37,
"learning_rate": 0.0002581242066204472,
"loss": 0.5086,
"step": 14800
},
{
"epoch": 1.37,
"eval_loss": 0.20775602757930756,
"eval_runtime": 1250.3755,
"eval_samples_per_second": 9.145,
"eval_steps_per_second": 1.144,
"eval_wer": 0.26485603200540936,
"step": 14800
},
{
"epoch": 1.39,
"learning_rate": 0.00025753832633531877,
"loss": 0.5134,
"step": 15000
},
{
"epoch": 1.39,
"eval_loss": 0.20706060528755188,
"eval_runtime": 1256.0437,
"eval_samples_per_second": 9.104,
"eval_steps_per_second": 1.138,
"eval_wer": 0.2688341691553502,
"step": 15000
},
{
"epoch": 1.41,
"learning_rate": 0.00025695537545161604,
"loss": 0.5021,
"step": 15200
},
{
"epoch": 1.41,
"eval_loss": 0.2014995664358139,
"eval_runtime": 1266.4014,
"eval_samples_per_second": 9.03,
"eval_steps_per_second": 1.129,
"eval_wer": 0.26383050656448975,
"step": 15200
},
{
"epoch": 1.43,
"learning_rate": 0.0002563694951664876,
"loss": 0.506,
"step": 15400
},
{
"epoch": 1.43,
"eval_loss": 0.20584553480148315,
"eval_runtime": 1282.7956,
"eval_samples_per_second": 8.914,
"eval_steps_per_second": 1.115,
"eval_wer": 0.2588268439736294,
"step": 15400
},
{
"epoch": 1.45,
"learning_rate": 0.00025578361488135925,
"loss": 0.5139,
"step": 15600
},
{
"epoch": 1.45,
"eval_loss": 0.20228460431098938,
"eval_runtime": 1297.6236,
"eval_samples_per_second": 8.812,
"eval_steps_per_second": 1.102,
"eval_wer": 0.25989744745590804,
"step": 15600
},
{
"epoch": 1.47,
"learning_rate": 0.0002551977345962308,
"loss": 0.4951,
"step": 15800
},
{
"epoch": 1.47,
"eval_loss": 0.20315276086330414,
"eval_runtime": 1298.6234,
"eval_samples_per_second": 8.805,
"eval_steps_per_second": 1.101,
"eval_wer": 0.26025807178678084,
"step": 15800
},
{
"epoch": 1.49,
"learning_rate": 0.0002546118543111024,
"loss": 0.492,
"step": 16000
},
{
"epoch": 1.49,
"eval_loss": 0.19616416096687317,
"eval_runtime": 1288.7568,
"eval_samples_per_second": 8.873,
"eval_steps_per_second": 1.11,
"eval_wer": 0.25178340001126953,
"step": 16000
},
{
"epoch": 1.51,
"learning_rate": 0.000254025974025974,
"loss": 0.4886,
"step": 16200
},
{
"epoch": 1.51,
"eval_loss": 0.1980104148387909,
"eval_runtime": 1289.7166,
"eval_samples_per_second": 8.866,
"eval_steps_per_second": 1.109,
"eval_wer": 0.24772637628895025,
"step": 16200
},
{
"epoch": 1.52,
"learning_rate": 0.0002534400937408456,
"loss": 0.4847,
"step": 16400
},
{
"epoch": 1.52,
"eval_loss": 0.19249635934829712,
"eval_runtime": 1251.9702,
"eval_samples_per_second": 9.134,
"eval_steps_per_second": 1.142,
"eval_wer": 0.2432974587254184,
"step": 16400
},
{
"epoch": 1.54,
"learning_rate": 0.0002528542134557172,
"loss": 0.4818,
"step": 16600
},
{
"epoch": 1.54,
"eval_loss": 0.1978258192539215,
"eval_runtime": 1264.8774,
"eval_samples_per_second": 9.04,
"eval_steps_per_second": 1.131,
"eval_wer": 0.25403730207922465,
"step": 16600
},
{
"epoch": 1.56,
"learning_rate": 0.00025226833317058876,
"loss": 0.4823,
"step": 16800
},
{
"epoch": 1.56,
"eval_loss": 0.1943204402923584,
"eval_runtime": 1276.7796,
"eval_samples_per_second": 8.956,
"eval_steps_per_second": 1.12,
"eval_wer": 0.24585563757254747,
"step": 16800
},
{
"epoch": 1.58,
"learning_rate": 0.0002516824528854604,
"loss": 0.4834,
"step": 17000
},
{
"epoch": 1.58,
"eval_loss": 0.19206224381923676,
"eval_runtime": 1273.2063,
"eval_samples_per_second": 8.981,
"eval_steps_per_second": 1.123,
"eval_wer": 0.24493153772468587,
"step": 17000
},
{
"epoch": 1.6,
"learning_rate": 0.000251096572600332,
"loss": 0.4814,
"step": 17200
},
{
"epoch": 1.6,
"eval_loss": 0.18929176032543182,
"eval_runtime": 1279.8788,
"eval_samples_per_second": 8.934,
"eval_steps_per_second": 1.117,
"eval_wer": 0.2424973234912943,
"step": 17200
},
{
"epoch": 1.62,
"learning_rate": 0.00025051069231520355,
"loss": 0.4961,
"step": 17400
},
{
"epoch": 1.62,
"eval_loss": 0.19354866445064545,
"eval_runtime": 1283.269,
"eval_samples_per_second": 8.911,
"eval_steps_per_second": 1.114,
"eval_wer": 0.2469037020341466,
"step": 17400
},
{
"epoch": 1.64,
"learning_rate": 0.0002499277414315008,
"loss": 0.4899,
"step": 17600
},
{
"epoch": 1.64,
"eval_loss": 0.19293488562107086,
"eval_runtime": 1281.2009,
"eval_samples_per_second": 8.925,
"eval_steps_per_second": 1.116,
"eval_wer": 0.2515467402941342,
"step": 17600
},
{
"epoch": 1.66,
"learning_rate": 0.0002493418611463724,
"loss": 0.4859,
"step": 17800
},
{
"epoch": 1.66,
"eval_loss": 0.1929776519536972,
"eval_runtime": 1274.0955,
"eval_samples_per_second": 8.975,
"eval_steps_per_second": 1.122,
"eval_wer": 0.2457429424691497,
"step": 17800
},
{
"epoch": 1.68,
"learning_rate": 0.000248755980861244,
"loss": 0.4889,
"step": 18000
},
{
"epoch": 1.68,
"eval_loss": 0.18940649926662445,
"eval_runtime": 1293.2691,
"eval_samples_per_second": 8.842,
"eval_steps_per_second": 1.106,
"eval_wer": 0.24051388967149379,
"step": 18000
},
{
"epoch": 1.7,
"learning_rate": 0.0002481701005761156,
"loss": 0.4718,
"step": 18200
},
{
"epoch": 1.7,
"eval_loss": 0.18651717901229858,
"eval_runtime": 1283.6643,
"eval_samples_per_second": 8.908,
"eval_steps_per_second": 1.114,
"eval_wer": 0.23402265171578296,
"step": 18200
},
{
"epoch": 1.72,
"learning_rate": 0.0002475842202909872,
"loss": 0.4784,
"step": 18400
},
{
"epoch": 1.72,
"eval_loss": 0.18498806655406952,
"eval_runtime": 1277.8059,
"eval_samples_per_second": 8.949,
"eval_steps_per_second": 1.119,
"eval_wer": 0.23561165267369133,
"step": 18400
},
{
"epoch": 1.74,
"learning_rate": 0.00024699834000585876,
"loss": 0.4843,
"step": 18600
},
{
"epoch": 1.74,
"eval_loss": 0.18745319545269012,
"eval_runtime": 1301.5017,
"eval_samples_per_second": 8.786,
"eval_steps_per_second": 1.099,
"eval_wer": 0.2299092804417648,
"step": 18600
},
{
"epoch": 1.76,
"learning_rate": 0.00024641538912215604,
"loss": 0.4768,
"step": 18800
},
{
"epoch": 1.76,
"eval_loss": 0.18831437826156616,
"eval_runtime": 1283.9645,
"eval_samples_per_second": 8.906,
"eval_steps_per_second": 1.114,
"eval_wer": 0.23689637685242576,
"step": 18800
},
{
"epoch": 1.78,
"learning_rate": 0.0002458295088370276,
"loss": 0.4599,
"step": 19000
},
{
"epoch": 1.78,
"eval_loss": 0.18521185219287872,
"eval_runtime": 1294.064,
"eval_samples_per_second": 8.837,
"eval_steps_per_second": 1.105,
"eval_wer": 0.2295373866005522,
"step": 19000
},
{
"epoch": 1.8,
"learning_rate": 0.0002452436285518992,
"loss": 0.4944,
"step": 19200
},
{
"epoch": 1.8,
"eval_loss": 0.1821286529302597,
"eval_runtime": 1279.5843,
"eval_samples_per_second": 8.936,
"eval_steps_per_second": 1.118,
"eval_wer": 0.23201667887530286,
"step": 19200
},
{
"epoch": 1.82,
"learning_rate": 0.0002446577482667708,
"loss": 0.4753,
"step": 19400
},
{
"epoch": 1.82,
"eval_loss": 0.18405307829380035,
"eval_runtime": 1292.3701,
"eval_samples_per_second": 8.848,
"eval_steps_per_second": 1.106,
"eval_wer": 0.23243365075787456,
"step": 19400
},
{
"epoch": 1.84,
"learning_rate": 0.0002440718679816424,
"loss": 0.4675,
"step": 19600
},
{
"epoch": 1.84,
"eval_loss": 0.18435348570346832,
"eval_runtime": 1281.9809,
"eval_samples_per_second": 8.92,
"eval_steps_per_second": 1.115,
"eval_wer": 0.23523975883247872,
"step": 19600
},
{
"epoch": 1.86,
"learning_rate": 0.00024348598769651398,
"loss": 0.4615,
"step": 19800
},
{
"epoch": 1.86,
"eval_loss": 0.17844724655151367,
"eval_runtime": 1282.3895,
"eval_samples_per_second": 8.917,
"eval_steps_per_second": 1.115,
"eval_wer": 0.2273511015946357,
"step": 19800
},
{
"epoch": 1.87,
"learning_rate": 0.00024290010741138558,
"loss": 0.4723,
"step": 20000
},
{
"epoch": 1.87,
"eval_loss": 0.1748301386833191,
"eval_runtime": 1290.0733,
"eval_samples_per_second": 8.864,
"eval_steps_per_second": 1.108,
"eval_wer": 0.2285231306699724,
"step": 20000
},
{
"epoch": 1.89,
"learning_rate": 0.00024231422712625716,
"loss": 0.4644,
"step": 20200
},
{
"epoch": 1.89,
"eval_loss": 0.17795561254024506,
"eval_runtime": 1276.663,
"eval_samples_per_second": 8.957,
"eval_steps_per_second": 1.12,
"eval_wer": 0.22774553445652787,
"step": 20200
},
{
"epoch": 1.91,
"learning_rate": 0.00024172834684112876,
"loss": 0.4516,
"step": 20400
},
{
"epoch": 1.91,
"eval_loss": 0.18295042216777802,
"eval_runtime": 1278.8615,
"eval_samples_per_second": 8.942,
"eval_steps_per_second": 1.118,
"eval_wer": 0.23694145489378488,
"step": 20400
},
{
"epoch": 1.93,
"learning_rate": 0.0002411424665560004,
"loss": 0.4656,
"step": 20600
},
{
"epoch": 1.93,
"eval_loss": 0.17588302493095398,
"eval_runtime": 1272.4536,
"eval_samples_per_second": 8.987,
"eval_steps_per_second": 1.124,
"eval_wer": 0.22738491012565504,
"step": 20600
},
{
"epoch": 1.95,
"learning_rate": 0.00024055658627087194,
"loss": 0.4649,
"step": 20800
},
{
"epoch": 1.95,
"eval_loss": 0.1794005036354065,
"eval_runtime": 1274.9253,
"eval_samples_per_second": 8.969,
"eval_steps_per_second": 1.122,
"eval_wer": 0.22744125767735393,
"step": 20800
},
{
"epoch": 2.02,
"learning_rate": 0.0002399736353871692,
"loss": 0.458,
"step": 21000
},
{
"epoch": 2.02,
"eval_loss": 0.18070010840892792,
"eval_runtime": 1348.5976,
"eval_samples_per_second": 8.479,
"eval_steps_per_second": 1.06,
"eval_wer": 0.23123908266185833,
"step": 21000
},
{
"epoch": 2.04,
"learning_rate": 0.0002393877551020408,
"loss": 0.4605,
"step": 21200
},
{
"epoch": 2.04,
"eval_loss": 0.1788109391927719,
"eval_runtime": 1335.4279,
"eval_samples_per_second": 8.563,
"eval_steps_per_second": 1.071,
"eval_wer": 0.22942469149715444,
"step": 21200
},
{
"epoch": 2.06,
"learning_rate": 0.00023880187481691237,
"loss": 0.446,
"step": 21400
},
{
"epoch": 2.06,
"eval_loss": 0.17524349689483643,
"eval_runtime": 1337.1415,
"eval_samples_per_second": 8.552,
"eval_steps_per_second": 1.069,
"eval_wer": 0.22274187186566743,
"step": 21400
},
{
"epoch": 2.08,
"learning_rate": 0.00023821599453178398,
"loss": 0.4442,
"step": 21600
},
{
"epoch": 2.08,
"eval_loss": 0.16901686787605286,
"eval_runtime": 1340.3966,
"eval_samples_per_second": 8.531,
"eval_steps_per_second": 1.067,
"eval_wer": 0.21865103961232885,
"step": 21600
},
{
"epoch": 2.1,
"learning_rate": 0.00023763011424665558,
"loss": 0.4557,
"step": 21800
},
{
"epoch": 2.1,
"eval_loss": 0.1691495031118393,
"eval_runtime": 1342.8042,
"eval_samples_per_second": 8.516,
"eval_steps_per_second": 1.065,
"eval_wer": 0.21790725192990365,
"step": 21800
},
{
"epoch": 2.12,
"learning_rate": 0.00023704423396152716,
"loss": 0.4435,
"step": 22000
},
{
"epoch": 2.12,
"eval_loss": 0.17447154223918915,
"eval_runtime": 1342.6406,
"eval_samples_per_second": 8.517,
"eval_steps_per_second": 1.065,
"eval_wer": 0.21763678368174902,
"step": 22000
},
{
"epoch": 2.14,
"learning_rate": 0.00023645835367639876,
"loss": 0.4427,
"step": 22200
},
{
"epoch": 2.14,
"eval_loss": 0.16724492609500885,
"eval_runtime": 1348.4035,
"eval_samples_per_second": 8.48,
"eval_steps_per_second": 1.061,
"eval_wer": 0.2169944215923818,
"step": 22200
},
{
"epoch": 2.16,
"learning_rate": 0.00023587247339127036,
"loss": 0.4439,
"step": 22400
},
{
"epoch": 2.16,
"eval_loss": 0.16558879613876343,
"eval_runtime": 1349.3597,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.06,
"eval_wer": 0.2161153997858793,
"step": 22400
},
{
"epoch": 2.17,
"learning_rate": 0.00023528659310614194,
"loss": 0.4416,
"step": 22600
},
{
"epoch": 2.17,
"eval_loss": 0.1659516543149948,
"eval_runtime": 1345.2434,
"eval_samples_per_second": 8.5,
"eval_steps_per_second": 1.063,
"eval_wer": 0.21102158111230068,
"step": 22600
},
{
"epoch": 2.19,
"learning_rate": 0.00023470071282101355,
"loss": 0.434,
"step": 22800
},
{
"epoch": 2.19,
"eval_loss": 0.16529063880443573,
"eval_runtime": 1343.6004,
"eval_samples_per_second": 8.511,
"eval_steps_per_second": 1.064,
"eval_wer": 0.21015382881613795,
"step": 22800
},
{
"epoch": 2.21,
"learning_rate": 0.00023411483253588512,
"loss": 0.4431,
"step": 23000
},
{
"epoch": 2.21,
"eval_loss": 0.16421248018741608,
"eval_runtime": 1343.5764,
"eval_samples_per_second": 8.511,
"eval_steps_per_second": 1.064,
"eval_wer": 0.2060742660731391,
"step": 23000
},
{
"epoch": 2.23,
"learning_rate": 0.00023352895225075675,
"loss": 0.4328,
"step": 23200
},
{
"epoch": 2.23,
"eval_loss": 0.16530516743659973,
"eval_runtime": 1340.835,
"eval_samples_per_second": 8.528,
"eval_steps_per_second": 1.066,
"eval_wer": 0.2064123513833324,
"step": 23200
},
{
"epoch": 2.25,
"learning_rate": 0.00023294307196562836,
"loss": 0.4291,
"step": 23400
},
{
"epoch": 2.25,
"eval_loss": 0.16716133058071136,
"eval_runtime": 1349.4559,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.06,
"eval_wer": 0.20953400574745026,
"step": 23400
},
{
"epoch": 2.27,
"learning_rate": 0.00023235719168049993,
"loss": 0.4249,
"step": 23600
},
{
"epoch": 2.27,
"eval_loss": 0.1660962998867035,
"eval_runtime": 1342.5077,
"eval_samples_per_second": 8.518,
"eval_steps_per_second": 1.065,
"eval_wer": 0.20847467177551135,
"step": 23600
},
{
"epoch": 2.29,
"learning_rate": 0.00023177131139537154,
"loss": 0.4476,
"step": 23800
},
{
"epoch": 2.29,
"eval_loss": 0.167561873793602,
"eval_runtime": 1343.4696,
"eval_samples_per_second": 8.512,
"eval_steps_per_second": 1.064,
"eval_wer": 0.21436862568321408,
"step": 23800
},
{
"epoch": 2.31,
"learning_rate": 0.00023118543111024314,
"loss": 0.4246,
"step": 24000
},
{
"epoch": 2.31,
"eval_loss": 0.1651725172996521,
"eval_runtime": 1345.4703,
"eval_samples_per_second": 8.499,
"eval_steps_per_second": 1.063,
"eval_wer": 0.21284724178734435,
"step": 24000
},
{
"epoch": 2.33,
"learning_rate": 0.00023060248022654034,
"loss": 0.445,
"step": 24200
},
{
"epoch": 2.33,
"eval_loss": 0.16498707234859467,
"eval_runtime": 1347.0845,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.062,
"eval_wer": 0.2074716853552713,
"step": 24200
},
{
"epoch": 2.35,
"learning_rate": 0.00023001659994141194,
"loss": 0.4303,
"step": 24400
},
{
"epoch": 2.35,
"eval_loss": 0.15905718505382538,
"eval_runtime": 1346.9157,
"eval_samples_per_second": 8.49,
"eval_steps_per_second": 1.062,
"eval_wer": 0.20397813714994084,
"step": 24400
},
{
"epoch": 2.37,
"learning_rate": 0.00022943071965628354,
"loss": 0.4194,
"step": 24600
},
{
"epoch": 2.37,
"eval_loss": 0.1634632647037506,
"eval_runtime": 1345.7282,
"eval_samples_per_second": 8.497,
"eval_steps_per_second": 1.063,
"eval_wer": 0.20863244492026822,
"step": 24600
},
{
"epoch": 2.39,
"learning_rate": 0.00022884483937115512,
"loss": 0.4211,
"step": 24800
},
{
"epoch": 2.39,
"eval_loss": 0.16573943197727203,
"eval_runtime": 1346.4203,
"eval_samples_per_second": 8.493,
"eval_steps_per_second": 1.062,
"eval_wer": 0.21404180988336058,
"step": 24800
},
{
"epoch": 2.41,
"learning_rate": 0.00022825895908602673,
"loss": 0.4238,
"step": 25000
},
{
"epoch": 2.41,
"eval_loss": 0.16177457571029663,
"eval_runtime": 1353.3476,
"eval_samples_per_second": 8.449,
"eval_steps_per_second": 1.057,
"eval_wer": 0.20668281963148702,
"step": 25000
},
{
"epoch": 2.43,
"learning_rate": 0.00022767307880089836,
"loss": 0.4229,
"step": 25200
},
{
"epoch": 2.43,
"eval_loss": 0.1606961190700531,
"eval_runtime": 1347.2789,
"eval_samples_per_second": 8.487,
"eval_steps_per_second": 1.061,
"eval_wer": 0.20163407899926747,
"step": 25200
},
{
"epoch": 2.45,
"learning_rate": 0.0002270871985157699,
"loss": 0.434,
"step": 25400
},
{
"epoch": 2.45,
"eval_loss": 0.1586761772632599,
"eval_runtime": 1345.6532,
"eval_samples_per_second": 8.498,
"eval_steps_per_second": 1.063,
"eval_wer": 0.19963937566912718,
"step": 25400
},
{
"epoch": 2.47,
"learning_rate": 0.00022650131823064154,
"loss": 0.4232,
"step": 25600
},
{
"epoch": 2.47,
"eval_loss": 0.15713459253311157,
"eval_runtime": 1346.3424,
"eval_samples_per_second": 8.493,
"eval_steps_per_second": 1.062,
"eval_wer": 0.20052966698596947,
"step": 25600
},
{
"epoch": 2.49,
"learning_rate": 0.0002259154379455131,
"loss": 0.4132,
"step": 25800
},
{
"epoch": 2.49,
"eval_loss": 0.15517787635326385,
"eval_runtime": 1347.0293,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.062,
"eval_wer": 0.2024680227644109,
"step": 25800
},
{
"epoch": 2.51,
"learning_rate": 0.00022532955766038472,
"loss": 0.4239,
"step": 26000
},
{
"epoch": 2.51,
"eval_loss": 0.15804125368595123,
"eval_runtime": 1349.3993,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.06,
"eval_wer": 0.20016904265509664,
"step": 26000
},
{
"epoch": 2.52,
"learning_rate": 0.00022474367737525632,
"loss": 0.4097,
"step": 26200
},
{
"epoch": 2.52,
"eval_loss": 0.1611405611038208,
"eval_runtime": 1344.7866,
"eval_samples_per_second": 8.503,
"eval_steps_per_second": 1.063,
"eval_wer": 0.20251310080576998,
"step": 26200
},
{
"epoch": 2.54,
"learning_rate": 0.00022416072649155354,
"loss": 0.3975,
"step": 26400
},
{
"epoch": 2.54,
"eval_loss": 0.15802615880966187,
"eval_runtime": 1349.3436,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.06,
"eval_wer": 0.20389925057756242,
"step": 26400
},
{
"epoch": 2.56,
"learning_rate": 0.00022357484620642512,
"loss": 0.418,
"step": 26600
},
{
"epoch": 2.56,
"eval_loss": 0.1567668914794922,
"eval_runtime": 1346.9229,
"eval_samples_per_second": 8.49,
"eval_steps_per_second": 1.062,
"eval_wer": 0.20108187299261848,
"step": 26600
},
{
"epoch": 2.58,
"learning_rate": 0.00022298896592129672,
"loss": 0.4126,
"step": 26800
},
{
"epoch": 2.58,
"eval_loss": 0.15674176812171936,
"eval_runtime": 1347.6959,
"eval_samples_per_second": 8.485,
"eval_steps_per_second": 1.061,
"eval_wer": 0.19748689919423001,
"step": 26800
},
{
"epoch": 2.6,
"learning_rate": 0.0002224030856361683,
"loss": 0.4227,
"step": 27000
},
{
"epoch": 2.6,
"eval_loss": 0.15419313311576843,
"eval_runtime": 1347.3912,
"eval_samples_per_second": 8.487,
"eval_steps_per_second": 1.061,
"eval_wer": 0.19683326759452302,
"step": 27000
},
{
"epoch": 2.62,
"learning_rate": 0.0002218172053510399,
"loss": 0.4176,
"step": 27200
},
{
"epoch": 2.62,
"eval_loss": 0.1559024453163147,
"eval_runtime": 1346.8455,
"eval_samples_per_second": 8.49,
"eval_steps_per_second": 1.062,
"eval_wer": 0.19721643094607538,
"step": 27200
},
{
"epoch": 2.64,
"learning_rate": 0.00022123132506591154,
"loss": 0.4158,
"step": 27400
},
{
"epoch": 2.64,
"eval_loss": 0.15258029103279114,
"eval_runtime": 1345.1608,
"eval_samples_per_second": 8.501,
"eval_steps_per_second": 1.063,
"eval_wer": 0.1984673465937905,
"step": 27400
},
{
"epoch": 2.66,
"learning_rate": 0.00022064544478078309,
"loss": 0.4064,
"step": 27600
},
{
"epoch": 2.66,
"eval_loss": 0.1543867439031601,
"eval_runtime": 1350.12,
"eval_samples_per_second": 8.47,
"eval_steps_per_second": 1.059,
"eval_wer": 0.19683326759452302,
"step": 27600
},
{
"epoch": 2.68,
"learning_rate": 0.00022005956449565472,
"loss": 0.4054,
"step": 27800
},
{
"epoch": 2.68,
"eval_loss": 0.1523013412952423,
"eval_runtime": 1347.6703,
"eval_samples_per_second": 8.485,
"eval_steps_per_second": 1.061,
"eval_wer": 0.19182960500366258,
"step": 27800
},
{
"epoch": 2.7,
"learning_rate": 0.00021947368421052632,
"loss": 0.4046,
"step": 28000
},
{
"epoch": 2.7,
"eval_loss": 0.15553198754787445,
"eval_runtime": 1346.2686,
"eval_samples_per_second": 8.494,
"eval_steps_per_second": 1.062,
"eval_wer": 0.19630360060855356,
"step": 28000
},
{
"epoch": 2.72,
"learning_rate": 0.0002188878039253979,
"loss": 0.4052,
"step": 28200
},
{
"epoch": 2.72,
"eval_loss": 0.15202964842319489,
"eval_runtime": 1350.4067,
"eval_samples_per_second": 8.468,
"eval_steps_per_second": 1.059,
"eval_wer": 0.19546965684341017,
"step": 28200
},
{
"epoch": 2.74,
"learning_rate": 0.0002183019236402695,
"loss": 0.4139,
"step": 28400
},
{
"epoch": 2.74,
"eval_loss": 0.1537465751171112,
"eval_runtime": 1348.6125,
"eval_samples_per_second": 8.479,
"eval_steps_per_second": 1.06,
"eval_wer": 0.19421874119569504,
"step": 28400
},
{
"epoch": 2.76,
"learning_rate": 0.00021771604335514108,
"loss": 0.4043,
"step": 28600
},
{
"epoch": 2.76,
"eval_loss": 0.15482832491397858,
"eval_runtime": 1353.2391,
"eval_samples_per_second": 8.45,
"eval_steps_per_second": 1.057,
"eval_wer": 0.1914013636107511,
"step": 28600
},
{
"epoch": 2.78,
"learning_rate": 0.00021713016307001268,
"loss": 0.4028,
"step": 28800
},
{
"epoch": 2.78,
"eval_loss": 0.15318334102630615,
"eval_runtime": 1349.2472,
"eval_samples_per_second": 8.475,
"eval_steps_per_second": 1.06,
"eval_wer": 0.19257339268608778,
"step": 28800
},
{
"epoch": 2.8,
"learning_rate": 0.0002165442827848843,
"loss": 0.4195,
"step": 29000
},
{
"epoch": 2.8,
"eval_loss": 0.15186063945293427,
"eval_runtime": 1355.3879,
"eval_samples_per_second": 8.437,
"eval_steps_per_second": 1.055,
"eval_wer": 0.19338479743055165,
"step": 29000
},
{
"epoch": 2.82,
"learning_rate": 0.00021595840249975586,
"loss": 0.4086,
"step": 29200
},
{
"epoch": 2.82,
"eval_loss": 0.1497160643339157,
"eval_runtime": 1351.97,
"eval_samples_per_second": 8.458,
"eval_steps_per_second": 1.058,
"eval_wer": 0.19105200879021805,
"step": 29200
},
{
"epoch": 2.84,
"learning_rate": 0.00021537252221462747,
"loss": 0.39,
"step": 29400
},
{
"epoch": 2.84,
"eval_loss": 0.1531924307346344,
"eval_runtime": 1349.4993,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.06,
"eval_wer": 0.1928889389756015,
"step": 29400
},
{
"epoch": 2.86,
"learning_rate": 0.00021478957133092472,
"loss": 0.3936,
"step": 29600
},
{
"epoch": 2.86,
"eval_loss": 0.14919565618038177,
"eval_runtime": 1346.555,
"eval_samples_per_second": 8.492,
"eval_steps_per_second": 1.062,
"eval_wer": 0.18807685806051727,
"step": 29600
},
{
"epoch": 2.87,
"learning_rate": 0.00021420369104579627,
"loss": 0.4065,
"step": 29800
},
{
"epoch": 2.87,
"eval_loss": 0.14806747436523438,
"eval_runtime": 1359.5314,
"eval_samples_per_second": 8.411,
"eval_steps_per_second": 1.052,
"eval_wer": 0.187738772750324,
"step": 29800
},
{
"epoch": 2.89,
"learning_rate": 0.0002136178107606679,
"loss": 0.4047,
"step": 30000
},
{
"epoch": 2.89,
"eval_loss": 0.1506689190864563,
"eval_runtime": 1347.9533,
"eval_samples_per_second": 8.483,
"eval_steps_per_second": 1.061,
"eval_wer": 0.192764974361864,
"step": 30000
},
{
"epoch": 2.02,
"learning_rate": 0.0002130319304755395,
"loss": 0.3972,
"step": 30200
},
{
"epoch": 2.02,
"eval_loss": 0.14971239864826202,
"eval_runtime": 1295.4974,
"eval_samples_per_second": 8.827,
"eval_steps_per_second": 1.104,
"eval_wer": 0.18893334084634023,
"step": 30200
},
{
"epoch": 2.04,
"learning_rate": 0.00021244605019041108,
"loss": 0.3955,
"step": 30400
},
{
"epoch": 2.04,
"eval_loss": 0.15231847763061523,
"eval_runtime": 1286.7728,
"eval_samples_per_second": 8.887,
"eval_steps_per_second": 1.111,
"eval_wer": 0.1934974925339494,
"step": 30400
},
{
"epoch": 2.06,
"learning_rate": 0.00021186016990528268,
"loss": 0.3864,
"step": 30600
},
{
"epoch": 2.06,
"eval_loss": 0.14847034215927124,
"eval_runtime": 1289.1638,
"eval_samples_per_second": 8.87,
"eval_steps_per_second": 1.109,
"eval_wer": 0.1906688454386657,
"step": 30600
},
{
"epoch": 2.08,
"learning_rate": 0.00021127428962015426,
"loss": 0.3847,
"step": 30800
},
{
"epoch": 2.08,
"eval_loss": 0.14542284607887268,
"eval_runtime": 1293.2483,
"eval_samples_per_second": 8.842,
"eval_steps_per_second": 1.106,
"eval_wer": 0.18785146785372175,
"step": 30800
},
{
"epoch": 2.1,
"learning_rate": 0.00021068840933502586,
"loss": 0.3971,
"step": 31000
},
{
"epoch": 2.1,
"eval_loss": 0.14737120270729065,
"eval_runtime": 1285.34,
"eval_samples_per_second": 8.896,
"eval_steps_per_second": 1.113,
"eval_wer": 0.18689355947484082,
"step": 31000
},
{
"epoch": 2.12,
"learning_rate": 0.00021010252904989747,
"loss": 0.3945,
"step": 31200
},
{
"epoch": 2.12,
"eval_loss": 0.14705486595630646,
"eval_runtime": 1285.8175,
"eval_samples_per_second": 8.893,
"eval_steps_per_second": 1.112,
"eval_wer": 0.18310700400067617,
"step": 31200
},
{
"epoch": 2.14,
"learning_rate": 0.00020951664876476904,
"loss": 0.3921,
"step": 31400
},
{
"epoch": 2.14,
"eval_loss": 0.14592072367668152,
"eval_runtime": 1297.0191,
"eval_samples_per_second": 8.816,
"eval_steps_per_second": 1.103,
"eval_wer": 0.18582295599256213,
"step": 31400
},
{
"epoch": 2.16,
"learning_rate": 0.00020893076847964065,
"loss": 0.3884,
"step": 31600
},
{
"epoch": 2.16,
"eval_loss": 0.14477235078811646,
"eval_runtime": 1294.3727,
"eval_samples_per_second": 8.834,
"eval_steps_per_second": 1.105,
"eval_wer": 0.18609342424071673,
"step": 31600
},
{
"epoch": 2.17,
"learning_rate": 0.00020834488819451225,
"loss": 0.3834,
"step": 31800
},
{
"epoch": 2.17,
"eval_loss": 0.14469768106937408,
"eval_runtime": 1297.5153,
"eval_samples_per_second": 8.813,
"eval_steps_per_second": 1.102,
"eval_wer": 0.18483123908266186,
"step": 31800
},
{
"epoch": 2.19,
"learning_rate": 0.00020776193731080944,
"loss": 0.382,
"step": 32000
},
{
"epoch": 2.19,
"eval_loss": 0.14314468204975128,
"eval_runtime": 1293.9163,
"eval_samples_per_second": 8.838,
"eval_steps_per_second": 1.105,
"eval_wer": 0.17969234236772413,
"step": 32000
},
{
"epoch": 2.21,
"learning_rate": 0.00020717605702568108,
"loss": 0.3847,
"step": 32200
},
{
"epoch": 2.21,
"eval_loss": 0.14419673383235931,
"eval_runtime": 1295.5312,
"eval_samples_per_second": 8.826,
"eval_steps_per_second": 1.104,
"eval_wer": 0.18103341409815743,
"step": 32200
},
{
"epoch": 2.23,
"learning_rate": 0.0002065931061419783,
"loss": 0.3824,
"step": 32400
},
{
"epoch": 2.23,
"eval_loss": 0.14198584854602814,
"eval_runtime": 1291.5798,
"eval_samples_per_second": 8.853,
"eval_steps_per_second": 1.107,
"eval_wer": 0.1794218741195695,
"step": 32400
},
{
"epoch": 2.25,
"learning_rate": 0.0002060072258568499,
"loss": 0.375,
"step": 32600
},
{
"epoch": 2.25,
"eval_loss": 0.1454899162054062,
"eval_runtime": 1296.0759,
"eval_samples_per_second": 8.823,
"eval_steps_per_second": 1.103,
"eval_wer": 0.1824984504423283,
"step": 32600
},
{
"epoch": 2.27,
"learning_rate": 0.00020542134557172148,
"loss": 0.3649,
"step": 32800
},
{
"epoch": 2.27,
"eval_loss": 0.14184387028217316,
"eval_runtime": 1293.9484,
"eval_samples_per_second": 8.837,
"eval_steps_per_second": 1.105,
"eval_wer": 0.17908378880937623,
"step": 32800
},
{
"epoch": 2.29,
"learning_rate": 0.00020483546528659308,
"loss": 0.3835,
"step": 33000
},
{
"epoch": 2.29,
"eval_loss": 0.14400140941143036,
"eval_runtime": 1291.8948,
"eval_samples_per_second": 8.851,
"eval_steps_per_second": 1.107,
"eval_wer": 0.18164196765650534,
"step": 33000
},
{
"epoch": 2.31,
"learning_rate": 0.00020424958500146466,
"loss": 0.3708,
"step": 33200
},
{
"epoch": 2.31,
"eval_loss": 0.14257806539535522,
"eval_runtime": 1287.163,
"eval_samples_per_second": 8.884,
"eval_steps_per_second": 1.111,
"eval_wer": 0.181055953118837,
"step": 33200
},
{
"epoch": 2.33,
"learning_rate": 0.00020366370471633626,
"loss": 0.3903,
"step": 33400
},
{
"epoch": 2.33,
"eval_loss": 0.14411504566669464,
"eval_runtime": 1294.8904,
"eval_samples_per_second": 8.831,
"eval_steps_per_second": 1.104,
"eval_wer": 0.18088691046374036,
"step": 33400
},
{
"epoch": 2.35,
"learning_rate": 0.0002030778244312079,
"loss": 0.3901,
"step": 33600
},
{
"epoch": 2.35,
"eval_loss": 0.14472506940364838,
"eval_runtime": 1287.7937,
"eval_samples_per_second": 8.88,
"eval_steps_per_second": 1.11,
"eval_wer": 0.18023327886403337,
"step": 33600
},
{
"epoch": 2.37,
"learning_rate": 0.00020249194414607944,
"loss": 0.372,
"step": 33800
},
{
"epoch": 2.37,
"eval_loss": 0.14397132396697998,
"eval_runtime": 1288.3131,
"eval_samples_per_second": 8.876,
"eval_steps_per_second": 1.11,
"eval_wer": 0.17937679607821042,
"step": 33800
},
{
"epoch": 2.39,
"learning_rate": 0.00020190606386095107,
"loss": 0.373,
"step": 34000
},
{
"epoch": 2.39,
"eval_loss": 0.14335143566131592,
"eval_runtime": 1294.3533,
"eval_samples_per_second": 8.835,
"eval_steps_per_second": 1.105,
"eval_wer": 0.17952329971262748,
"step": 34000
},
{
"epoch": 2.41,
"learning_rate": 0.00020132018357582268,
"loss": 0.382,
"step": 34200
},
{
"epoch": 2.41,
"eval_loss": 0.14260776340961456,
"eval_runtime": 1294.0006,
"eval_samples_per_second": 8.837,
"eval_steps_per_second": 1.105,
"eval_wer": 0.17981630698146164,
"step": 34200
},
{
"epoch": 2.43,
"learning_rate": 0.00020073430329069426,
"loss": 0.3735,
"step": 34400
},
{
"epoch": 2.43,
"eval_loss": 0.14174862205982208,
"eval_runtime": 1291.0684,
"eval_samples_per_second": 8.857,
"eval_steps_per_second": 1.108,
"eval_wer": 0.17719051107229392,
"step": 34400
},
{
"epoch": 2.45,
"learning_rate": 0.00020014842300556586,
"loss": 0.3919,
"step": 34600
},
{
"epoch": 2.45,
"eval_loss": 0.14172929525375366,
"eval_runtime": 1295.6993,
"eval_samples_per_second": 8.825,
"eval_steps_per_second": 1.104,
"eval_wer": 0.18066152025694485,
"step": 34600
},
{
"epoch": 2.47,
"learning_rate": 0.00019956254272043744,
"loss": 0.3694,
"step": 34800
},
{
"epoch": 2.47,
"eval_loss": 0.1413334310054779,
"eval_runtime": 1291.4925,
"eval_samples_per_second": 8.854,
"eval_steps_per_second": 1.107,
"eval_wer": 0.1777990646306418,
"step": 34800
},
{
"epoch": 2.49,
"learning_rate": 0.00019897666243530904,
"loss": 0.3747,
"step": 35000
},
{
"epoch": 2.49,
"eval_loss": 0.14046485722064972,
"eval_runtime": 1291.2845,
"eval_samples_per_second": 8.856,
"eval_steps_per_second": 1.107,
"eval_wer": 0.1763565673071505,
"step": 35000
},
{
"epoch": 2.51,
"learning_rate": 0.00019839078215018064,
"loss": 0.3728,
"step": 35200
},
{
"epoch": 2.51,
"eval_loss": 0.14019745588302612,
"eval_runtime": 1277.9327,
"eval_samples_per_second": 8.948,
"eval_steps_per_second": 1.119,
"eval_wer": 0.17606356003831633,
"step": 35200
},
{
"epoch": 2.52,
"learning_rate": 0.00019780490186505222,
"loss": 0.3604,
"step": 35400
},
{
"epoch": 2.52,
"eval_loss": 0.14010049402713776,
"eval_runtime": 1269.2145,
"eval_samples_per_second": 9.01,
"eval_steps_per_second": 1.127,
"eval_wer": 0.1762551417140925,
"step": 35400
},
{
"epoch": 2.54,
"learning_rate": 0.00019721902157992383,
"loss": 0.354,
"step": 35600
},
{
"epoch": 2.54,
"eval_loss": 0.13699594140052795,
"eval_runtime": 1266.9571,
"eval_samples_per_second": 9.026,
"eval_steps_per_second": 1.129,
"eval_wer": 0.17405758719783626,
"step": 35600
},
{
"epoch": 2.56,
"learning_rate": 0.00019663314129479543,
"loss": 0.3731,
"step": 35800
},
{
"epoch": 2.56,
"eval_loss": 0.137326180934906,
"eval_runtime": 1281.6045,
"eval_samples_per_second": 8.922,
"eval_steps_per_second": 1.116,
"eval_wer": 0.1728292105708007,
"step": 35800
},
{
"epoch": 2.58,
"learning_rate": 0.000196047261009667,
"loss": 0.3704,
"step": 36000
},
{
"epoch": 2.58,
"eval_loss": 0.14074836671352386,
"eval_runtime": 1278.0727,
"eval_samples_per_second": 8.947,
"eval_steps_per_second": 1.119,
"eval_wer": 0.17788922071336,
"step": 36000
},
{
"epoch": 2.6,
"learning_rate": 0.00019546431012596425,
"loss": 0.3737,
"step": 36200
},
{
"epoch": 2.6,
"eval_loss": 0.1350381225347519,
"eval_runtime": 1289.4945,
"eval_samples_per_second": 8.868,
"eval_steps_per_second": 1.109,
"eval_wer": 0.1738547360117203,
"step": 36200
},
{
"epoch": 2.62,
"learning_rate": 0.00019487842984083586,
"loss": 0.3638,
"step": 36400
},
{
"epoch": 2.62,
"eval_loss": 0.13623464107513428,
"eval_runtime": 1306.2961,
"eval_samples_per_second": 8.754,
"eval_steps_per_second": 1.095,
"eval_wer": 0.1758494393418606,
"step": 36400
},
{
"epoch": 2.64,
"learning_rate": 0.00019429254955570743,
"loss": 0.3726,
"step": 36600
},
{
"epoch": 2.64,
"eval_loss": 0.1357557475566864,
"eval_runtime": 1277.9297,
"eval_samples_per_second": 8.948,
"eval_steps_per_second": 1.119,
"eval_wer": 0.17244604721924833,
"step": 36600
},
{
"epoch": 2.66,
"learning_rate": 0.00019370666927057904,
"loss": 0.362,
"step": 36800
},
{
"epoch": 2.66,
"eval_loss": 0.136088564991951,
"eval_runtime": 1273.2522,
"eval_samples_per_second": 8.981,
"eval_steps_per_second": 1.123,
"eval_wer": 0.17147686933002762,
"step": 36800
},
{
"epoch": 2.68,
"learning_rate": 0.00019312078898545064,
"loss": 0.3707,
"step": 37000
},
{
"epoch": 2.68,
"eval_loss": 0.13885775208473206,
"eval_runtime": 1286.0056,
"eval_samples_per_second": 8.892,
"eval_steps_per_second": 1.112,
"eval_wer": 0.17355045923254633,
"step": 37000
},
{
"epoch": 2.7,
"learning_rate": 0.00019253490870032222,
"loss": 0.3682,
"step": 37200
},
{
"epoch": 2.7,
"eval_loss": 0.13624690473079681,
"eval_runtime": 1286.554,
"eval_samples_per_second": 8.888,
"eval_steps_per_second": 1.111,
"eval_wer": 0.17115005353017412,
"step": 37200
},
{
"epoch": 2.72,
"learning_rate": 0.00019194902841519382,
"loss": 0.3553,
"step": 37400
},
{
"epoch": 2.72,
"eval_loss": 0.13790255784988403,
"eval_runtime": 1291.8798,
"eval_samples_per_second": 8.851,
"eval_steps_per_second": 1.107,
"eval_wer": 0.17359553727390545,
"step": 37400
},
{
"epoch": 2.74,
"learning_rate": 0.0001913631481300654,
"loss": 0.3721,
"step": 37600
},
{
"epoch": 2.74,
"eval_loss": 0.1351141631603241,
"eval_runtime": 1288.5954,
"eval_samples_per_second": 8.874,
"eval_steps_per_second": 1.11,
"eval_wer": 0.16746492364906745,
"step": 37600
},
{
"epoch": 2.76,
"learning_rate": 0.000190777267844937,
"loss": 0.3615,
"step": 37800
},
{
"epoch": 2.76,
"eval_loss": 0.13291703164577484,
"eval_runtime": 1285.1295,
"eval_samples_per_second": 8.898,
"eval_steps_per_second": 1.113,
"eval_wer": 0.1660449653462557,
"step": 37800
},
{
"epoch": 2.78,
"learning_rate": 0.0001901913875598086,
"loss": 0.3484,
"step": 38000
},
{
"epoch": 2.78,
"eval_loss": 0.1341363489627838,
"eval_runtime": 1287.2816,
"eval_samples_per_second": 8.883,
"eval_steps_per_second": 1.111,
"eval_wer": 0.16912154166901447,
"step": 38000
},
{
"epoch": 2.8,
"learning_rate": 0.00018960550727468019,
"loss": 0.3738,
"step": 38200
},
{
"epoch": 2.8,
"eval_loss": 0.13387584686279297,
"eval_runtime": 1267.1408,
"eval_samples_per_second": 9.024,
"eval_steps_per_second": 1.129,
"eval_wer": 0.1686031441933848,
"step": 38200
},
{
"epoch": 2.82,
"learning_rate": 0.0001890196269895518,
"loss": 0.3599,
"step": 38400
},
{
"epoch": 2.82,
"eval_loss": 0.13417528569698334,
"eval_runtime": 1259.8892,
"eval_samples_per_second": 9.076,
"eval_steps_per_second": 1.135,
"eval_wer": 0.16907646362765538,
"step": 38400
},
{
"epoch": 2.84,
"learning_rate": 0.0001884337467044234,
"loss": 0.3534,
"step": 38600
},
{
"epoch": 2.84,
"eval_loss": 0.13447332382202148,
"eval_runtime": 1271.9609,
"eval_samples_per_second": 8.99,
"eval_steps_per_second": 1.124,
"eval_wer": 0.1683664844762495,
"step": 38600
},
{
"epoch": 2.86,
"learning_rate": 0.00018784786641929497,
"loss": 0.3502,
"step": 38800
},
{
"epoch": 2.86,
"eval_loss": 0.13398751616477966,
"eval_runtime": 1260.4382,
"eval_samples_per_second": 9.072,
"eval_steps_per_second": 1.135,
"eval_wer": 0.16712683833887418,
"step": 38800
},
{
"epoch": 2.87,
"learning_rate": 0.00018726198613416658,
"loss": 0.3597,
"step": 39000
},
{
"epoch": 2.87,
"eval_loss": 0.1342509537935257,
"eval_runtime": 1268.7112,
"eval_samples_per_second": 9.013,
"eval_steps_per_second": 1.127,
"eval_wer": 0.17053023046148644,
"step": 39000
},
{
"epoch": 2.89,
"learning_rate": 0.00018667610584903815,
"loss": 0.3558,
"step": 39200
},
{
"epoch": 2.89,
"eval_loss": 0.13048462569713593,
"eval_runtime": 1294.9536,
"eval_samples_per_second": 8.83,
"eval_steps_per_second": 1.104,
"eval_wer": 0.1658646531808193,
"step": 39200
},
{
"epoch": 2.91,
"learning_rate": 0.00018609022556390976,
"loss": 0.3685,
"step": 39400
},
{
"epoch": 2.91,
"eval_loss": 0.13240975141525269,
"eval_runtime": 1294.9408,
"eval_samples_per_second": 8.831,
"eval_steps_per_second": 1.104,
"eval_wer": 0.16629289457373078,
"step": 39400
},
{
"epoch": 2.93,
"learning_rate": 0.00018550434527878136,
"loss": 0.3709,
"step": 39600
},
{
"epoch": 2.93,
"eval_loss": 0.13161210715770721,
"eval_runtime": 1282.8283,
"eval_samples_per_second": 8.914,
"eval_steps_per_second": 1.115,
"eval_wer": 0.1704626133994478,
"step": 39600
},
{
"epoch": 3.02,
"learning_rate": 0.00018491846499365294,
"loss": 0.3561,
"step": 39800
},
{
"epoch": 3.02,
"eval_loss": 0.13415904343128204,
"eval_runtime": 1283.3514,
"eval_samples_per_second": 8.91,
"eval_steps_per_second": 1.114,
"eval_wer": 0.16870456978644277,
"step": 39800
},
{
"epoch": 3.04,
"learning_rate": 0.00018433258470852454,
"loss": 0.3465,
"step": 40000
},
{
"epoch": 3.04,
"eval_loss": 0.12848955392837524,
"eval_runtime": 1271.6159,
"eval_samples_per_second": 8.992,
"eval_steps_per_second": 1.125,
"eval_wer": 0.1640051839747563,
"step": 40000
},
{
"epoch": 3.06,
"learning_rate": 0.00018374670442339615,
"loss": 0.3381,
"step": 40200
},
{
"epoch": 3.06,
"eval_loss": 0.13284260034561157,
"eval_runtime": 1266.2009,
"eval_samples_per_second": 9.031,
"eval_steps_per_second": 1.129,
"eval_wer": 0.1692116977517327,
"step": 40200
},
{
"epoch": 3.08,
"learning_rate": 0.00018316082413826772,
"loss": 0.3391,
"step": 40400
},
{
"epoch": 3.08,
"eval_loss": 0.1303485929965973,
"eval_runtime": 1268.7911,
"eval_samples_per_second": 9.013,
"eval_steps_per_second": 1.127,
"eval_wer": 0.16649574575984674,
"step": 40400
},
{
"epoch": 3.1,
"learning_rate": 0.00018257494385313933,
"loss": 0.3657,
"step": 40600
},
{
"epoch": 3.1,
"eval_loss": 0.13046273589134216,
"eval_runtime": 1268.0254,
"eval_samples_per_second": 9.018,
"eval_steps_per_second": 1.128,
"eval_wer": 0.1679945906350369,
"step": 40600
},
{
"epoch": 3.12,
"learning_rate": 0.0001819890635680109,
"loss": 0.3401,
"step": 40800
},
{
"epoch": 3.12,
"eval_loss": 0.12838347256183624,
"eval_runtime": 1274.5116,
"eval_samples_per_second": 8.972,
"eval_steps_per_second": 1.122,
"eval_wer": 0.16308108412689468,
"step": 40800
},
{
"epoch": 3.14,
"learning_rate": 0.0001814031832828825,
"loss": 0.3534,
"step": 41000
},
{
"epoch": 3.14,
"eval_loss": 0.1312979757785797,
"eval_runtime": 1280.3407,
"eval_samples_per_second": 8.931,
"eval_steps_per_second": 1.117,
"eval_wer": 0.16876091733814166,
"step": 41000
},
{
"epoch": 3.16,
"learning_rate": 0.0001808173029977541,
"loss": 0.3451,
"step": 41200
},
{
"epoch": 3.16,
"eval_loss": 0.1285577118396759,
"eval_runtime": 1281.0478,
"eval_samples_per_second": 8.926,
"eval_steps_per_second": 1.116,
"eval_wer": 0.16237110497548882,
"step": 41200
},
{
"epoch": 3.17,
"learning_rate": 0.0001802314227126257,
"loss": 0.3436,
"step": 41400
},
{
"epoch": 3.17,
"eval_loss": 0.1303623467683792,
"eval_runtime": 1282.6637,
"eval_samples_per_second": 8.915,
"eval_steps_per_second": 1.115,
"eval_wer": 0.1643319997746098,
"step": 41400
},
{
"epoch": 3.19,
"learning_rate": 0.0001796455424274973,
"loss": 0.3406,
"step": 41600
},
{
"epoch": 3.19,
"eval_loss": 0.12939453125,
"eval_runtime": 1277.6832,
"eval_samples_per_second": 8.95,
"eval_steps_per_second": 1.119,
"eval_wer": 0.1627993463684003,
"step": 41600
},
{
"epoch": 3.21,
"learning_rate": 0.0001790596621423689,
"loss": 0.3449,
"step": 41800
},
{
"epoch": 3.21,
"eval_loss": 0.12918172776699066,
"eval_runtime": 1279.0857,
"eval_samples_per_second": 8.94,
"eval_steps_per_second": 1.118,
"eval_wer": 0.165627993463684,
"step": 41800
},
{
"epoch": 3.23,
"learning_rate": 0.00017847671125866612,
"loss": 0.3374,
"step": 42000
},
{
"epoch": 3.23,
"eval_loss": 0.1299501359462738,
"eval_runtime": 1278.9732,
"eval_samples_per_second": 8.941,
"eval_steps_per_second": 1.118,
"eval_wer": 0.1630247365751958,
"step": 42000
},
{
"epoch": 3.25,
"learning_rate": 0.00017789083097353772,
"loss": 0.3392,
"step": 42200
},
{
"epoch": 3.25,
"eval_loss": 0.12759089469909668,
"eval_runtime": 1268.8237,
"eval_samples_per_second": 9.012,
"eval_steps_per_second": 1.127,
"eval_wer": 0.16211190623767396,
"step": 42200
},
{
"epoch": 3.27,
"learning_rate": 0.00017730495068840932,
"loss": 0.3234,
"step": 42400
},
{
"epoch": 3.27,
"eval_loss": 0.12891671061515808,
"eval_runtime": 1261.6618,
"eval_samples_per_second": 9.063,
"eval_steps_per_second": 1.133,
"eval_wer": 0.16194286358257734,
"step": 42400
},
{
"epoch": 3.29,
"learning_rate": 0.0001767190704032809,
"loss": 0.3506,
"step": 42600
},
{
"epoch": 3.29,
"eval_loss": 0.1317521631717682,
"eval_runtime": 1268.2708,
"eval_samples_per_second": 9.016,
"eval_steps_per_second": 1.128,
"eval_wer": 0.1603764016453485,
"step": 42600
},
{
"epoch": 3.31,
"learning_rate": 0.0001761331901181525,
"loss": 0.3317,
"step": 42800
},
{
"epoch": 3.31,
"eval_loss": 0.12691594660282135,
"eval_runtime": 1266.6129,
"eval_samples_per_second": 9.028,
"eval_steps_per_second": 1.129,
"eval_wer": 0.16011720290753367,
"step": 42800
},
{
"epoch": 3.33,
"learning_rate": 0.0001755473098330241,
"loss": 0.3412,
"step": 43000
},
{
"epoch": 3.33,
"eval_loss": 0.12849685549736023,
"eval_runtime": 1268.3183,
"eval_samples_per_second": 9.016,
"eval_steps_per_second": 1.127,
"eval_wer": 0.15849439341860597,
"step": 43000
},
{
"epoch": 3.35,
"learning_rate": 0.0001749614295478957,
"loss": 0.3432,
"step": 43200
},
{
"epoch": 3.35,
"eval_loss": 0.12799765169620514,
"eval_runtime": 1270.7987,
"eval_samples_per_second": 8.998,
"eval_steps_per_second": 1.125,
"eval_wer": 0.1610300332450555,
"step": 43200
},
{
"epoch": 3.37,
"learning_rate": 0.0001743755492627673,
"loss": 0.3274,
"step": 43400
},
{
"epoch": 3.37,
"eval_loss": 0.1282772719860077,
"eval_runtime": 1270.8967,
"eval_samples_per_second": 8.998,
"eval_steps_per_second": 1.125,
"eval_wer": 0.15816757761875247,
"step": 43400
},
{
"epoch": 3.39,
"learning_rate": 0.00017378966897763887,
"loss": 0.3378,
"step": 43600
},
{
"epoch": 3.39,
"eval_loss": 0.12611497938632965,
"eval_runtime": 1268.024,
"eval_samples_per_second": 9.018,
"eval_steps_per_second": 1.128,
"eval_wer": 0.15873105313574126,
"step": 43600
},
{
"epoch": 3.41,
"learning_rate": 0.00017320378869251047,
"loss": 0.3335,
"step": 43800
},
{
"epoch": 3.41,
"eval_loss": 0.12488209456205368,
"eval_runtime": 1262.74,
"eval_samples_per_second": 9.056,
"eval_steps_per_second": 1.132,
"eval_wer": 0.157637910632783,
"step": 43800
},
{
"epoch": 3.43,
"learning_rate": 0.00017261790840738208,
"loss": 0.323,
"step": 44000
},
{
"epoch": 3.43,
"eval_loss": 0.1285601556301117,
"eval_runtime": 1264.5781,
"eval_samples_per_second": 9.043,
"eval_steps_per_second": 1.131,
"eval_wer": 0.15807742153603427,
"step": 44000
},
{
"epoch": 3.45,
"learning_rate": 0.00017203202812225365,
"loss": 0.3427,
"step": 44200
},
{
"epoch": 3.45,
"eval_loss": 0.12231270223855972,
"eval_runtime": 1271.7465,
"eval_samples_per_second": 8.992,
"eval_steps_per_second": 1.124,
"eval_wer": 0.15785203132923875,
"step": 44200
},
{
"epoch": 3.47,
"learning_rate": 0.00017144614783712526,
"loss": 0.3276,
"step": 44400
},
{
"epoch": 3.47,
"eval_loss": 0.12326563894748688,
"eval_runtime": 1274.0885,
"eval_samples_per_second": 8.975,
"eval_steps_per_second": 1.122,
"eval_wer": 0.1624725305685468,
"step": 44400
},
{
"epoch": 3.49,
"learning_rate": 0.0001708602675519969,
"loss": 0.3291,
"step": 44600
},
{
"epoch": 3.49,
"eval_loss": 0.12240497022867203,
"eval_runtime": 1272.556,
"eval_samples_per_second": 8.986,
"eval_steps_per_second": 1.124,
"eval_wer": 0.15554178170958471,
"step": 44600
},
{
"epoch": 3.51,
"learning_rate": 0.00017027438726686844,
"loss": 0.3374,
"step": 44800
},
{
"epoch": 3.51,
"eval_loss": 0.12430132925510406,
"eval_runtime": 1271.1476,
"eval_samples_per_second": 8.996,
"eval_steps_per_second": 1.125,
"eval_wer": 0.15789710937059784,
"step": 44800
},
{
"epoch": 3.52,
"learning_rate": 0.00016968850698174007,
"loss": 0.3383,
"step": 45000
},
{
"epoch": 3.52,
"eval_loss": 0.12537476420402527,
"eval_runtime": 1276.5687,
"eval_samples_per_second": 8.958,
"eval_steps_per_second": 1.12,
"eval_wer": 0.15711951315715333,
"step": 45000
},
{
"epoch": 3.54,
"learning_rate": 0.00016910262669661162,
"loss": 0.3231,
"step": 45200
},
{
"epoch": 3.54,
"eval_loss": 0.1274578869342804,
"eval_runtime": 1279.812,
"eval_samples_per_second": 8.935,
"eval_steps_per_second": 1.117,
"eval_wer": 0.1589000957908379,
"step": 45200
},
{
"epoch": 3.56,
"learning_rate": 0.00016851674641148325,
"loss": 0.3265,
"step": 45400
},
{
"epoch": 3.56,
"eval_loss": 0.12590159475803375,
"eval_runtime": 1276.0756,
"eval_samples_per_second": 8.961,
"eval_steps_per_second": 1.121,
"eval_wer": 0.15724347777089084,
"step": 45400
},
{
"epoch": 3.58,
"learning_rate": 0.00016793086612635485,
"loss": 0.3334,
"step": 45600
},
{
"epoch": 3.58,
"eval_loss": 0.12398205697536469,
"eval_runtime": 1283.216,
"eval_samples_per_second": 8.911,
"eval_steps_per_second": 1.114,
"eval_wer": 0.1549895757029357,
"step": 45600
},
{
"epoch": 3.6,
"learning_rate": 0.00016734791524265207,
"loss": 0.3314,
"step": 45800
},
{
"epoch": 3.6,
"eval_loss": 0.12473876029253006,
"eval_runtime": 1280.783,
"eval_samples_per_second": 8.928,
"eval_steps_per_second": 1.117,
"eval_wer": 0.15710824364681356,
"step": 45800
},
{
"epoch": 3.62,
"learning_rate": 0.00016676203495752365,
"loss": 0.3372,
"step": 46000
},
{
"epoch": 3.62,
"eval_loss": 0.1239311620593071,
"eval_runtime": 1282.1393,
"eval_samples_per_second": 8.919,
"eval_steps_per_second": 1.115,
"eval_wer": 0.15447117822730602,
"step": 46000
},
{
"epoch": 3.64,
"learning_rate": 0.00016617615467239526,
"loss": 0.3362,
"step": 46200
},
{
"epoch": 3.64,
"eval_loss": 0.1215914860367775,
"eval_runtime": 1278.6758,
"eval_samples_per_second": 8.943,
"eval_steps_per_second": 1.118,
"eval_wer": 0.15436975263424804,
"step": 46200
},
{
"epoch": 3.66,
"learning_rate": 0.00016559027438726683,
"loss": 0.3209,
"step": 46400
},
{
"epoch": 3.66,
"eval_loss": 0.1207798570394516,
"eval_runtime": 1279.7208,
"eval_samples_per_second": 8.936,
"eval_steps_per_second": 1.117,
"eval_wer": 0.15486561108919816,
"step": 46400
},
{
"epoch": 3.68,
"learning_rate": 0.00016500732350356408,
"loss": 0.3202,
"step": 46600
},
{
"epoch": 3.68,
"eval_loss": 0.11999519914388657,
"eval_runtime": 1274.3631,
"eval_samples_per_second": 8.973,
"eval_steps_per_second": 1.122,
"eval_wer": 0.15501211472361526,
"step": 46600
},
{
"epoch": 3.7,
"learning_rate": 0.00016442144321843568,
"loss": 0.3135,
"step": 46800
},
{
"epoch": 3.7,
"eval_loss": 0.12257663160562515,
"eval_runtime": 1258.8007,
"eval_samples_per_second": 9.084,
"eval_steps_per_second": 1.136,
"eval_wer": 0.15324280160027046,
"step": 46800
},
{
"epoch": 3.72,
"learning_rate": 0.0001638355629333073,
"loss": 0.3148,
"step": 47000
},
{
"epoch": 3.72,
"eval_loss": 0.11898791790008545,
"eval_runtime": 1289.0474,
"eval_samples_per_second": 8.871,
"eval_steps_per_second": 1.109,
"eval_wer": 0.15274694314532034,
"step": 47000
},
{
"epoch": 3.74,
"learning_rate": 0.00016324968264817887,
"loss": 0.3339,
"step": 47200
},
{
"epoch": 3.74,
"eval_loss": 0.12242983281612396,
"eval_runtime": 1285.1481,
"eval_samples_per_second": 8.898,
"eval_steps_per_second": 1.113,
"eval_wer": 0.15426832704119006,
"step": 47200
},
{
"epoch": 3.76,
"learning_rate": 0.00016266380236305047,
"loss": 0.3238,
"step": 47400
},
{
"epoch": 3.76,
"eval_loss": 0.12152837961912155,
"eval_runtime": 1287.6381,
"eval_samples_per_second": 8.881,
"eval_steps_per_second": 1.111,
"eval_wer": 0.15251028342818504,
"step": 47400
},
{
"epoch": 3.78,
"learning_rate": 0.00016207792207792205,
"loss": 0.3141,
"step": 47600
},
{
"epoch": 3.78,
"eval_loss": 0.11933837085962296,
"eval_runtime": 1282.8603,
"eval_samples_per_second": 8.914,
"eval_steps_per_second": 1.115,
"eval_wer": 0.1536034259311433,
"step": 47600
},
{
"epoch": 3.8,
"learning_rate": 0.00016149204179279365,
"loss": 0.3354,
"step": 47800
},
{
"epoch": 3.8,
"eval_loss": 0.12152481079101562,
"eval_runtime": 1280.7316,
"eval_samples_per_second": 8.928,
"eval_steps_per_second": 1.117,
"eval_wer": 0.15500084521327548,
"step": 47800
},
{
"epoch": 3.82,
"learning_rate": 0.00016090616150766525,
"loss": 0.3217,
"step": 48000
},
{
"epoch": 3.82,
"eval_loss": 0.12007062137126923,
"eval_runtime": 1281.3849,
"eval_samples_per_second": 8.924,
"eval_steps_per_second": 1.116,
"eval_wer": 0.15225108469037021,
"step": 48000
},
{
"epoch": 3.84,
"learning_rate": 0.00016032028122253683,
"loss": 0.3248,
"step": 48200
},
{
"epoch": 3.84,
"eval_loss": 0.11909425258636475,
"eval_runtime": 1287.6101,
"eval_samples_per_second": 8.881,
"eval_steps_per_second": 1.111,
"eval_wer": 0.15036907646362765,
"step": 48200
},
{
"epoch": 3.86,
"learning_rate": 0.00015973440093740844,
"loss": 0.3169,
"step": 48400
},
{
"epoch": 3.86,
"eval_loss": 0.12102551758289337,
"eval_runtime": 1285.0012,
"eval_samples_per_second": 8.899,
"eval_steps_per_second": 1.113,
"eval_wer": 0.15103397757367443,
"step": 48400
},
{
"epoch": 3.87,
"learning_rate": 0.00015914852065228,
"loss": 0.3235,
"step": 48600
},
{
"epoch": 3.87,
"eval_loss": 0.12175353616476059,
"eval_runtime": 1286.2751,
"eval_samples_per_second": 8.89,
"eval_steps_per_second": 1.112,
"eval_wer": 0.15386262466895814,
"step": 48600
},
{
"epoch": 3.89,
"learning_rate": 0.00015856264036715162,
"loss": 0.3262,
"step": 48800
},
{
"epoch": 3.89,
"eval_loss": 0.11936228722333908,
"eval_runtime": 1280.7325,
"eval_samples_per_second": 8.928,
"eval_steps_per_second": 1.117,
"eval_wer": 0.15041415450498677,
"step": 48800
},
{
"epoch": 3.91,
"learning_rate": 0.00015797676008202325,
"loss": 0.3183,
"step": 49000
},
{
"epoch": 3.91,
"eval_loss": 0.116153784096241,
"eval_runtime": 1283.8223,
"eval_samples_per_second": 8.907,
"eval_steps_per_second": 1.114,
"eval_wer": 0.14855468529892377,
"step": 49000
},
{
"epoch": 3.93,
"learning_rate": 0.0001573908797968948,
"loss": 0.3229,
"step": 49200
},
{
"epoch": 3.93,
"eval_loss": 0.11911948770284653,
"eval_runtime": 1284.0466,
"eval_samples_per_second": 8.905,
"eval_steps_per_second": 1.114,
"eval_wer": 0.14968163633290132,
"step": 49200
},
{
"epoch": 4.02,
"learning_rate": 0.00015680499951176643,
"loss": 0.322,
"step": 49400
},
{
"epoch": 4.02,
"eval_loss": 0.11941692978143692,
"eval_runtime": 629.3496,
"eval_samples_per_second": 18.17,
"eval_steps_per_second": 2.272,
"eval_wer": 0.15029018989124923,
"step": 49400
},
{
"epoch": 4.04,
"learning_rate": 0.00015621911922663803,
"loss": 0.309,
"step": 49600
},
{
"epoch": 4.04,
"eval_loss": 0.11948557198047638,
"eval_runtime": 625.3187,
"eval_samples_per_second": 18.287,
"eval_steps_per_second": 2.287,
"eval_wer": 0.14937735955372738,
"step": 49600
},
{
"epoch": 4.06,
"learning_rate": 0.0001556332389415096,
"loss": 0.3013,
"step": 49800
},
{
"epoch": 4.06,
"eval_loss": 0.11908197402954102,
"eval_runtime": 625.6323,
"eval_samples_per_second": 18.278,
"eval_steps_per_second": 2.286,
"eval_wer": 0.1490392742435341,
"step": 49800
},
{
"epoch": 4.08,
"learning_rate": 0.00015504735865638121,
"loss": 0.3107,
"step": 50000
},
{
"epoch": 4.08,
"eval_loss": 0.11991952359676361,
"eval_runtime": 618.7466,
"eval_samples_per_second": 18.481,
"eval_steps_per_second": 2.311,
"eval_wer": 0.14963655829154224,
"step": 50000
},
{
"epoch": 4.1,
"learning_rate": 0.00015446440777267843,
"loss": 0.3205,
"step": 50200
},
{
"epoch": 4.1,
"eval_loss": 0.11845077574253082,
"eval_runtime": 622.4777,
"eval_samples_per_second": 18.37,
"eval_steps_per_second": 2.297,
"eval_wer": 0.1494224375950865,
"step": 50200
},
{
"epoch": 4.12,
"learning_rate": 0.00015387852748755,
"loss": 0.3053,
"step": 50400
},
{
"epoch": 4.12,
"eval_loss": 0.11776554584503174,
"eval_runtime": 626.5582,
"eval_samples_per_second": 18.25,
"eval_steps_per_second": 2.282,
"eval_wer": 0.14600777596213443,
"step": 50400
},
{
"epoch": 4.14,
"learning_rate": 0.00015329264720242161,
"loss": 0.3039,
"step": 50600
},
{
"epoch": 4.14,
"eval_loss": 0.11720620095729828,
"eval_runtime": 626.1062,
"eval_samples_per_second": 18.264,
"eval_steps_per_second": 2.284,
"eval_wer": 0.14637966980334705,
"step": 50600
},
{
"epoch": 4.16,
"learning_rate": 0.00015270676691729325,
"loss": 0.3122,
"step": 50800
},
{
"epoch": 4.16,
"eval_loss": 0.11798885464668274,
"eval_runtime": 617.4335,
"eval_samples_per_second": 18.52,
"eval_steps_per_second": 2.316,
"eval_wer": 0.147889784188877,
"step": 50800
},
{
"epoch": 4.17,
"learning_rate": 0.0001521208866321648,
"loss": 0.3144,
"step": 51000
},
{
"epoch": 4.17,
"eval_loss": 0.1195751279592514,
"eval_runtime": 623.8518,
"eval_samples_per_second": 18.33,
"eval_steps_per_second": 2.292,
"eval_wer": 0.15110159463571307,
"step": 51000
},
{
"epoch": 4.19,
"learning_rate": 0.00015153500634703643,
"loss": 0.3075,
"step": 51200
},
{
"epoch": 4.19,
"eval_loss": 0.11787259578704834,
"eval_runtime": 625.9862,
"eval_samples_per_second": 18.267,
"eval_steps_per_second": 2.284,
"eval_wer": 0.14795740125091564,
"step": 51200
},
{
"epoch": 4.21,
"learning_rate": 0.00015094912606190798,
"loss": 0.311,
"step": 51400
},
{
"epoch": 4.21,
"eval_loss": 0.12053581327199936,
"eval_runtime": 618.1157,
"eval_samples_per_second": 18.5,
"eval_steps_per_second": 2.313,
"eval_wer": 0.14891530962979657,
"step": 51400
},
{
"epoch": 4.23,
"learning_rate": 0.0001503632457767796,
"loss": 0.3015,
"step": 51600
},
{
"epoch": 4.23,
"eval_loss": 0.11665117740631104,
"eval_runtime": 622.4687,
"eval_samples_per_second": 18.37,
"eval_steps_per_second": 2.297,
"eval_wer": 0.14651490392742436,
"step": 51600
},
{
"epoch": 4.25,
"learning_rate": 0.00014977736549165119,
"loss": 0.3106,
"step": 51800
},
{
"epoch": 4.25,
"eval_loss": 0.11705104261636734,
"eval_runtime": 625.4889,
"eval_samples_per_second": 18.282,
"eval_steps_per_second": 2.286,
"eval_wer": 0.15017749478785147,
"step": 51800
},
{
"epoch": 4.27,
"learning_rate": 0.0001491914852065228,
"loss": 0.2971,
"step": 52000
},
{
"epoch": 4.27,
"eval_loss": 0.1164257824420929,
"eval_runtime": 623.9511,
"eval_samples_per_second": 18.327,
"eval_steps_per_second": 2.292,
"eval_wer": 0.14739392573392687,
"step": 52000
},
{
"epoch": 4.29,
"learning_rate": 0.0001486056049213944,
"loss": 0.3113,
"step": 52200
},
{
"epoch": 4.29,
"eval_loss": 0.11716081202030182,
"eval_runtime": 620.6594,
"eval_samples_per_second": 18.424,
"eval_steps_per_second": 2.304,
"eval_wer": 0.1467741026652392,
"step": 52200
},
{
"epoch": 4.31,
"learning_rate": 0.00014801972463626597,
"loss": 0.2966,
"step": 52400
},
{
"epoch": 4.31,
"eval_loss": 0.11439959704875946,
"eval_runtime": 625.7976,
"eval_samples_per_second": 18.273,
"eval_steps_per_second": 2.285,
"eval_wer": 0.145928889389756,
"step": 52400
},
{
"epoch": 4.33,
"learning_rate": 0.00014743384435113757,
"loss": 0.3167,
"step": 52600
},
{
"epoch": 4.33,
"eval_loss": 0.11525892466306686,
"eval_runtime": 624.008,
"eval_samples_per_second": 18.325,
"eval_steps_per_second": 2.292,
"eval_wer": 0.1450047895418944,
"step": 52600
},
{
"epoch": 4.35,
"learning_rate": 0.00014684796406600918,
"loss": 0.3101,
"step": 52800
},
{
"epoch": 4.35,
"eval_loss": 0.11492661386728287,
"eval_runtime": 624.0638,
"eval_samples_per_second": 18.323,
"eval_steps_per_second": 2.291,
"eval_wer": 0.1450160590522342,
"step": 52800
},
{
"epoch": 4.37,
"learning_rate": 0.00014626208378088076,
"loss": 0.2972,
"step": 53000
},
{
"epoch": 4.37,
"eval_loss": 0.11436022818088531,
"eval_runtime": 621.413,
"eval_samples_per_second": 18.402,
"eval_steps_per_second": 2.301,
"eval_wer": 0.14395672508029525,
"step": 53000
},
{
"epoch": 4.39,
"learning_rate": 0.00014567620349575236,
"loss": 0.2949,
"step": 53200
},
{
"epoch": 4.39,
"eval_loss": 0.11512508243322372,
"eval_runtime": 622.0613,
"eval_samples_per_second": 18.382,
"eval_steps_per_second": 2.299,
"eval_wer": 0.14511748464529217,
"step": 53200
},
{
"epoch": 4.41,
"learning_rate": 0.00014509032321062394,
"loss": 0.2998,
"step": 53400
},
{
"epoch": 4.41,
"eval_loss": 0.11325063556432724,
"eval_runtime": 625.3597,
"eval_samples_per_second": 18.285,
"eval_steps_per_second": 2.287,
"eval_wer": 0.14369752634248042,
"step": 53400
},
{
"epoch": 4.43,
"learning_rate": 0.00014450444292549554,
"loss": 0.3033,
"step": 53600
},
{
"epoch": 4.43,
"eval_loss": 0.11504179239273071,
"eval_runtime": 631.902,
"eval_samples_per_second": 18.096,
"eval_steps_per_second": 2.263,
"eval_wer": 0.14047444638530457,
"step": 53600
},
{
"epoch": 4.45,
"learning_rate": 0.00014391856264036714,
"loss": 0.3064,
"step": 53800
},
{
"epoch": 4.45,
"eval_loss": 0.1125454306602478,
"eval_runtime": 621.7758,
"eval_samples_per_second": 18.391,
"eval_steps_per_second": 2.3,
"eval_wer": 0.1426381923705415,
"step": 53800
},
{
"epoch": 4.47,
"learning_rate": 0.00014333268235523872,
"loss": 0.2942,
"step": 54000
},
{
"epoch": 4.47,
"eval_loss": 0.11342581361532211,
"eval_runtime": 632.3216,
"eval_samples_per_second": 18.084,
"eval_steps_per_second": 2.262,
"eval_wer": 0.14604158449315377,
"step": 54000
},
{
"epoch": 4.49,
"learning_rate": 0.00014274680207011033,
"loss": 0.2907,
"step": 54200
},
{
"epoch": 4.49,
"eval_loss": 0.11338940262794495,
"eval_runtime": 631.9817,
"eval_samples_per_second": 18.094,
"eval_steps_per_second": 2.263,
"eval_wer": 0.1434721361356849,
"step": 54200
},
{
"epoch": 4.51,
"learning_rate": 0.00014216385118640757,
"loss": 0.3061,
"step": 54400
},
{
"epoch": 4.51,
"eval_loss": 0.11131487786769867,
"eval_runtime": 619.3147,
"eval_samples_per_second": 18.464,
"eval_steps_per_second": 2.309,
"eval_wer": 0.14222122048796978,
"step": 54400
},
{
"epoch": 4.52,
"learning_rate": 0.00014157797090127915,
"loss": 0.2872,
"step": 54600
},
{
"epoch": 4.52,
"eval_loss": 0.11378352344036102,
"eval_runtime": 627.6236,
"eval_samples_per_second": 18.22,
"eval_steps_per_second": 2.278,
"eval_wer": 0.14586127232771737,
"step": 54600
},
{
"epoch": 4.54,
"learning_rate": 0.00014099209061615075,
"loss": 0.291,
"step": 54800
},
{
"epoch": 4.54,
"eval_loss": 0.10948885232210159,
"eval_runtime": 631.6042,
"eval_samples_per_second": 18.105,
"eval_steps_per_second": 2.264,
"eval_wer": 0.14297627768073476,
"step": 54800
},
{
"epoch": 4.56,
"learning_rate": 0.00014040621033102236,
"loss": 0.2916,
"step": 55000
},
{
"epoch": 4.56,
"eval_loss": 0.11261311173439026,
"eval_runtime": 629.602,
"eval_samples_per_second": 18.162,
"eval_steps_per_second": 2.271,
"eval_wer": 0.13918972220657014,
"step": 55000
},
{
"epoch": 4.58,
"learning_rate": 0.00013982033004589393,
"loss": 0.295,
"step": 55200
},
{
"epoch": 4.58,
"eval_loss": 0.11116189509630203,
"eval_runtime": 631.1044,
"eval_samples_per_second": 18.119,
"eval_steps_per_second": 2.266,
"eval_wer": 0.13987716233729644,
"step": 55200
},
{
"epoch": 4.6,
"learning_rate": 0.00013923444976076554,
"loss": 0.2953,
"step": 55400
},
{
"epoch": 4.6,
"eval_loss": 0.11264733970165253,
"eval_runtime": 630.3645,
"eval_samples_per_second": 18.14,
"eval_steps_per_second": 2.269,
"eval_wer": 0.13953907702710316,
"step": 55400
},
{
"epoch": 4.62,
"learning_rate": 0.00013864856947563714,
"loss": 0.2934,
"step": 55600
},
{
"epoch": 4.62,
"eval_loss": 0.11191383749246597,
"eval_runtime": 638.5461,
"eval_samples_per_second": 17.908,
"eval_steps_per_second": 2.239,
"eval_wer": 0.1429199301290359,
"step": 55600
},
{
"epoch": 4.64,
"learning_rate": 0.00013806268919050872,
"loss": 0.2995,
"step": 55800
},
{
"epoch": 4.64,
"eval_loss": 0.11275320500135422,
"eval_runtime": 636.369,
"eval_samples_per_second": 17.969,
"eval_steps_per_second": 2.247,
"eval_wer": 0.1417929790950583,
"step": 55800
},
{
"epoch": 4.66,
"learning_rate": 0.00013747680890538032,
"loss": 0.2908,
"step": 56000
},
{
"epoch": 4.66,
"eval_loss": 0.11625451594591141,
"eval_runtime": 629.3289,
"eval_samples_per_second": 18.17,
"eval_steps_per_second": 2.272,
"eval_wer": 0.14449766157660449,
"step": 56000
},
{
"epoch": 4.68,
"learning_rate": 0.0001368909286202519,
"loss": 0.2982,
"step": 56200
},
{
"epoch": 4.68,
"eval_loss": 0.1119445189833641,
"eval_runtime": 627.9078,
"eval_samples_per_second": 18.211,
"eval_steps_per_second": 2.277,
"eval_wer": 0.14262692286020173,
"step": 56200
},
{
"epoch": 4.7,
"learning_rate": 0.0001363050483351235,
"loss": 0.2907,
"step": 56400
},
{
"epoch": 4.7,
"eval_loss": 0.11290817707777023,
"eval_runtime": 625.336,
"eval_samples_per_second": 18.286,
"eval_steps_per_second": 2.287,
"eval_wer": 0.1417028230123401,
"step": 56400
},
{
"epoch": 4.72,
"learning_rate": 0.0001357191680499951,
"loss": 0.2884,
"step": 56600
},
{
"epoch": 4.72,
"eval_loss": 0.11267752945423126,
"eval_runtime": 623.6566,
"eval_samples_per_second": 18.335,
"eval_steps_per_second": 2.293,
"eval_wer": 0.14219868146729026,
"step": 56600
},
{
"epoch": 4.74,
"learning_rate": 0.00013513328776486669,
"loss": 0.2967,
"step": 56800
},
{
"epoch": 4.74,
"eval_loss": 0.11243223398923874,
"eval_runtime": 624.4114,
"eval_samples_per_second": 18.313,
"eval_steps_per_second": 2.29,
"eval_wer": 0.14279596551529836,
"step": 56800
},
{
"epoch": 4.76,
"learning_rate": 0.0001345474074797383,
"loss": 0.2938,
"step": 57000
},
{
"epoch": 4.76,
"eval_loss": 0.11092329025268555,
"eval_runtime": 621.6714,
"eval_samples_per_second": 18.394,
"eval_steps_per_second": 2.3,
"eval_wer": 0.13847974305516425,
"step": 57000
},
{
"epoch": 4.78,
"learning_rate": 0.00013396445659603554,
"loss": 0.2814,
"step": 57200
},
{
"epoch": 4.78,
"eval_loss": 0.11275891214609146,
"eval_runtime": 621.8116,
"eval_samples_per_second": 18.39,
"eval_steps_per_second": 2.3,
"eval_wer": 0.13922353073758945,
"step": 57200
},
{
"epoch": 4.8,
"learning_rate": 0.00013337857631090711,
"loss": 0.2972,
"step": 57400
},
{
"epoch": 4.8,
"eval_loss": 0.1118135005235672,
"eval_runtime": 626.7556,
"eval_samples_per_second": 18.245,
"eval_steps_per_second": 2.282,
"eval_wer": 0.14214233391559136,
"step": 57400
},
{
"epoch": 4.82,
"learning_rate": 0.00013279269602577872,
"loss": 0.2824,
"step": 57600
},
{
"epoch": 4.82,
"eval_loss": 0.11107096076011658,
"eval_runtime": 623.6389,
"eval_samples_per_second": 18.336,
"eval_steps_per_second": 2.293,
"eval_wer": 0.14098157435059447,
"step": 57600
},
{
"epoch": 4.84,
"learning_rate": 0.00013220681574065032,
"loss": 0.2876,
"step": 57800
},
{
"epoch": 4.84,
"eval_loss": 0.11149298399686813,
"eval_runtime": 623.7048,
"eval_samples_per_second": 18.334,
"eval_steps_per_second": 2.293,
"eval_wer": 0.13867132473094043,
"step": 57800
},
{
"epoch": 4.86,
"learning_rate": 0.0001316209354555219,
"loss": 0.2821,
"step": 58000
},
{
"epoch": 4.86,
"eval_loss": 0.10840985924005508,
"eval_runtime": 625.8552,
"eval_samples_per_second": 18.271,
"eval_steps_per_second": 2.285,
"eval_wer": 0.1385473601172029,
"step": 58000
},
{
"epoch": 4.87,
"learning_rate": 0.0001310350551703935,
"loss": 0.2816,
"step": 58200
},
{
"epoch": 4.87,
"eval_loss": 0.11007586866617203,
"eval_runtime": 625.5014,
"eval_samples_per_second": 18.281,
"eval_steps_per_second": 2.286,
"eval_wer": 0.13653011776638305,
"step": 58200
},
{
"epoch": 4.89,
"learning_rate": 0.00013045210428669075,
"loss": 0.2992,
"step": 58400
},
{
"epoch": 4.89,
"eval_loss": 0.10946887731552124,
"eval_runtime": 620.2255,
"eval_samples_per_second": 18.437,
"eval_steps_per_second": 2.306,
"eval_wer": 0.14015890009579085,
"step": 58400
},
{
"epoch": 4.91,
"learning_rate": 0.00012986622400156233,
"loss": 0.2912,
"step": 58600
},
{
"epoch": 4.91,
"eval_loss": 0.10773813724517822,
"eval_runtime": 625.4145,
"eval_samples_per_second": 18.284,
"eval_steps_per_second": 2.286,
"eval_wer": 0.1377584943934186,
"step": 58600
},
{
"epoch": 4.93,
"learning_rate": 0.00012928034371643393,
"loss": 0.2956,
"step": 58800
},
{
"epoch": 4.93,
"eval_loss": 0.10763510316610336,
"eval_runtime": 627.2025,
"eval_samples_per_second": 18.232,
"eval_steps_per_second": 2.28,
"eval_wer": 0.13772468586239928,
"step": 58800
},
{
"epoch": 4.95,
"learning_rate": 0.00012869446343130554,
"loss": 0.3034,
"step": 59000
},
{
"epoch": 4.95,
"eval_loss": 0.10751395672559738,
"eval_runtime": 627.4457,
"eval_samples_per_second": 18.225,
"eval_steps_per_second": 2.279,
"eval_wer": 0.13743167859356512,
"step": 59000
},
{
"epoch": 4.97,
"learning_rate": 0.0001281085831461771,
"loss": 0.3127,
"step": 59200
},
{
"epoch": 4.97,
"eval_loss": 0.10920178145170212,
"eval_runtime": 626.5767,
"eval_samples_per_second": 18.25,
"eval_steps_per_second": 2.282,
"eval_wer": 0.1391559136755508,
"step": 59200
},
{
"epoch": 4.99,
"learning_rate": 0.00012752270286104872,
"loss": 0.3078,
"step": 59400
},
{
"epoch": 4.99,
"eval_loss": 0.10621806979179382,
"eval_runtime": 627.2538,
"eval_samples_per_second": 18.23,
"eval_steps_per_second": 2.28,
"eval_wer": 0.1387389417929791,
"step": 59400
},
{
"epoch": 5.01,
"learning_rate": 0.00012693682257592032,
"loss": 0.2782,
"step": 59600
},
{
"epoch": 5.01,
"eval_loss": 0.1064351499080658,
"eval_runtime": 627.6844,
"eval_samples_per_second": 18.218,
"eval_steps_per_second": 2.278,
"eval_wer": 0.13708232377303206,
"step": 59600
},
{
"epoch": 5.03,
"learning_rate": 0.0001263509422907919,
"loss": 0.2751,
"step": 59800
},
{
"epoch": 5.03,
"eval_loss": 0.10696742683649063,
"eval_runtime": 622.6157,
"eval_samples_per_second": 18.366,
"eval_steps_per_second": 2.297,
"eval_wer": 0.13444525835352453,
"step": 59800
},
{
"epoch": 5.05,
"learning_rate": 0.0001257650620056635,
"loss": 0.2582,
"step": 60000
},
{
"epoch": 5.05,
"eval_loss": 0.10697264224290848,
"eval_runtime": 630.057,
"eval_samples_per_second": 18.149,
"eval_steps_per_second": 2.27,
"eval_wer": 0.13461430100862118,
"step": 60000
},
{
"epoch": 5.07,
"learning_rate": 0.00012517918172053508,
"loss": 0.2641,
"step": 60200
},
{
"epoch": 5.07,
"eval_loss": 0.10726083815097809,
"eval_runtime": 627.7279,
"eval_samples_per_second": 18.216,
"eval_steps_per_second": 2.278,
"eval_wer": 0.13570744351157943,
"step": 60200
},
{
"epoch": 5.09,
"learning_rate": 0.00012459330143540668,
"loss": 0.2709,
"step": 60400
},
{
"epoch": 5.09,
"eval_loss": 0.1082502007484436,
"eval_runtime": 631.7872,
"eval_samples_per_second": 18.099,
"eval_steps_per_second": 2.263,
"eval_wer": 0.13455795345692229,
"step": 60400
},
{
"epoch": 5.11,
"learning_rate": 0.0001240074211502783,
"loss": 0.2834,
"step": 60600
},
{
"epoch": 5.11,
"eval_loss": 0.10695182532072067,
"eval_runtime": 628.9494,
"eval_samples_per_second": 18.181,
"eval_steps_per_second": 2.274,
"eval_wer": 0.13725136642812868,
"step": 60600
},
{
"epoch": 5.13,
"learning_rate": 0.00012342154086514986,
"loss": 0.2723,
"step": 60800
},
{
"epoch": 5.13,
"eval_loss": 0.10714374482631683,
"eval_runtime": 627.1877,
"eval_samples_per_second": 18.232,
"eval_steps_per_second": 2.28,
"eval_wer": 0.1403166732405477,
"step": 60800
},
{
"epoch": 5.02,
"learning_rate": 0.00012283566058002147,
"loss": 0.2895,
"step": 61000
},
{
"epoch": 5.02,
"eval_loss": 0.10630907863378525,
"eval_runtime": 724.1222,
"eval_samples_per_second": 15.792,
"eval_steps_per_second": 1.975,
"eval_wer": 0.1340395559812926,
"step": 61000
},
{
"epoch": 5.04,
"learning_rate": 0.00012224978029489307,
"loss": 0.2791,
"step": 61200
},
{
"epoch": 5.04,
"eval_loss": 0.10776282101869583,
"eval_runtime": 714.1344,
"eval_samples_per_second": 16.012,
"eval_steps_per_second": 2.002,
"eval_wer": 0.13479461317405758,
"step": 61200
},
{
"epoch": 5.06,
"learning_rate": 0.00012166390000976466,
"loss": 0.2689,
"step": 61400
},
{
"epoch": 5.06,
"eval_loss": 0.10609008371829987,
"eval_runtime": 717.7674,
"eval_samples_per_second": 15.931,
"eval_steps_per_second": 1.992,
"eval_wer": 0.13410717304333128,
"step": 61400
},
{
"epoch": 5.08,
"learning_rate": 0.00012107801972463625,
"loss": 0.2639,
"step": 61600
},
{
"epoch": 5.08,
"eval_loss": 0.10747672617435455,
"eval_runtime": 708.6123,
"eval_samples_per_second": 16.137,
"eval_steps_per_second": 2.018,
"eval_wer": 0.13658646531808194,
"step": 61600
},
{
"epoch": 5.1,
"learning_rate": 0.00012049213943950784,
"loss": 0.2811,
"step": 61800
},
{
"epoch": 5.1,
"eval_loss": 0.10639283061027527,
"eval_runtime": 699.5143,
"eval_samples_per_second": 16.347,
"eval_steps_per_second": 2.044,
"eval_wer": 0.13498619484983376,
"step": 61800
},
{
"epoch": 5.12,
"learning_rate": 0.00011990625915437945,
"loss": 0.2708,
"step": 62000
},
{
"epoch": 5.12,
"eval_loss": 0.1074819564819336,
"eval_runtime": 707.2617,
"eval_samples_per_second": 16.168,
"eval_steps_per_second": 2.022,
"eval_wer": 0.13471572660167916,
"step": 62000
},
{
"epoch": 5.14,
"learning_rate": 0.00011932037886925104,
"loss": 0.2711,
"step": 62200
},
{
"epoch": 5.14,
"eval_loss": 0.10513726621866226,
"eval_runtime": 711.5872,
"eval_samples_per_second": 16.07,
"eval_steps_per_second": 2.01,
"eval_wer": 0.13240547698202512,
"step": 62200
},
{
"epoch": 5.16,
"learning_rate": 0.00011873742798554829,
"loss": 0.2739,
"step": 62400
},
{
"epoch": 5.16,
"eval_loss": 0.10640209913253784,
"eval_runtime": 710.3202,
"eval_samples_per_second": 16.098,
"eval_steps_per_second": 2.013,
"eval_wer": 0.1323265904096467,
"step": 62400
},
{
"epoch": 5.17,
"learning_rate": 0.00011815154770041988,
"loss": 0.2737,
"step": 62600
},
{
"epoch": 5.17,
"eval_loss": 0.10621224343776703,
"eval_runtime": 709.0146,
"eval_samples_per_second": 16.128,
"eval_steps_per_second": 2.017,
"eval_wer": 0.13518904603594975,
"step": 62600
},
{
"epoch": 5.19,
"learning_rate": 0.00011756566741529147,
"loss": 0.266,
"step": 62800
},
{
"epoch": 5.19,
"eval_loss": 0.10414595156908035,
"eval_runtime": 703.9804,
"eval_samples_per_second": 16.243,
"eval_steps_per_second": 2.031,
"eval_wer": 0.13109821378261113,
"step": 62800
},
{
"epoch": 5.21,
"learning_rate": 0.00011697978713016306,
"loss": 0.272,
"step": 63000
},
{
"epoch": 5.21,
"eval_loss": 0.10723841935396194,
"eval_runtime": 704.9142,
"eval_samples_per_second": 16.222,
"eval_steps_per_second": 2.029,
"eval_wer": 0.13118836986532936,
"step": 63000
},
{
"epoch": 5.23,
"learning_rate": 0.00011639390684503466,
"loss": 0.2631,
"step": 63200
},
{
"epoch": 5.23,
"eval_loss": 0.10395067185163498,
"eval_runtime": 709.9351,
"eval_samples_per_second": 16.107,
"eval_steps_per_second": 2.014,
"eval_wer": 0.13021919197610865,
"step": 63200
},
{
"epoch": 5.25,
"learning_rate": 0.00011580802655990625,
"loss": 0.2677,
"step": 63400
},
{
"epoch": 5.25,
"eval_loss": 0.10302858054637909,
"eval_runtime": 716.0431,
"eval_samples_per_second": 15.97,
"eval_steps_per_second": 1.997,
"eval_wer": 0.13177438440299769,
"step": 63400
},
{
"epoch": 5.27,
"learning_rate": 0.00011522214627477784,
"loss": 0.2537,
"step": 63600
},
{
"epoch": 5.27,
"eval_loss": 0.105635866522789,
"eval_runtime": 717.4391,
"eval_samples_per_second": 15.939,
"eval_steps_per_second": 1.993,
"eval_wer": 0.13281117935425707,
"step": 63600
},
{
"epoch": 5.29,
"learning_rate": 0.00011463626598964943,
"loss": 0.2817,
"step": 63800
},
{
"epoch": 5.29,
"eval_loss": 0.10486125200986862,
"eval_runtime": 713.1716,
"eval_samples_per_second": 16.034,
"eval_steps_per_second": 2.005,
"eval_wer": 0.1323265904096467,
"step": 63800
},
{
"epoch": 5.31,
"learning_rate": 0.00011405038570452104,
"loss": 0.261,
"step": 64000
},
{
"epoch": 5.31,
"eval_loss": 0.10378312319517136,
"eval_runtime": 707.893,
"eval_samples_per_second": 16.154,
"eval_steps_per_second": 2.02,
"eval_wer": 0.1305572772863019,
"step": 64000
},
{
"epoch": 5.33,
"learning_rate": 0.00011346450541939263,
"loss": 0.2822,
"step": 64200
},
{
"epoch": 5.33,
"eval_loss": 0.10581466555595398,
"eval_runtime": 716.437,
"eval_samples_per_second": 15.961,
"eval_steps_per_second": 1.996,
"eval_wer": 0.12975714205217784,
"step": 64200
},
{
"epoch": 5.35,
"learning_rate": 0.00011287862513426422,
"loss": 0.2725,
"step": 64400
},
{
"epoch": 5.35,
"eval_loss": 0.10494490712881088,
"eval_runtime": 715.1416,
"eval_samples_per_second": 15.99,
"eval_steps_per_second": 2.0,
"eval_wer": 0.13041077365188483,
"step": 64400
},
{
"epoch": 5.37,
"learning_rate": 0.00011229274484913581,
"loss": 0.2601,
"step": 64600
},
{
"epoch": 5.37,
"eval_loss": 0.1038796454668045,
"eval_runtime": 716.2768,
"eval_samples_per_second": 15.964,
"eval_steps_per_second": 1.996,
"eval_wer": 0.12908097143179129,
"step": 64600
},
{
"epoch": 5.39,
"learning_rate": 0.0001117068645640074,
"loss": 0.2637,
"step": 64800
},
{
"epoch": 5.39,
"eval_loss": 0.10526276379823685,
"eval_runtime": 717.256,
"eval_samples_per_second": 15.943,
"eval_steps_per_second": 1.994,
"eval_wer": 0.1309291711275145,
"step": 64800
},
{
"epoch": 5.41,
"learning_rate": 0.00011112098427887902,
"loss": 0.2646,
"step": 65000
},
{
"epoch": 5.41,
"eval_loss": 0.10593494772911072,
"eval_runtime": 711.2752,
"eval_samples_per_second": 16.077,
"eval_steps_per_second": 2.01,
"eval_wer": 0.13076012847241789,
"step": 65000
},
{
"epoch": 5.43,
"learning_rate": 0.00011053510399375061,
"loss": 0.2593,
"step": 65200
},
{
"epoch": 5.43,
"eval_loss": 0.10260586440563202,
"eval_runtime": 710.5911,
"eval_samples_per_second": 16.092,
"eval_steps_per_second": 2.012,
"eval_wer": 0.12839353130106496,
"step": 65200
},
{
"epoch": 5.45,
"learning_rate": 0.0001099492237086222,
"loss": 0.2764,
"step": 65400
},
{
"epoch": 5.45,
"eval_loss": 0.1039929986000061,
"eval_runtime": 711.9108,
"eval_samples_per_second": 16.062,
"eval_steps_per_second": 2.009,
"eval_wer": 0.12882177269397643,
"step": 65400
},
{
"epoch": 5.47,
"learning_rate": 0.00010936334342349379,
"loss": 0.2557,
"step": 65600
},
{
"epoch": 5.47,
"eval_loss": 0.10381390899419785,
"eval_runtime": 718.0919,
"eval_samples_per_second": 15.924,
"eval_steps_per_second": 1.991,
"eval_wer": 0.12913731898349018,
"step": 65600
},
{
"epoch": 5.49,
"learning_rate": 0.00010877746313836539,
"loss": 0.2571,
"step": 65800
},
{
"epoch": 5.49,
"eval_loss": 0.10302343964576721,
"eval_runtime": 711.5912,
"eval_samples_per_second": 16.07,
"eval_steps_per_second": 2.01,
"eval_wer": 0.1304671212035837,
"step": 65800
},
{
"epoch": 5.51,
"learning_rate": 0.00010819158285323698,
"loss": 0.2703,
"step": 66000
},
{
"epoch": 5.51,
"eval_loss": 0.1036553829908371,
"eval_runtime": 714.6453,
"eval_samples_per_second": 16.001,
"eval_steps_per_second": 2.001,
"eval_wer": 0.12699611201893277,
"step": 66000
},
{
"epoch": 5.52,
"learning_rate": 0.00010760570256810857,
"loss": 0.2603,
"step": 66200
},
{
"epoch": 5.52,
"eval_loss": 0.102656789124012,
"eval_runtime": 711.5823,
"eval_samples_per_second": 16.07,
"eval_steps_per_second": 2.01,
"eval_wer": 0.12859638248718094,
"step": 66200
},
{
"epoch": 5.54,
"learning_rate": 0.00010701982228298016,
"loss": 0.2501,
"step": 66400
},
{
"epoch": 5.54,
"eval_loss": 0.1020718440413475,
"eval_runtime": 708.9234,
"eval_samples_per_second": 16.13,
"eval_steps_per_second": 2.017,
"eval_wer": 0.12927255310756747,
"step": 66400
},
{
"epoch": 5.56,
"learning_rate": 0.00010643394199785177,
"loss": 0.2615,
"step": 66600
},
{
"epoch": 5.56,
"eval_loss": 0.10426247119903564,
"eval_runtime": 712.0372,
"eval_samples_per_second": 16.06,
"eval_steps_per_second": 2.008,
"eval_wer": 0.1299036456865949,
"step": 66600
},
{
"epoch": 5.58,
"learning_rate": 0.00010584806171272336,
"loss": 0.2669,
"step": 66800
},
{
"epoch": 5.58,
"eval_loss": 0.10160184651613235,
"eval_runtime": 715.9766,
"eval_samples_per_second": 15.971,
"eval_steps_per_second": 1.997,
"eval_wer": 0.12859638248718094,
"step": 66800
},
{
"epoch": 5.6,
"learning_rate": 0.00010526218142759495,
"loss": 0.2737,
"step": 67000
},
{
"epoch": 5.6,
"eval_loss": 0.0998615026473999,
"eval_runtime": 721.1944,
"eval_samples_per_second": 15.856,
"eval_steps_per_second": 1.983,
"eval_wer": 0.1280554459908717,
"step": 67000
},
{
"epoch": 5.62,
"learning_rate": 0.0001046792305438922,
"loss": 0.2686,
"step": 67200
},
{
"epoch": 5.62,
"eval_loss": 0.1005900576710701,
"eval_runtime": 720.5097,
"eval_samples_per_second": 15.871,
"eval_steps_per_second": 1.985,
"eval_wer": 0.12931763114892658,
"step": 67200
},
{
"epoch": 5.64,
"learning_rate": 0.00010409335025876379,
"loss": 0.2638,
"step": 67400
},
{
"epoch": 5.64,
"eval_loss": 0.10066718608140945,
"eval_runtime": 716.9838,
"eval_samples_per_second": 15.949,
"eval_steps_per_second": 1.994,
"eval_wer": 0.12787513382543528,
"step": 67400
},
{
"epoch": 5.66,
"learning_rate": 0.00010351039937506102,
"loss": 0.2657,
"step": 67600
},
{
"epoch": 5.66,
"eval_loss": 0.10130422562360764,
"eval_runtime": 718.8149,
"eval_samples_per_second": 15.908,
"eval_steps_per_second": 1.989,
"eval_wer": 0.12775116921169774,
"step": 67600
},
{
"epoch": 5.68,
"learning_rate": 0.00010292451908993261,
"loss": 0.2648,
"step": 67800
},
{
"epoch": 5.68,
"eval_loss": 0.10149582475423813,
"eval_runtime": 721.2563,
"eval_samples_per_second": 15.854,
"eval_steps_per_second": 1.983,
"eval_wer": 0.12784132529441597,
"step": 67800
},
{
"epoch": 5.7,
"learning_rate": 0.0001023386388048042,
"loss": 0.2524,
"step": 68000
},
{
"epoch": 5.7,
"eval_loss": 0.09992196410894394,
"eval_runtime": 715.5922,
"eval_samples_per_second": 15.98,
"eval_steps_per_second": 1.998,
"eval_wer": 0.12749197047388292,
"step": 68000
},
{
"epoch": 5.72,
"learning_rate": 0.0001017527585196758,
"loss": 0.2546,
"step": 68200
},
{
"epoch": 5.72,
"eval_loss": 0.09948063641786575,
"eval_runtime": 707.0025,
"eval_samples_per_second": 16.174,
"eval_steps_per_second": 2.023,
"eval_wer": 0.12589170000563477,
"step": 68200
},
{
"epoch": 5.74,
"learning_rate": 0.0001011668782345474,
"loss": 0.2622,
"step": 68400
},
{
"epoch": 5.74,
"eval_loss": 0.10015752166509628,
"eval_runtime": 713.843,
"eval_samples_per_second": 16.019,
"eval_steps_per_second": 2.003,
"eval_wer": 0.12627486335718713,
"step": 68400
},
{
"epoch": 5.76,
"learning_rate": 0.00010058099794941899,
"loss": 0.2604,
"step": 68600
},
{
"epoch": 5.76,
"eval_loss": 0.1018703505396843,
"eval_runtime": 721.4552,
"eval_samples_per_second": 15.85,
"eval_steps_per_second": 1.982,
"eval_wer": 0.1254071110610244,
"step": 68600
},
{
"epoch": 5.78,
"learning_rate": 9.999511766429058e-05,
"loss": 0.2458,
"step": 68800
},
{
"epoch": 5.78,
"eval_loss": 0.1008736789226532,
"eval_runtime": 701.5996,
"eval_samples_per_second": 16.298,
"eval_steps_per_second": 2.038,
"eval_wer": 0.12576773539189723,
"step": 68800
},
{
"epoch": 5.8,
"learning_rate": 9.940923737916218e-05,
"loss": 0.2608,
"step": 69000
},
{
"epoch": 5.8,
"eval_loss": 0.10070067644119263,
"eval_runtime": 712.046,
"eval_samples_per_second": 16.059,
"eval_steps_per_second": 2.008,
"eval_wer": 0.12631994139854624,
"step": 69000
},
{
"epoch": 5.82,
"learning_rate": 9.882335709403377e-05,
"loss": 0.2633,
"step": 69200
},
{
"epoch": 5.82,
"eval_loss": 0.09837665408849716,
"eval_runtime": 708.3742,
"eval_samples_per_second": 16.143,
"eval_steps_per_second": 2.019,
"eval_wer": 0.12583535245393587,
"step": 69200
},
{
"epoch": 5.84,
"learning_rate": 9.824040621033102e-05,
"loss": 0.2526,
"step": 69400
},
{
"epoch": 5.84,
"eval_loss": 0.10069932788610458,
"eval_runtime": 725.7524,
"eval_samples_per_second": 15.756,
"eval_steps_per_second": 1.97,
"eval_wer": 0.12542965008170395,
"step": 69400
},
{
"epoch": 5.86,
"learning_rate": 9.765452592520261e-05,
"loss": 0.2476,
"step": 69600
},
{
"epoch": 5.86,
"eval_loss": 0.10035388171672821,
"eval_runtime": 710.9719,
"eval_samples_per_second": 16.084,
"eval_steps_per_second": 2.011,
"eval_wer": 0.12496760015777314,
"step": 69600
},
{
"epoch": 5.87,
"learning_rate": 9.70686456400742e-05,
"loss": 0.2607,
"step": 69800
},
{
"epoch": 5.87,
"eval_loss": 0.10133133828639984,
"eval_runtime": 715.255,
"eval_samples_per_second": 15.987,
"eval_steps_per_second": 1.999,
"eval_wer": 0.12650025356398265,
"step": 69800
},
{
"epoch": 5.89,
"learning_rate": 9.648276535494579e-05,
"loss": 0.2606,
"step": 70000
},
{
"epoch": 5.89,
"eval_loss": 0.09976745396852493,
"eval_runtime": 710.9411,
"eval_samples_per_second": 16.084,
"eval_steps_per_second": 2.011,
"eval_wer": 0.1242914295373866,
"step": 70000
},
{
"epoch": 5.91,
"learning_rate": 9.58968850698174e-05,
"loss": 0.258,
"step": 70200
},
{
"epoch": 5.91,
"eval_loss": 0.09873379021883011,
"eval_runtime": 708.9039,
"eval_samples_per_second": 16.131,
"eval_steps_per_second": 2.017,
"eval_wer": 0.12497886966811292,
"step": 70200
},
{
"epoch": 5.93,
"learning_rate": 9.531100478468898e-05,
"loss": 0.262,
"step": 70400
},
{
"epoch": 5.93,
"eval_loss": 0.09941908717155457,
"eval_runtime": 713.9341,
"eval_samples_per_second": 16.017,
"eval_steps_per_second": 2.003,
"eval_wer": 0.12625232433650757,
"step": 70400
},
{
"epoch": 5.95,
"learning_rate": 9.472512449956058e-05,
"loss": 0.2684,
"step": 70600
},
{
"epoch": 5.95,
"eval_loss": 0.09816844016313553,
"eval_runtime": 710.6891,
"eval_samples_per_second": 16.09,
"eval_steps_per_second": 2.012,
"eval_wer": 0.12258973347608046,
"step": 70600
},
{
"epoch": 6.02,
"learning_rate": 9.413924421443217e-05,
"loss": 0.247,
"step": 70800
},
{
"epoch": 6.02,
"eval_loss": 0.10028348863124847,
"eval_runtime": 662.0676,
"eval_samples_per_second": 17.272,
"eval_steps_per_second": 2.16,
"eval_wer": 0.12441539415112414,
"step": 70800
},
{
"epoch": 6.04,
"learning_rate": 9.355336392930377e-05,
"loss": 0.2482,
"step": 71000
},
{
"epoch": 6.04,
"eval_loss": 0.0990142971277237,
"eval_runtime": 649.2239,
"eval_samples_per_second": 17.613,
"eval_steps_per_second": 2.203,
"eval_wer": 0.1230405138896715,
"step": 71000
},
{
"epoch": 6.06,
"learning_rate": 9.296748364417536e-05,
"loss": 0.2385,
"step": 71200
},
{
"epoch": 6.06,
"eval_loss": 0.09822484850883484,
"eval_runtime": 660.7912,
"eval_samples_per_second": 17.305,
"eval_steps_per_second": 2.164,
"eval_wer": 0.12372795402039781,
"step": 71200
},
{
"epoch": 6.08,
"learning_rate": 9.238160335904695e-05,
"loss": 0.2406,
"step": 71400
},
{
"epoch": 6.08,
"eval_loss": 0.09724367409944534,
"eval_runtime": 660.8872,
"eval_samples_per_second": 17.302,
"eval_steps_per_second": 2.164,
"eval_wer": 0.12193610187637346,
"step": 71400
},
{
"epoch": 6.1,
"learning_rate": 9.179572307391854e-05,
"loss": 0.2579,
"step": 71600
},
{
"epoch": 6.1,
"eval_loss": 0.0971040278673172,
"eval_runtime": 674.9194,
"eval_samples_per_second": 16.943,
"eval_steps_per_second": 2.119,
"eval_wer": 0.12212768355214966,
"step": 71600
},
{
"epoch": 6.12,
"learning_rate": 9.120984278879016e-05,
"loss": 0.2512,
"step": 71800
},
{
"epoch": 6.12,
"eval_loss": 0.09761016815900803,
"eval_runtime": 670.6191,
"eval_samples_per_second": 17.051,
"eval_steps_per_second": 2.132,
"eval_wer": 0.12180086775229616,
"step": 71800
},
{
"epoch": 6.14,
"learning_rate": 9.062396250366175e-05,
"loss": 0.2435,
"step": 72000
},
{
"epoch": 6.14,
"eval_loss": 0.09776688367128372,
"eval_runtime": 668.7679,
"eval_samples_per_second": 17.099,
"eval_steps_per_second": 2.138,
"eval_wer": 0.12095565447681299,
"step": 72000
},
{
"epoch": 6.16,
"learning_rate": 9.003808221853334e-05,
"loss": 0.2526,
"step": 72200
},
{
"epoch": 6.16,
"eval_loss": 0.09796804934740067,
"eval_runtime": 666.8275,
"eval_samples_per_second": 17.148,
"eval_steps_per_second": 2.144,
"eval_wer": 0.1238744576548149,
"step": 72200
},
{
"epoch": 6.17,
"learning_rate": 8.945220193340493e-05,
"loss": 0.2472,
"step": 72400
},
{
"epoch": 6.17,
"eval_loss": 0.09801238030195236,
"eval_runtime": 673.7542,
"eval_samples_per_second": 16.972,
"eval_steps_per_second": 2.122,
"eval_wer": 0.12542965008170395,
"step": 72400
},
{
"epoch": 6.19,
"learning_rate": 8.886632164827653e-05,
"loss": 0.2438,
"step": 72600
},
{
"epoch": 6.19,
"eval_loss": 0.0977615937590599,
"eval_runtime": 664.5529,
"eval_samples_per_second": 17.207,
"eval_steps_per_second": 2.152,
"eval_wer": 0.12182340677297572,
"step": 72600
},
{
"epoch": 6.21,
"learning_rate": 8.828044136314813e-05,
"loss": 0.2375,
"step": 72800
},
{
"epoch": 6.21,
"eval_loss": 0.09897564351558685,
"eval_runtime": 659.823,
"eval_samples_per_second": 17.33,
"eval_steps_per_second": 2.167,
"eval_wer": 0.12198117991773258,
"step": 72800
},
{
"epoch": 6.23,
"learning_rate": 8.769456107801972e-05,
"loss": 0.2419,
"step": 73000
},
{
"epoch": 6.23,
"eval_loss": 0.09719140082597733,
"eval_runtime": 670.2577,
"eval_samples_per_second": 17.061,
"eval_steps_per_second": 2.134,
"eval_wer": 0.11912999380176931,
"step": 73000
},
{
"epoch": 6.25,
"learning_rate": 8.71086807928913e-05,
"loss": 0.2441,
"step": 73200
},
{
"epoch": 6.25,
"eval_loss": 0.09728872776031494,
"eval_runtime": 692.8136,
"eval_samples_per_second": 16.505,
"eval_steps_per_second": 2.064,
"eval_wer": 0.12141770440074379,
"step": 73200
},
{
"epoch": 6.27,
"learning_rate": 8.652280050776291e-05,
"loss": 0.2314,
"step": 73400
},
{
"epoch": 6.27,
"eval_loss": 0.09700626879930496,
"eval_runtime": 686.6118,
"eval_samples_per_second": 16.654,
"eval_steps_per_second": 2.083,
"eval_wer": 0.12061756916661971,
"step": 73400
},
{
"epoch": 6.29,
"learning_rate": 8.59369202226345e-05,
"loss": 0.2533,
"step": 73600
},
{
"epoch": 6.29,
"eval_loss": 0.09654780477285385,
"eval_runtime": 683.2657,
"eval_samples_per_second": 16.736,
"eval_steps_per_second": 2.093,
"eval_wer": 0.1190398377190511,
"step": 73600
},
{
"epoch": 6.31,
"learning_rate": 8.535103993750609e-05,
"loss": 0.2357,
"step": 73800
},
{
"epoch": 6.31,
"eval_loss": 0.09661402553319931,
"eval_runtime": 682.2598,
"eval_samples_per_second": 16.76,
"eval_steps_per_second": 2.096,
"eval_wer": 0.12017805826336846,
"step": 73800
},
{
"epoch": 6.33,
"learning_rate": 8.476515965237768e-05,
"loss": 0.2466,
"step": 74000
},
{
"epoch": 6.33,
"eval_loss": 0.09645663946866989,
"eval_runtime": 689.4454,
"eval_samples_per_second": 16.586,
"eval_steps_per_second": 2.074,
"eval_wer": 0.11943427058094326,
"step": 74000
},
{
"epoch": 6.35,
"learning_rate": 8.417927936724929e-05,
"loss": 0.246,
"step": 74200
},
{
"epoch": 6.35,
"eval_loss": 0.09545984119176865,
"eval_runtime": 679.0158,
"eval_samples_per_second": 16.841,
"eval_steps_per_second": 2.106,
"eval_wer": 0.11880317800191581,
"step": 74200
},
{
"epoch": 6.37,
"learning_rate": 8.359339908212088e-05,
"loss": 0.2309,
"step": 74400
},
{
"epoch": 6.37,
"eval_loss": 0.09694214910268784,
"eval_runtime": 677.6907,
"eval_samples_per_second": 16.873,
"eval_steps_per_second": 2.11,
"eval_wer": 0.11869048289851807,
"step": 74400
},
{
"epoch": 6.39,
"learning_rate": 8.300751879699247e-05,
"loss": 0.2334,
"step": 74600
},
{
"epoch": 6.39,
"eval_loss": 0.0962836816906929,
"eval_runtime": 683.8832,
"eval_samples_per_second": 16.721,
"eval_steps_per_second": 2.091,
"eval_wer": 0.12112469713190961,
"step": 74600
},
{
"epoch": 6.41,
"learning_rate": 8.242163851186406e-05,
"loss": 0.2343,
"step": 74800
},
{
"epoch": 6.41,
"eval_loss": 0.09781304746866226,
"eval_runtime": 685.7457,
"eval_samples_per_second": 16.675,
"eval_steps_per_second": 2.085,
"eval_wer": 0.11866794387783851,
"step": 74800
},
{
"epoch": 6.43,
"learning_rate": 8.183575822673568e-05,
"loss": 0.2387,
"step": 75000
},
{
"epoch": 6.43,
"eval_loss": 0.09602531045675278,
"eval_runtime": 672.2565,
"eval_samples_per_second": 17.01,
"eval_steps_per_second": 2.127,
"eval_wer": 0.11829605003662591,
"step": 75000
},
{
"epoch": 6.45,
"learning_rate": 8.124987794160727e-05,
"loss": 0.25,
"step": 75200
},
{
"epoch": 6.45,
"eval_loss": 0.09615187346935272,
"eval_runtime": 682.05,
"eval_samples_per_second": 16.766,
"eval_steps_per_second": 2.097,
"eval_wer": 0.1192764974361864,
"step": 75200
},
{
"epoch": 6.47,
"learning_rate": 8.06669270579045e-05,
"loss": 0.2317,
"step": 75400
},
{
"epoch": 6.47,
"eval_loss": 0.09546995908021927,
"eval_runtime": 690.2183,
"eval_samples_per_second": 16.567,
"eval_steps_per_second": 2.072,
"eval_wer": 0.11836366709866457,
"step": 75400
},
{
"epoch": 6.49,
"learning_rate": 8.008104677277609e-05,
"loss": 0.2301,
"step": 75600
},
{
"epoch": 6.49,
"eval_loss": 0.09542080760002136,
"eval_runtime": 681.8498,
"eval_samples_per_second": 16.771,
"eval_steps_per_second": 2.097,
"eval_wer": 0.11834112807798501,
"step": 75600
},
{
"epoch": 6.51,
"learning_rate": 7.949516648764768e-05,
"loss": 0.2405,
"step": 75800
},
{
"epoch": 6.51,
"eval_loss": 0.09432049840688705,
"eval_runtime": 677.928,
"eval_samples_per_second": 16.868,
"eval_steps_per_second": 2.109,
"eval_wer": 0.11672958809939708,
"step": 75800
},
{
"epoch": 6.52,
"learning_rate": 7.891221560394493e-05,
"loss": 0.2345,
"step": 76000
},
{
"epoch": 6.52,
"eval_loss": 0.09489911794662476,
"eval_runtime": 688.6398,
"eval_samples_per_second": 16.605,
"eval_steps_per_second": 2.077,
"eval_wer": 0.11725925508536654,
"step": 76000
},
{
"epoch": 6.54,
"learning_rate": 7.832633531881652e-05,
"loss": 0.2267,
"step": 76200
},
{
"epoch": 6.54,
"eval_loss": 0.09413082152605057,
"eval_runtime": 680.2461,
"eval_samples_per_second": 16.81,
"eval_steps_per_second": 2.102,
"eval_wer": 0.11842001465036345,
"step": 76200
},
{
"epoch": 6.56,
"learning_rate": 7.774045503368811e-05,
"loss": 0.2293,
"step": 76400
},
{
"epoch": 6.56,
"eval_loss": 0.09459416568279266,
"eval_runtime": 658.8476,
"eval_samples_per_second": 17.356,
"eval_steps_per_second": 2.17,
"eval_wer": 0.11623372964444695,
"step": 76400
},
{
"epoch": 6.58,
"learning_rate": 7.715457474855971e-05,
"loss": 0.2312,
"step": 76600
},
{
"epoch": 6.58,
"eval_loss": 0.09610540419816971,
"eval_runtime": 661.5363,
"eval_samples_per_second": 17.286,
"eval_steps_per_second": 2.162,
"eval_wer": 0.1151405871414887,
"step": 76600
},
{
"epoch": 6.6,
"learning_rate": 7.65686944634313e-05,
"loss": 0.2343,
"step": 76800
},
{
"epoch": 6.6,
"eval_loss": 0.09503426402807236,
"eval_runtime": 680.9869,
"eval_samples_per_second": 16.792,
"eval_steps_per_second": 2.1,
"eval_wer": 0.11631261621682538,
"step": 76800
},
{
"epoch": 6.62,
"learning_rate": 7.59828141783029e-05,
"loss": 0.2366,
"step": 77000
},
{
"epoch": 6.62,
"eval_loss": 0.09373170137405396,
"eval_runtime": 677.558,
"eval_samples_per_second": 16.877,
"eval_steps_per_second": 2.111,
"eval_wer": 0.11597453090663211,
"step": 77000
},
{
"epoch": 6.64,
"learning_rate": 7.539693389317448e-05,
"loss": 0.2439,
"step": 77200
},
{
"epoch": 6.64,
"eval_loss": 0.09325527399778366,
"eval_runtime": 664.5936,
"eval_samples_per_second": 17.206,
"eval_steps_per_second": 2.152,
"eval_wer": 0.11638023327886403,
"step": 77200
},
{
"epoch": 6.66,
"learning_rate": 7.481105360804607e-05,
"loss": 0.2307,
"step": 77400
},
{
"epoch": 6.66,
"eval_loss": 0.09506206959486008,
"eval_runtime": 678.3069,
"eval_samples_per_second": 16.858,
"eval_steps_per_second": 2.108,
"eval_wer": 0.1172817941060461,
"step": 77400
},
{
"epoch": 6.68,
"learning_rate": 7.422517332291768e-05,
"loss": 0.2387,
"step": 77600
},
{
"epoch": 6.68,
"eval_loss": 0.0931260883808136,
"eval_runtime": 685.8319,
"eval_samples_per_second": 16.673,
"eval_steps_per_second": 2.085,
"eval_wer": 0.11590691384459345,
"step": 77600
},
{
"epoch": 6.7,
"learning_rate": 7.363929303778927e-05,
"loss": 0.2268,
"step": 77800
},
{
"epoch": 6.7,
"eval_loss": 0.0957166850566864,
"eval_runtime": 683.3247,
"eval_samples_per_second": 16.734,
"eval_steps_per_second": 2.093,
"eval_wer": 0.11711275145094946,
"step": 77800
},
{
"epoch": 6.72,
"learning_rate": 7.305341275266087e-05,
"loss": 0.2316,
"step": 78000
},
{
"epoch": 6.72,
"eval_loss": 0.09374788403511047,
"eval_runtime": 684.0333,
"eval_samples_per_second": 16.717,
"eval_steps_per_second": 2.091,
"eval_wer": 0.1139798275764918,
"step": 78000
},
{
"epoch": 6.74,
"learning_rate": 7.246753246753246e-05,
"loss": 0.2319,
"step": 78200
},
{
"epoch": 6.74,
"eval_loss": 0.09412852674722672,
"eval_runtime": 683.7255,
"eval_samples_per_second": 16.725,
"eval_steps_per_second": 2.091,
"eval_wer": 0.1150504310587705,
"step": 78200
},
{
"epoch": 6.76,
"learning_rate": 7.188165218240405e-05,
"loss": 0.2399,
"step": 78400
},
{
"epoch": 6.76,
"eval_loss": 0.09368865191936493,
"eval_runtime": 695.8,
"eval_samples_per_second": 16.434,
"eval_steps_per_second": 2.055,
"eval_wer": 0.11510677861046938,
"step": 78400
},
{
"epoch": 6.78,
"learning_rate": 7.129577189727565e-05,
"loss": 0.2282,
"step": 78600
},
{
"epoch": 6.78,
"eval_loss": 0.09468115866184235,
"eval_runtime": 692.8715,
"eval_samples_per_second": 16.504,
"eval_steps_per_second": 2.064,
"eval_wer": 0.11432918239702484,
"step": 78600
},
{
"epoch": 6.8,
"learning_rate": 7.070989161214725e-05,
"loss": 0.2406,
"step": 78800
},
{
"epoch": 6.8,
"eval_loss": 0.09301230311393738,
"eval_runtime": 675.0001,
"eval_samples_per_second": 16.941,
"eval_steps_per_second": 2.119,
"eval_wer": 0.11670704907871753,
"step": 78800
},
{
"epoch": 6.82,
"learning_rate": 7.012401132701884e-05,
"loss": 0.2367,
"step": 79000
},
{
"epoch": 6.82,
"eval_loss": 0.09292880445718765,
"eval_runtime": 678.9288,
"eval_samples_per_second": 16.843,
"eval_steps_per_second": 2.106,
"eval_wer": 0.11399109708683158,
"step": 79000
},
{
"epoch": 6.84,
"learning_rate": 6.953813104189044e-05,
"loss": 0.2225,
"step": 79200
},
{
"epoch": 6.84,
"eval_loss": 0.09368370473384857,
"eval_runtime": 662.1759,
"eval_samples_per_second": 17.269,
"eval_steps_per_second": 2.16,
"eval_wer": 0.11385586296275427,
"step": 79200
},
{
"epoch": 6.86,
"learning_rate": 6.895225075676203e-05,
"loss": 0.2242,
"step": 79400
},
{
"epoch": 6.86,
"eval_loss": 0.09303466975688934,
"eval_runtime": 669.81,
"eval_samples_per_second": 17.072,
"eval_steps_per_second": 2.135,
"eval_wer": 0.11382205443173495,
"step": 79400
},
{
"epoch": 6.87,
"learning_rate": 6.836637047163362e-05,
"loss": 0.2319,
"step": 79600
},
{
"epoch": 6.87,
"eval_loss": 0.09515677392482758,
"eval_runtime": 675.7005,
"eval_samples_per_second": 16.923,
"eval_steps_per_second": 2.116,
"eval_wer": 0.11462218966585902,
"step": 79600
},
{
"epoch": 6.89,
"learning_rate": 6.778049018650522e-05,
"loss": 0.2383,
"step": 79800
},
{
"epoch": 6.89,
"eval_loss": 0.09353630244731903,
"eval_runtime": 680.3127,
"eval_samples_per_second": 16.808,
"eval_steps_per_second": 2.102,
"eval_wer": 0.11421648729362709,
"step": 79800
},
{
"epoch": 6.91,
"learning_rate": 6.719460990137682e-05,
"loss": 0.228,
"step": 80000
},
{
"epoch": 6.91,
"eval_loss": 0.09211862087249756,
"eval_runtime": 677.5612,
"eval_samples_per_second": 16.877,
"eval_steps_per_second": 2.111,
"eval_wer": 0.11403617512819068,
"step": 80000
},
{
"epoch": 6.93,
"learning_rate": 6.660872961624841e-05,
"loss": 0.232,
"step": 80200
},
{
"epoch": 6.93,
"eval_loss": 0.09219860285520554,
"eval_runtime": 667.4301,
"eval_samples_per_second": 17.133,
"eval_steps_per_second": 2.143,
"eval_wer": 0.11532089930692511,
"step": 80200
},
{
"epoch": 6.95,
"learning_rate": 6.602577873254564e-05,
"loss": 0.2403,
"step": 80400
},
{
"epoch": 6.95,
"eval_loss": 0.09069675952196121,
"eval_runtime": 670.4564,
"eval_samples_per_second": 17.056,
"eval_steps_per_second": 2.133,
"eval_wer": 0.1124020961289232,
"step": 80400
},
{
"epoch": 6.97,
"learning_rate": 6.543989844741723e-05,
"loss": 0.2574,
"step": 80600
},
{
"epoch": 6.97,
"eval_loss": 0.09040801972150803,
"eval_runtime": 680.0348,
"eval_samples_per_second": 16.815,
"eval_steps_per_second": 2.103,
"eval_wer": 0.11377697639037584,
"step": 80600
},
{
"epoch": 6.99,
"learning_rate": 6.485694756371448e-05,
"loss": 0.2617,
"step": 80800
},
{
"epoch": 6.99,
"eval_loss": 0.08986030519008636,
"eval_runtime": 664.2336,
"eval_samples_per_second": 17.215,
"eval_steps_per_second": 2.153,
"eval_wer": 0.11516312616216826,
"step": 80800
},
{
"epoch": 7.01,
"learning_rate": 6.427106727858607e-05,
"loss": 0.2235,
"step": 81000
},
{
"epoch": 7.01,
"eval_loss": 0.0911833718419075,
"eval_runtime": 673.0343,
"eval_samples_per_second": 16.99,
"eval_steps_per_second": 2.125,
"eval_wer": 0.11346143010086211,
"step": 81000
},
{
"epoch": 7.03,
"learning_rate": 6.368518699345766e-05,
"loss": 0.2211,
"step": 81200
},
{
"epoch": 7.03,
"eval_loss": 0.09049921482801437,
"eval_runtime": 664.6179,
"eval_samples_per_second": 17.205,
"eval_steps_per_second": 2.152,
"eval_wer": 0.11221051445314702,
"step": 81200
},
{
"epoch": 7.05,
"learning_rate": 6.309930670832925e-05,
"loss": 0.2141,
"step": 81400
},
{
"epoch": 7.05,
"eval_loss": 0.09099965542554855,
"eval_runtime": 653.4138,
"eval_samples_per_second": 17.5,
"eval_steps_per_second": 2.189,
"eval_wer": 0.11219924494280724,
"step": 81400
},
{
"epoch": 7.07,
"learning_rate": 6.251342642320086e-05,
"loss": 0.2077,
"step": 81600
},
{
"epoch": 7.07,
"eval_loss": 0.0929802879691124,
"eval_runtime": 654.1785,
"eval_samples_per_second": 17.48,
"eval_steps_per_second": 2.186,
"eval_wer": 0.11382205443173495,
"step": 81600
},
{
"epoch": 7.09,
"learning_rate": 6.192754613807245e-05,
"loss": 0.2094,
"step": 81800
},
{
"epoch": 7.09,
"eval_loss": 0.09322798252105713,
"eval_runtime": 659.1034,
"eval_samples_per_second": 17.349,
"eval_steps_per_second": 2.17,
"eval_wer": 0.1118386206119344,
"step": 81800
},
{
"epoch": 7.11,
"learning_rate": 6.134166585294405e-05,
"loss": 0.221,
"step": 82000
},
{
"epoch": 7.11,
"eval_loss": 0.09150510281324387,
"eval_runtime": 660.2794,
"eval_samples_per_second": 17.318,
"eval_steps_per_second": 2.166,
"eval_wer": 0.110452470840142,
"step": 82000
},
{
"epoch": 7.13,
"learning_rate": 6.0755785567815635e-05,
"loss": 0.2132,
"step": 82200
},
{
"epoch": 7.13,
"eval_loss": 0.092040054500103,
"eval_runtime": 657.507,
"eval_samples_per_second": 17.391,
"eval_steps_per_second": 2.175,
"eval_wer": 0.11068913055727729,
"step": 82200
},
{
"epoch": 7.15,
"learning_rate": 6.016990528268724e-05,
"loss": 0.2157,
"step": 82400
},
{
"epoch": 7.15,
"eval_loss": 0.09085466712713242,
"eval_runtime": 665.7916,
"eval_samples_per_second": 17.175,
"eval_steps_per_second": 2.148,
"eval_wer": 0.1125373302530005,
"step": 82400
},
{
"epoch": 7.17,
"learning_rate": 5.958402499755883e-05,
"loss": 0.2246,
"step": 82600
},
{
"epoch": 7.17,
"eval_loss": 0.09079894423484802,
"eval_runtime": 660.1771,
"eval_samples_per_second": 17.321,
"eval_steps_per_second": 2.166,
"eval_wer": 0.11159069138445935,
"step": 82600
},
{
"epoch": 7.19,
"learning_rate": 5.899814471243042e-05,
"loss": 0.2181,
"step": 82800
},
{
"epoch": 7.19,
"eval_loss": 0.09172764420509338,
"eval_runtime": 661.7619,
"eval_samples_per_second": 17.28,
"eval_steps_per_second": 2.161,
"eval_wer": 0.11192877669465262,
"step": 82800
},
{
"epoch": 7.2,
"learning_rate": 5.841226442730202e-05,
"loss": 0.2203,
"step": 83000
},
{
"epoch": 7.2,
"eval_loss": 0.09090258926153183,
"eval_runtime": 662.2479,
"eval_samples_per_second": 17.267,
"eval_steps_per_second": 2.159,
"eval_wer": 0.11027215867470558,
"step": 83000
},
{
"epoch": 7.22,
"learning_rate": 5.782638414217361e-05,
"loss": 0.2191,
"step": 83200
},
{
"epoch": 7.22,
"eval_loss": 0.09051696956157684,
"eval_runtime": 662.1226,
"eval_samples_per_second": 17.27,
"eval_steps_per_second": 2.16,
"eval_wer": 0.109798839240435,
"step": 83200
},
{
"epoch": 7.24,
"learning_rate": 5.7240503857045205e-05,
"loss": 0.2252,
"step": 83400
},
{
"epoch": 7.24,
"eval_loss": 0.08852972090244293,
"eval_runtime": 663.1512,
"eval_samples_per_second": 17.243,
"eval_steps_per_second": 2.156,
"eval_wer": 0.1117484645292162,
"step": 83400
},
{
"epoch": 7.26,
"learning_rate": 5.6654623571916796e-05,
"loss": 0.2222,
"step": 83600
},
{
"epoch": 7.26,
"eval_loss": 0.0903807133436203,
"eval_runtime": 667.5255,
"eval_samples_per_second": 17.13,
"eval_steps_per_second": 2.142,
"eval_wer": 0.11038485377810334,
"step": 83600
},
{
"epoch": 7.28,
"learning_rate": 5.606874328678839e-05,
"loss": 0.2127,
"step": 83800
},
{
"epoch": 7.28,
"eval_loss": 0.09016119688749313,
"eval_runtime": 657.2492,
"eval_samples_per_second": 17.398,
"eval_steps_per_second": 2.176,
"eval_wer": 0.11103848537781033,
"step": 83800
},
{
"epoch": 7.3,
"learning_rate": 5.5482863001659984e-05,
"loss": 0.2145,
"step": 84000
},
{
"epoch": 7.3,
"eval_loss": 0.09145020693540573,
"eval_runtime": 658.2658,
"eval_samples_per_second": 17.371,
"eval_steps_per_second": 2.172,
"eval_wer": 0.11002422944723052,
"step": 84000
},
{
"epoch": 7.32,
"learning_rate": 5.489698271653159e-05,
"loss": 0.2256,
"step": 84200
},
{
"epoch": 7.32,
"eval_loss": 0.09001456201076508,
"eval_runtime": 660.2198,
"eval_samples_per_second": 17.32,
"eval_steps_per_second": 2.166,
"eval_wer": 0.11011438552994872,
"step": 84200
},
{
"epoch": 7.34,
"learning_rate": 5.431110243140318e-05,
"loss": 0.2334,
"step": 84400
},
{
"epoch": 7.34,
"eval_loss": 0.09009411185979843,
"eval_runtime": 657.4443,
"eval_samples_per_second": 17.393,
"eval_steps_per_second": 2.175,
"eval_wer": 0.11022708063334648,
"step": 84400
},
{
"epoch": 7.36,
"learning_rate": 5.3725222146274776e-05,
"loss": 0.2171,
"step": 84600
},
{
"epoch": 7.36,
"eval_loss": 0.08927768468856812,
"eval_runtime": 658.5101,
"eval_samples_per_second": 17.365,
"eval_steps_per_second": 2.172,
"eval_wer": 0.11080182566067505,
"step": 84600
},
{
"epoch": 7.38,
"learning_rate": 5.3139341861146366e-05,
"loss": 0.2247,
"step": 84800
},
{
"epoch": 7.38,
"eval_loss": 0.08871866762638092,
"eval_runtime": 657.6113,
"eval_samples_per_second": 17.389,
"eval_steps_per_second": 2.175,
"eval_wer": 0.10952837099228038,
"step": 84800
},
{
"epoch": 7.4,
"learning_rate": 5.2553461576017963e-05,
"loss": 0.225,
"step": 85000
},
{
"epoch": 7.4,
"eval_loss": 0.08847151696681976,
"eval_runtime": 657.4131,
"eval_samples_per_second": 17.394,
"eval_steps_per_second": 2.175,
"eval_wer": 0.10948329295092128,
"step": 85000
},
{
"epoch": 7.42,
"learning_rate": 5.1967581290889554e-05,
"loss": 0.2263,
"step": 85200
},
{
"epoch": 7.42,
"eval_loss": 0.08873692154884338,
"eval_runtime": 658.6562,
"eval_samples_per_second": 17.361,
"eval_steps_per_second": 2.171,
"eval_wer": 0.10950583197160084,
"step": 85200
},
{
"epoch": 7.44,
"learning_rate": 5.1384630407186794e-05,
"loss": 0.205,
"step": 85400
},
{
"epoch": 7.44,
"eval_loss": 0.08996891975402832,
"eval_runtime": 662.3112,
"eval_samples_per_second": 17.265,
"eval_steps_per_second": 2.159,
"eval_wer": 0.10919028568208711,
"step": 85400
},
{
"epoch": 7.46,
"learning_rate": 5.0798750122058385e-05,
"loss": 0.2153,
"step": 85600
},
{
"epoch": 7.46,
"eval_loss": 0.09001825749874115,
"eval_runtime": 663.8308,
"eval_samples_per_second": 17.226,
"eval_steps_per_second": 2.154,
"eval_wer": 0.10957344903363948,
"step": 85600
},
{
"epoch": 7.48,
"learning_rate": 5.021286983692998e-05,
"loss": 0.2175,
"step": 85800
},
{
"epoch": 7.48,
"eval_loss": 0.08824647217988968,
"eval_runtime": 665.8794,
"eval_samples_per_second": 17.173,
"eval_steps_per_second": 2.148,
"eval_wer": 0.10828872485490505,
"step": 85800
},
{
"epoch": 7.5,
"learning_rate": 4.962698955180157e-05,
"loss": 0.2169,
"step": 86000
},
{
"epoch": 7.5,
"eval_loss": 0.08869241178035736,
"eval_runtime": 664.8058,
"eval_samples_per_second": 17.201,
"eval_steps_per_second": 2.151,
"eval_wer": 0.10858173212373923,
"step": 86000
},
{
"epoch": 7.52,
"learning_rate": 4.904110926667317e-05,
"loss": 0.2234,
"step": 86200
},
{
"epoch": 7.52,
"eval_loss": 0.08755665272474289,
"eval_runtime": 662.3879,
"eval_samples_per_second": 17.263,
"eval_steps_per_second": 2.159,
"eval_wer": 0.10818729926184707,
"step": 86200
},
{
"epoch": 7.54,
"learning_rate": 4.845522898154476e-05,
"loss": 0.2112,
"step": 86400
},
{
"epoch": 7.54,
"eval_loss": 0.08796130865812302,
"eval_runtime": 660.9811,
"eval_samples_per_second": 17.3,
"eval_steps_per_second": 2.163,
"eval_wer": 0.10853665408238013,
"step": 86400
},
{
"epoch": 7.55,
"learning_rate": 4.7869348696416365e-05,
"loss": 0.2122,
"step": 86600
},
{
"epoch": 7.55,
"eval_loss": 0.08818641304969788,
"eval_runtime": 659.8525,
"eval_samples_per_second": 17.33,
"eval_steps_per_second": 2.167,
"eval_wer": 0.10849157604102101,
"step": 86600
},
{
"epoch": 7.57,
"learning_rate": 4.728639781271359e-05,
"loss": 0.2134,
"step": 86800
},
{
"epoch": 7.57,
"eval_loss": 0.08850608021020889,
"eval_runtime": 663.3892,
"eval_samples_per_second": 17.237,
"eval_steps_per_second": 2.156,
"eval_wer": 0.10823237730320617,
"step": 86800
},
{
"epoch": 7.59,
"learning_rate": 4.6700517527585196e-05,
"loss": 0.2218,
"step": 87000
},
{
"epoch": 7.59,
"eval_loss": 0.08732796460390091,
"eval_runtime": 663.6661,
"eval_samples_per_second": 17.23,
"eval_steps_per_second": 2.155,
"eval_wer": 0.10806333464810954,
"step": 87000
},
{
"epoch": 7.61,
"learning_rate": 4.6114637242456786e-05,
"loss": 0.2098,
"step": 87200
},
{
"epoch": 7.61,
"eval_loss": 0.08799753338098526,
"eval_runtime": 660.746,
"eval_samples_per_second": 17.306,
"eval_steps_per_second": 2.164,
"eval_wer": 0.1077590578689356,
"step": 87200
},
{
"epoch": 7.63,
"learning_rate": 4.5528756957328383e-05,
"loss": 0.2185,
"step": 87400
},
{
"epoch": 7.63,
"eval_loss": 0.08814089745283127,
"eval_runtime": 659.5596,
"eval_samples_per_second": 17.337,
"eval_steps_per_second": 2.168,
"eval_wer": 0.10757874570349918,
"step": 87400
},
{
"epoch": 7.65,
"learning_rate": 4.4942876672199974e-05,
"loss": 0.2036,
"step": 87600
},
{
"epoch": 7.65,
"eval_loss": 0.08803264051675797,
"eval_runtime": 659.0171,
"eval_samples_per_second": 17.352,
"eval_steps_per_second": 2.17,
"eval_wer": 0.10823237730320617,
"step": 87600
},
{
"epoch": 7.67,
"learning_rate": 4.435699638707157e-05,
"loss": 0.2064,
"step": 87800
},
{
"epoch": 7.67,
"eval_loss": 0.08712273836135864,
"eval_runtime": 663.9763,
"eval_samples_per_second": 17.222,
"eval_steps_per_second": 2.154,
"eval_wer": 0.10770271031723672,
"step": 87800
},
{
"epoch": 7.69,
"learning_rate": 4.377111610194316e-05,
"loss": 0.2141,
"step": 88000
},
{
"epoch": 7.69,
"eval_loss": 0.08767861127853394,
"eval_runtime": 653.4457,
"eval_samples_per_second": 17.5,
"eval_steps_per_second": 2.188,
"eval_wer": 0.10619259593170677,
"step": 88000
},
{
"epoch": 7.71,
"learning_rate": 4.318523581681476e-05,
"loss": 0.2168,
"step": 88200
},
{
"epoch": 7.71,
"eval_loss": 0.0869930163025856,
"eval_runtime": 653.5133,
"eval_samples_per_second": 17.498,
"eval_steps_per_second": 2.188,
"eval_wer": 0.10565165943539753,
"step": 88200
},
{
"epoch": 7.73,
"learning_rate": 4.259935553168635e-05,
"loss": 0.2157,
"step": 88400
},
{
"epoch": 7.73,
"eval_loss": 0.0869561955332756,
"eval_runtime": 657.2321,
"eval_samples_per_second": 17.399,
"eval_steps_per_second": 2.176,
"eval_wer": 0.10656448977291937,
"step": 88400
},
{
"epoch": 7.75,
"learning_rate": 4.2013475246557954e-05,
"loss": 0.2151,
"step": 88600
},
{
"epoch": 7.75,
"eval_loss": 0.08736027032136917,
"eval_runtime": 655.7458,
"eval_samples_per_second": 17.438,
"eval_steps_per_second": 2.181,
"eval_wer": 0.10630529103510453,
"step": 88600
},
{
"epoch": 7.77,
"learning_rate": 4.1427594961429544e-05,
"loss": 0.2115,
"step": 88800
},
{
"epoch": 7.77,
"eval_loss": 0.0879904106259346,
"eval_runtime": 656.2337,
"eval_samples_per_second": 17.425,
"eval_steps_per_second": 2.179,
"eval_wer": 0.10746605060010142,
"step": 88800
},
{
"epoch": 7.79,
"learning_rate": 4.084171467630114e-05,
"loss": 0.2125,
"step": 89000
},
{
"epoch": 7.79,
"eval_loss": 0.08856356143951416,
"eval_runtime": 658.7488,
"eval_samples_per_second": 17.359,
"eval_steps_per_second": 2.171,
"eval_wer": 0.10648560320054094,
"step": 89000
},
{
"epoch": 7.81,
"learning_rate": 4.0258763792598375e-05,
"loss": 0.2036,
"step": 89200
},
{
"epoch": 7.81,
"eval_loss": 0.08776041120290756,
"eval_runtime": 656.4464,
"eval_samples_per_second": 17.42,
"eval_steps_per_second": 2.178,
"eval_wer": 0.10588831915253283,
"step": 89200
},
{
"epoch": 7.83,
"learning_rate": 3.967288350746997e-05,
"loss": 0.2199,
"step": 89400
},
{
"epoch": 7.83,
"eval_loss": 0.08602162450551987,
"eval_runtime": 658.2289,
"eval_samples_per_second": 17.372,
"eval_steps_per_second": 2.172,
"eval_wer": 0.10615878740068745,
"step": 89400
},
{
"epoch": 8.02,
"learning_rate": 3.908700322234156e-05,
"loss": 0.2055,
"step": 89600
},
{
"epoch": 8.02,
"eval_loss": 0.08735963702201843,
"eval_runtime": 649.7905,
"eval_samples_per_second": 17.598,
"eval_steps_per_second": 2.201,
"eval_wer": 0.10638417760748295,
"step": 89600
},
{
"epoch": 8.04,
"learning_rate": 3.850112293721316e-05,
"loss": 0.2011,
"step": 89800
},
{
"epoch": 8.04,
"eval_loss": 0.08764158189296722,
"eval_runtime": 640.7104,
"eval_samples_per_second": 17.847,
"eval_steps_per_second": 2.232,
"eval_wer": 0.10567419845607709,
"step": 89800
},
{
"epoch": 8.06,
"learning_rate": 3.791524265208475e-05,
"loss": 0.2018,
"step": 90000
},
{
"epoch": 8.06,
"eval_loss": 0.08688807487487793,
"eval_runtime": 642.3443,
"eval_samples_per_second": 17.802,
"eval_steps_per_second": 2.226,
"eval_wer": 0.10522341804248606,
"step": 90000
},
{
"epoch": 8.08,
"learning_rate": 3.732936236695635e-05,
"loss": 0.2052,
"step": 90200
},
{
"epoch": 8.08,
"eval_loss": 0.08650859445333481,
"eval_runtime": 640.5273,
"eval_samples_per_second": 17.852,
"eval_steps_per_second": 2.233,
"eval_wer": 0.10556150335267933,
"step": 90200
},
{
"epoch": 8.1,
"learning_rate": 3.6743482081827945e-05,
"loss": 0.2128,
"step": 90400
},
{
"epoch": 8.1,
"eval_loss": 0.08721867948770523,
"eval_runtime": 644.1835,
"eval_samples_per_second": 17.751,
"eval_steps_per_second": 2.22,
"eval_wer": 0.10627148250408519,
"step": 90400
},
{
"epoch": 8.12,
"learning_rate": 3.616053119812518e-05,
"loss": 0.2054,
"step": 90600
},
{
"epoch": 8.12,
"eval_loss": 0.08693686872720718,
"eval_runtime": 640.4586,
"eval_samples_per_second": 17.854,
"eval_steps_per_second": 2.233,
"eval_wer": 0.10453597791175974,
"step": 90600
},
{
"epoch": 8.14,
"learning_rate": 3.5574650912996776e-05,
"loss": 0.2064,
"step": 90800
},
{
"epoch": 8.14,
"eval_loss": 0.08682414889335632,
"eval_runtime": 645.5348,
"eval_samples_per_second": 17.714,
"eval_steps_per_second": 2.215,
"eval_wer": 0.10422043162224601,
"step": 90800
},
{
"epoch": 8.16,
"learning_rate": 3.4988770627868374e-05,
"loss": 0.2003,
"step": 91000
},
{
"epoch": 8.16,
"eval_loss": 0.08698801696300507,
"eval_runtime": 642.0155,
"eval_samples_per_second": 17.811,
"eval_steps_per_second": 2.227,
"eval_wer": 0.10504310587704964,
"step": 91000
},
{
"epoch": 8.17,
"learning_rate": 3.4402890342739964e-05,
"loss": 0.2051,
"step": 91200
},
{
"epoch": 8.17,
"eval_loss": 0.08681213855743408,
"eval_runtime": 639.0151,
"eval_samples_per_second": 17.895,
"eval_steps_per_second": 2.238,
"eval_wer": 0.10517834000112695,
"step": 91200
},
{
"epoch": 8.19,
"learning_rate": 3.381701005761156e-05,
"loss": 0.205,
"step": 91400
},
{
"epoch": 8.19,
"eval_loss": 0.08681774884462357,
"eval_runtime": 647.2922,
"eval_samples_per_second": 17.666,
"eval_steps_per_second": 2.209,
"eval_wer": 0.10460359497379838,
"step": 91400
},
{
"epoch": 8.21,
"learning_rate": 3.323112977248315e-05,
"loss": 0.2045,
"step": 91600
},
{
"epoch": 8.21,
"eval_loss": 0.08683190494775772,
"eval_runtime": 640.6094,
"eval_samples_per_second": 17.85,
"eval_steps_per_second": 2.232,
"eval_wer": 0.10384853778103341,
"step": 91600
},
{
"epoch": 8.23,
"learning_rate": 3.264524948735475e-05,
"loss": 0.2073,
"step": 91800
},
{
"epoch": 8.23,
"eval_loss": 0.08680137246847153,
"eval_runtime": 644.4426,
"eval_samples_per_second": 17.744,
"eval_steps_per_second": 2.219,
"eval_wer": 0.10420916211190624,
"step": 91800
},
{
"epoch": 8.25,
"learning_rate": 3.205936920222635e-05,
"loss": 0.1989,
"step": 92000
},
{
"epoch": 8.25,
"eval_loss": 0.08712614327669144,
"eval_runtime": 642.565,
"eval_samples_per_second": 17.796,
"eval_steps_per_second": 2.225,
"eval_wer": 0.10425424015326534,
"step": 92000
},
{
"epoch": 8.27,
"learning_rate": 3.147348891709794e-05,
"loss": 0.1929,
"step": 92200
},
{
"epoch": 8.27,
"eval_loss": 0.08767101913690567,
"eval_runtime": 645.2302,
"eval_samples_per_second": 17.722,
"eval_steps_per_second": 2.216,
"eval_wer": 0.10409646700850848,
"step": 92200
},
{
"epoch": 8.29,
"learning_rate": 3.0887608631969534e-05,
"loss": 0.2116,
"step": 92400
},
{
"epoch": 8.29,
"eval_loss": 0.08523967117071152,
"eval_runtime": 645.8547,
"eval_samples_per_second": 17.705,
"eval_steps_per_second": 2.214,
"eval_wer": 0.10381472925001409,
"step": 92400
},
{
"epoch": 8.31,
"learning_rate": 3.030172834684113e-05,
"loss": 0.1991,
"step": 92600
},
{
"epoch": 8.31,
"eval_loss": 0.08694258332252502,
"eval_runtime": 638.7288,
"eval_samples_per_second": 17.903,
"eval_steps_per_second": 2.239,
"eval_wer": 0.10360060855355835,
"step": 92600
},
{
"epoch": 8.33,
"learning_rate": 2.971584806171272e-05,
"loss": 0.2045,
"step": 92800
},
{
"epoch": 8.33,
"eval_loss": 0.08679590374231339,
"eval_runtime": 641.8956,
"eval_samples_per_second": 17.814,
"eval_steps_per_second": 2.228,
"eval_wer": 0.10344283540880149,
"step": 92800
},
{
"epoch": 8.35,
"learning_rate": 2.9129967776584313e-05,
"loss": 0.2081,
"step": 93000
},
{
"epoch": 8.35,
"eval_loss": 0.0871407687664032,
"eval_runtime": 641.4271,
"eval_samples_per_second": 17.827,
"eval_steps_per_second": 2.229,
"eval_wer": 0.10428804868428466,
"step": 93000
},
{
"epoch": 8.37,
"learning_rate": 2.8544087491455907e-05,
"loss": 0.1915,
"step": 93200
},
{
"epoch": 8.37,
"eval_loss": 0.0871988832950592,
"eval_runtime": 645.7411,
"eval_samples_per_second": 17.708,
"eval_steps_per_second": 2.215,
"eval_wer": 0.10367949512593677,
"step": 93200
},
{
"epoch": 8.39,
"learning_rate": 2.7958207206327504e-05,
"loss": 0.1893,
"step": 93400
},
{
"epoch": 8.39,
"eval_loss": 0.08661910146474838,
"eval_runtime": 641.6227,
"eval_samples_per_second": 17.822,
"eval_steps_per_second": 2.229,
"eval_wer": 0.1032512537330253,
"step": 93400
},
{
"epoch": 8.41,
"learning_rate": 2.7372326921199098e-05,
"loss": 0.1927,
"step": 93600
},
{
"epoch": 8.41,
"eval_loss": 0.08692566305398941,
"eval_runtime": 645.917,
"eval_samples_per_second": 17.704,
"eval_steps_per_second": 2.214,
"eval_wer": 0.1028342818504536,
"step": 93600
},
{
"epoch": 8.43,
"learning_rate": 2.6786446636070692e-05,
"loss": 0.1987,
"step": 93800
},
{
"epoch": 8.43,
"eval_loss": 0.08724019676446915,
"eval_runtime": 641.5,
"eval_samples_per_second": 17.825,
"eval_steps_per_second": 2.229,
"eval_wer": 0.10263143066433764,
"step": 93800
},
{
"epoch": 8.45,
"learning_rate": 2.6200566350942286e-05,
"loss": 0.2088,
"step": 94000
},
{
"epoch": 8.45,
"eval_loss": 0.08689233660697937,
"eval_runtime": 638.7681,
"eval_samples_per_second": 17.902,
"eval_steps_per_second": 2.239,
"eval_wer": 0.10304840254690933,
"step": 94000
},
{
"epoch": 8.47,
"learning_rate": 2.5614686065813883e-05,
"loss": 0.1929,
"step": 94200
},
{
"epoch": 8.47,
"eval_loss": 0.08683472126722336,
"eval_runtime": 643.1191,
"eval_samples_per_second": 17.781,
"eval_steps_per_second": 2.224,
"eval_wer": 0.10273285625739562,
"step": 94200
},
{
"epoch": 8.49,
"learning_rate": 2.5028805780685477e-05,
"loss": 0.1931,
"step": 94400
},
{
"epoch": 8.49,
"eval_loss": 0.08680200576782227,
"eval_runtime": 643.6223,
"eval_samples_per_second": 17.767,
"eval_steps_per_second": 2.222,
"eval_wer": 0.1028342818504536,
"step": 94400
},
{
"epoch": 8.51,
"learning_rate": 2.4445854896982714e-05,
"loss": 0.2008,
"step": 94600
},
{
"epoch": 8.51,
"eval_loss": 0.08561909943819046,
"eval_runtime": 640.5789,
"eval_samples_per_second": 17.851,
"eval_steps_per_second": 2.232,
"eval_wer": 0.10308221107792867,
"step": 94600
},
{
"epoch": 8.52,
"learning_rate": 2.3859974611854308e-05,
"loss": 0.1971,
"step": 94800
},
{
"epoch": 8.52,
"eval_loss": 0.0856679379940033,
"eval_runtime": 643.6696,
"eval_samples_per_second": 17.765,
"eval_steps_per_second": 2.222,
"eval_wer": 0.10286809038147293,
"step": 94800
},
{
"epoch": 8.54,
"learning_rate": 2.3274094326725902e-05,
"loss": 0.1915,
"step": 95000
},
{
"epoch": 8.54,
"eval_loss": 0.08586091548204422,
"eval_runtime": 644.3313,
"eval_samples_per_second": 17.747,
"eval_steps_per_second": 2.219,
"eval_wer": 0.10251873556093988,
"step": 95000
},
{
"epoch": 8.56,
"learning_rate": 2.2691143443023142e-05,
"loss": 0.2011,
"step": 95200
},
{
"epoch": 8.56,
"eval_loss": 0.08547823131084442,
"eval_runtime": 642.5453,
"eval_samples_per_second": 17.796,
"eval_steps_per_second": 2.226,
"eval_wer": 0.10172986983715558,
"step": 95200
},
{
"epoch": 8.58,
"learning_rate": 2.2105263157894733e-05,
"loss": 0.1931,
"step": 95400
},
{
"epoch": 8.58,
"eval_loss": 0.0860673114657402,
"eval_runtime": 644.3949,
"eval_samples_per_second": 17.745,
"eval_steps_per_second": 2.219,
"eval_wer": 0.10129035893390433,
"step": 95400
},
{
"epoch": 8.6,
"learning_rate": 2.1519382872766327e-05,
"loss": 0.2008,
"step": 95600
},
{
"epoch": 8.6,
"eval_loss": 0.08597339689731598,
"eval_runtime": 643.5265,
"eval_samples_per_second": 17.769,
"eval_steps_per_second": 2.222,
"eval_wer": 0.10132416746492365,
"step": 95600
},
{
"epoch": 8.62,
"learning_rate": 2.093350258763792e-05,
"loss": 0.2045,
"step": 95800
},
{
"epoch": 8.62,
"eval_loss": 0.08469708263874054,
"eval_runtime": 649.2866,
"eval_samples_per_second": 17.612,
"eval_steps_per_second": 2.202,
"eval_wer": 0.10094100411337127,
"step": 95800
},
{
"epoch": 8.64,
"learning_rate": 2.0347622302509518e-05,
"loss": 0.2027,
"step": 96000
},
{
"epoch": 8.64,
"eval_loss": 0.0852479636669159,
"eval_runtime": 641.0893,
"eval_samples_per_second": 17.837,
"eval_steps_per_second": 2.231,
"eval_wer": 0.10149321012002029,
"step": 96000
},
{
"epoch": 8.66,
"learning_rate": 1.9761742017381112e-05,
"loss": 0.1984,
"step": 96200
},
{
"epoch": 8.66,
"eval_loss": 0.08589636534452438,
"eval_runtime": 636.8856,
"eval_samples_per_second": 17.955,
"eval_steps_per_second": 2.245,
"eval_wer": 0.10201160759564996,
"step": 96200
},
{
"epoch": 8.68,
"learning_rate": 1.9175861732252706e-05,
"loss": 0.1946,
"step": 96400
},
{
"epoch": 8.68,
"eval_loss": 0.08547361940145493,
"eval_runtime": 640.9334,
"eval_samples_per_second": 17.841,
"eval_steps_per_second": 2.231,
"eval_wer": 0.1017636783681749,
"step": 96400
},
{
"epoch": 8.7,
"learning_rate": 1.8589981447124303e-05,
"loss": 0.1991,
"step": 96600
},
{
"epoch": 8.7,
"eval_loss": 0.08481213450431824,
"eval_runtime": 641.2548,
"eval_samples_per_second": 17.832,
"eval_steps_per_second": 2.23,
"eval_wer": 0.101808756409534,
"step": 96600
},
{
"epoch": 8.72,
"learning_rate": 1.8004101161995897e-05,
"loss": 0.1936,
"step": 96800
},
{
"epoch": 8.72,
"eval_loss": 0.08544305711984634,
"eval_runtime": 645.1596,
"eval_samples_per_second": 17.724,
"eval_steps_per_second": 2.217,
"eval_wer": 0.10132416746492365,
"step": 96800
},
{
"epoch": 8.74,
"learning_rate": 1.7418220876867494e-05,
"loss": 0.1965,
"step": 97000
},
{
"epoch": 8.74,
"eval_loss": 0.0854332447052002,
"eval_runtime": 639.5304,
"eval_samples_per_second": 17.88,
"eval_steps_per_second": 2.236,
"eval_wer": 0.10099735166507015,
"step": 97000
},
{
"epoch": 8.76,
"learning_rate": 1.6832340591739088e-05,
"loss": 0.1906,
"step": 97200
},
{
"epoch": 8.76,
"eval_loss": 0.08577127009630203,
"eval_runtime": 639.6566,
"eval_samples_per_second": 17.877,
"eval_steps_per_second": 2.236,
"eval_wer": 0.10094100411337127,
"step": 97200
},
{
"epoch": 8.78,
"learning_rate": 1.6246460306610682e-05,
"loss": 0.1938,
"step": 97400
},
{
"epoch": 8.78,
"eval_loss": 0.08535514771938324,
"eval_runtime": 643.0482,
"eval_samples_per_second": 17.782,
"eval_steps_per_second": 2.224,
"eval_wer": 0.10100862117540993,
"step": 97400
},
{
"epoch": 8.8,
"learning_rate": 1.5660580021482276e-05,
"loss": 0.2027,
"step": 97600
},
{
"epoch": 8.8,
"eval_loss": 0.08470670878887177,
"eval_runtime": 638.835,
"eval_samples_per_second": 17.9,
"eval_steps_per_second": 2.238,
"eval_wer": 0.10085084803065307,
"step": 97600
},
{
"epoch": 8.82,
"learning_rate": 1.507469973635387e-05,
"loss": 0.1932,
"step": 97800
},
{
"epoch": 8.82,
"eval_loss": 0.0843362957239151,
"eval_runtime": 643.5712,
"eval_samples_per_second": 17.768,
"eval_steps_per_second": 2.222,
"eval_wer": 0.10097481264439061,
"step": 97800
},
{
"epoch": 8.84,
"learning_rate": 1.4488819451225464e-05,
"loss": 0.1857,
"step": 98000
},
{
"epoch": 8.84,
"eval_loss": 0.08466717600822449,
"eval_runtime": 644.2589,
"eval_samples_per_second": 17.749,
"eval_steps_per_second": 2.22,
"eval_wer": 0.1001408688792472,
"step": 98000
},
{
"epoch": 8.86,
"learning_rate": 1.390293916609706e-05,
"loss": 0.1871,
"step": 98200
},
{
"epoch": 8.86,
"eval_loss": 0.08466171473264694,
"eval_runtime": 645.4241,
"eval_samples_per_second": 17.717,
"eval_steps_per_second": 2.216,
"eval_wer": 0.10034372006536316,
"step": 98200
},
{
"epoch": 8.87,
"learning_rate": 1.3317058880968653e-05,
"loss": 0.1917,
"step": 98400
},
{
"epoch": 8.87,
"eval_loss": 0.08486426621675491,
"eval_runtime": 640.712,
"eval_samples_per_second": 17.847,
"eval_steps_per_second": 2.232,
"eval_wer": 0.10045641516876092,
"step": 98400
},
{
"epoch": 8.89,
"learning_rate": 1.2731178595840249e-05,
"loss": 0.2035,
"step": 98600
},
{
"epoch": 8.89,
"eval_loss": 0.08421877771615982,
"eval_runtime": 643.294,
"eval_samples_per_second": 17.776,
"eval_steps_per_second": 2.223,
"eval_wer": 0.100050712796529,
"step": 98600
},
{
"epoch": 8.91,
"learning_rate": 1.2145298310711843e-05,
"loss": 0.1946,
"step": 98800
},
{
"epoch": 8.91,
"eval_loss": 0.08399970084428787,
"eval_runtime": 640.6136,
"eval_samples_per_second": 17.85,
"eval_steps_per_second": 2.232,
"eval_wer": 0.1000957908378881,
"step": 98800
},
{
"epoch": 8.93,
"learning_rate": 1.1559418025583438e-05,
"loss": 0.2038,
"step": 99000
},
{
"epoch": 8.93,
"eval_loss": 0.08454040437936783,
"eval_runtime": 643.6723,
"eval_samples_per_second": 17.765,
"eval_steps_per_second": 2.222,
"eval_wer": 0.10106496872710881,
"step": 99000
},
{
"epoch": 8.95,
"learning_rate": 1.0973537740455032e-05,
"loss": 0.2043,
"step": 99200
},
{
"epoch": 8.95,
"eval_loss": 0.08372523635625839,
"eval_runtime": 644.4701,
"eval_samples_per_second": 17.743,
"eval_steps_per_second": 2.219,
"eval_wer": 0.10090719558235195,
"step": 99200
},
{
"epoch": 8.97,
"learning_rate": 1.0387657455326628e-05,
"loss": 0.2244,
"step": 99400
},
{
"epoch": 8.97,
"eval_loss": 0.08242122083902359,
"eval_runtime": 643.4311,
"eval_samples_per_second": 17.772,
"eval_steps_per_second": 2.222,
"eval_wer": 0.10090719558235195,
"step": 99400
},
{
"epoch": 8.99,
"learning_rate": 9.801777170198222e-06,
"loss": 0.2166,
"step": 99600
},
{
"epoch": 8.99,
"eval_loss": 0.08180003613233566,
"eval_runtime": 642.4939,
"eval_samples_per_second": 17.798,
"eval_steps_per_second": 2.226,
"eval_wer": 0.09989293965177214,
"step": 99600
},
{
"epoch": 9.01,
"learning_rate": 9.215896885069816e-06,
"loss": 0.1912,
"step": 99800
},
{
"epoch": 9.01,
"eval_loss": 0.0824543908238411,
"eval_runtime": 639.0239,
"eval_samples_per_second": 17.894,
"eval_steps_per_second": 2.238,
"eval_wer": 0.0998591311207528,
"step": 99800
},
{
"epoch": 9.03,
"learning_rate": 8.630016599941411e-06,
"loss": 0.1859,
"step": 100000
},
{
"epoch": 9.03,
"eval_loss": 0.08340790867805481,
"eval_runtime": 641.2003,
"eval_samples_per_second": 17.834,
"eval_steps_per_second": 2.23,
"eval_wer": 0.09992674818279146,
"step": 100000
},
{
"epoch": 9.05,
"learning_rate": 8.044136314813005e-06,
"loss": 0.1773,
"step": 100200
},
{
"epoch": 9.05,
"eval_loss": 0.08390292525291443,
"eval_runtime": 643.4716,
"eval_samples_per_second": 17.771,
"eval_steps_per_second": 2.222,
"eval_wer": 0.0995773933622584,
"step": 100200
},
{
"epoch": 9.07,
"learning_rate": 7.458256029684601e-06,
"loss": 0.1782,
"step": 100400
},
{
"epoch": 9.07,
"eval_loss": 0.08477972447872162,
"eval_runtime": 656.0288,
"eval_samples_per_second": 17.431,
"eval_steps_per_second": 2.18,
"eval_wer": 0.09971262748633572,
"step": 100400
},
{
"epoch": 9.09,
"learning_rate": 6.875305145981837e-06,
"loss": 0.1756,
"step": 100600
},
{
"epoch": 9.09,
"eval_loss": 0.08468695729970932,
"eval_runtime": 639.7418,
"eval_samples_per_second": 17.874,
"eval_steps_per_second": 2.235,
"eval_wer": 0.09964501042429706,
"step": 100600
},
{
"epoch": 9.11,
"learning_rate": 6.289424860853432e-06,
"loss": 0.1922,
"step": 100800
},
{
"epoch": 9.11,
"eval_loss": 0.08449111133813858,
"eval_runtime": 644.0375,
"eval_samples_per_second": 17.755,
"eval_steps_per_second": 2.22,
"eval_wer": 0.09962247140361752,
"step": 100800
},
{
"epoch": 9.13,
"learning_rate": 5.7035445757250265e-06,
"loss": 0.1859,
"step": 101000
},
{
"epoch": 9.13,
"eval_loss": 0.08459131419658661,
"eval_runtime": 642.2544,
"eval_samples_per_second": 17.804,
"eval_steps_per_second": 2.227,
"eval_wer": 0.09975770552769482,
"step": 101000
},
{
"epoch": 9.15,
"learning_rate": 5.117664290596621e-06,
"loss": 0.1845,
"step": 101200
},
{
"epoch": 9.15,
"eval_loss": 0.08437124639749527,
"eval_runtime": 642.6621,
"eval_samples_per_second": 17.793,
"eval_steps_per_second": 2.225,
"eval_wer": 0.09970135797599594,
"step": 101200
},
{
"epoch": 9.17,
"learning_rate": 4.531784005468216e-06,
"loss": 0.1956,
"step": 101400
},
{
"epoch": 9.17,
"eval_loss": 0.08400815725326538,
"eval_runtime": 639.7693,
"eval_samples_per_second": 17.874,
"eval_steps_per_second": 2.235,
"eval_wer": 0.09974643601735504,
"step": 101400
},
{
"epoch": 9.19,
"learning_rate": 3.945903720339811e-06,
"loss": 0.1915,
"step": 101600
},
{
"epoch": 9.19,
"eval_loss": 0.0842614620923996,
"eval_runtime": 639.7904,
"eval_samples_per_second": 17.873,
"eval_steps_per_second": 2.235,
"eval_wer": 0.09966754944497662,
"step": 101600
},
{
"epoch": 9.2,
"learning_rate": 3.360023435211405e-06,
"loss": 0.1876,
"step": 101800
},
{
"epoch": 9.2,
"eval_loss": 0.08413951843976974,
"eval_runtime": 638.0015,
"eval_samples_per_second": 17.923,
"eval_steps_per_second": 2.241,
"eval_wer": 0.09988167014143236,
"step": 101800
},
{
"epoch": 9.22,
"learning_rate": 2.7741431500829998e-06,
"loss": 0.1898,
"step": 102000
},
{
"epoch": 9.22,
"eval_loss": 0.08397097885608673,
"eval_runtime": 635.7725,
"eval_samples_per_second": 17.986,
"eval_steps_per_second": 2.249,
"eval_wer": 0.09959993238293796,
"step": 102000
},
{
"epoch": 9.24,
"learning_rate": 2.188262864954594e-06,
"loss": 0.2012,
"step": 102200
},
{
"epoch": 9.24,
"eval_loss": 0.08381262421607971,
"eval_runtime": 637.045,
"eval_samples_per_second": 17.95,
"eval_steps_per_second": 2.245,
"eval_wer": 0.09993801769313124,
"step": 102200
},
{
"epoch": 9.26,
"learning_rate": 1.6023825798261886e-06,
"loss": 0.1891,
"step": 102400
},
{
"epoch": 9.26,
"eval_loss": 0.0839412659406662,
"eval_runtime": 636.5331,
"eval_samples_per_second": 17.965,
"eval_steps_per_second": 2.247,
"eval_wer": 0.0996788189553164,
"step": 102400
},
{
"epoch": 9.28,
"learning_rate": 1.0165022946977834e-06,
"loss": 0.1746,
"step": 102600
},
{
"epoch": 9.28,
"eval_loss": 0.08403033018112183,
"eval_runtime": 633.7847,
"eval_samples_per_second": 18.042,
"eval_steps_per_second": 2.256,
"eval_wer": 0.09998309573449034,
"step": 102600
},
{
"epoch": 9.3,
"learning_rate": 4.3355141099501997e-07,
"loss": 0.1859,
"step": 102800
},
{
"epoch": 9.3,
"eval_loss": 0.08405481278896332,
"eval_runtime": 633.0898,
"eval_samples_per_second": 18.062,
"eval_steps_per_second": 2.259,
"eval_wer": 0.09982532258973348,
"step": 102800
},
{
"epoch": 9.31,
"step": 102910,
"total_flos": 1.7369851149894887e+20,
"train_loss": 0.025842480747058687,
"train_runtime": 56787.2686,
"train_samples_per_second": 18.122,
"train_steps_per_second": 1.812
}
],
"max_steps": 102910,
"num_train_epochs": 10,
"total_flos": 1.7369851149894887e+20,
"trial_name": null,
"trial_params": null
}