wav2vec2-large-xlsr-53-Georgian / trainer_state.json
MehdiHosseiniMoghadam's picture
Add model files
9db48fb
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 112.12090680100755,
"global_step": 22200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.01,
"learning_rate": 0.0003,
"loss": 6.4459,
"step": 200
},
{
"epoch": 1.01,
"eval_loss": 3.1488852500915527,
"eval_runtime": 134.1012,
"eval_samples_per_second": 4.892,
"eval_wer": 1.0,
"step": 200
},
{
"epoch": 2.02,
"learning_rate": 0.00029898648648648646,
"loss": 3.0913,
"step": 400
},
{
"epoch": 2.02,
"eval_loss": 3.1127500534057617,
"eval_runtime": 138.7081,
"eval_samples_per_second": 4.729,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 3.03,
"learning_rate": 0.00029797297297297294,
"loss": 3.0716,
"step": 600
},
{
"epoch": 3.03,
"eval_loss": 3.0870425701141357,
"eval_runtime": 138.315,
"eval_samples_per_second": 4.743,
"eval_wer": 1.0,
"step": 600
},
{
"epoch": 4.04,
"learning_rate": 0.0002969594594594594,
"loss": 3.0298,
"step": 800
},
{
"epoch": 4.04,
"eval_loss": 3.0003437995910645,
"eval_runtime": 134.8731,
"eval_samples_per_second": 4.864,
"eval_wer": 1.0,
"step": 800
},
{
"epoch": 5.05,
"learning_rate": 0.0002959459459459459,
"loss": 1.728,
"step": 1000
},
{
"epoch": 5.05,
"eval_loss": 0.805480420589447,
"eval_runtime": 135.0581,
"eval_samples_per_second": 4.857,
"eval_wer": 0.8985599322321051,
"step": 1000
},
{
"epoch": 6.06,
"learning_rate": 0.0002949324324324324,
"loss": 0.6228,
"step": 1200
},
{
"epoch": 6.06,
"eval_loss": 0.6153338551521301,
"eval_runtime": 138.3824,
"eval_samples_per_second": 4.74,
"eval_wer": 0.8263447691656078,
"step": 1200
},
{
"epoch": 7.07,
"learning_rate": 0.0002939189189189189,
"loss": 0.4109,
"step": 1400
},
{
"epoch": 7.07,
"eval_loss": 0.5761246085166931,
"eval_runtime": 136.2401,
"eval_samples_per_second": 4.815,
"eval_wer": 0.8009318085556968,
"step": 1400
},
{
"epoch": 8.08,
"learning_rate": 0.00029290540540540536,
"loss": 0.3384,
"step": 1600
},
{
"epoch": 8.08,
"eval_loss": 0.6021555662155151,
"eval_runtime": 135.414,
"eval_samples_per_second": 4.844,
"eval_wer": 0.7981787378229563,
"step": 1600
},
{
"epoch": 9.09,
"learning_rate": 0.0002918918918918919,
"loss": 0.2676,
"step": 1800
},
{
"epoch": 9.09,
"eval_loss": 0.556929349899292,
"eval_runtime": 136.0159,
"eval_samples_per_second": 4.823,
"eval_wer": 0.7505294366793731,
"step": 1800
},
{
"epoch": 10.1,
"learning_rate": 0.0002908783783783784,
"loss": 0.2321,
"step": 2000
},
{
"epoch": 10.1,
"eval_loss": 0.6468214392662048,
"eval_runtime": 135.5988,
"eval_samples_per_second": 4.838,
"eval_wer": 0.7736128759000424,
"step": 2000
},
{
"epoch": 11.11,
"learning_rate": 0.00028986486486486487,
"loss": 0.2031,
"step": 2200
},
{
"epoch": 11.11,
"eval_loss": 0.6612684726715088,
"eval_runtime": 135.8609,
"eval_samples_per_second": 4.828,
"eval_wer": 0.7884371029224905,
"step": 2200
},
{
"epoch": 12.12,
"learning_rate": 0.00028885135135135135,
"loss": 0.1853,
"step": 2400
},
{
"epoch": 12.12,
"eval_loss": 0.6352970600128174,
"eval_runtime": 135.9654,
"eval_samples_per_second": 4.825,
"eval_wer": 0.736552308343922,
"step": 2400
},
{
"epoch": 13.13,
"learning_rate": 0.0002878378378378378,
"loss": 0.1826,
"step": 2600
},
{
"epoch": 13.13,
"eval_loss": 0.6177716851234436,
"eval_runtime": 136.1311,
"eval_samples_per_second": 4.819,
"eval_wer": 0.7238458280389666,
"step": 2600
},
{
"epoch": 14.14,
"learning_rate": 0.00028682432432432426,
"loss": 0.1627,
"step": 2800
},
{
"epoch": 14.14,
"eval_loss": 0.6629394888877869,
"eval_runtime": 135.7236,
"eval_samples_per_second": 4.833,
"eval_wer": 0.734011012282931,
"step": 2800
},
{
"epoch": 15.15,
"learning_rate": 0.0002858108108108108,
"loss": 0.1506,
"step": 3000
},
{
"epoch": 15.15,
"eval_loss": 0.6606569886207581,
"eval_runtime": 137.5748,
"eval_samples_per_second": 4.768,
"eval_wer": 0.7272342227869547,
"step": 3000
},
{
"epoch": 16.16,
"learning_rate": 0.0002847972972972973,
"loss": 0.1432,
"step": 3200
},
{
"epoch": 16.16,
"eval_loss": 0.6748045086860657,
"eval_runtime": 135.8657,
"eval_samples_per_second": 4.828,
"eval_wer": 0.7335874629394324,
"step": 3200
},
{
"epoch": 17.17,
"learning_rate": 0.00028378378378378377,
"loss": 0.1396,
"step": 3400
},
{
"epoch": 17.17,
"eval_loss": 0.6931908130645752,
"eval_runtime": 136.0012,
"eval_samples_per_second": 4.823,
"eval_wer": 0.7236340533672173,
"step": 3400
},
{
"epoch": 18.18,
"learning_rate": 0.00028277027027027025,
"loss": 0.1397,
"step": 3600
},
{
"epoch": 18.18,
"eval_loss": 0.6838018894195557,
"eval_runtime": 135.7614,
"eval_samples_per_second": 4.832,
"eval_wer": 0.7316814908936892,
"step": 3600
},
{
"epoch": 19.19,
"learning_rate": 0.00028175675675675674,
"loss": 0.1317,
"step": 3800
},
{
"epoch": 19.19,
"eval_loss": 0.689399242401123,
"eval_runtime": 136.2101,
"eval_samples_per_second": 4.816,
"eval_wer": 0.7242693773824651,
"step": 3800
},
{
"epoch": 20.2,
"learning_rate": 0.0002807432432432432,
"loss": 0.1225,
"step": 4000
},
{
"epoch": 20.2,
"eval_loss": 0.7114871144294739,
"eval_runtime": 135.7901,
"eval_samples_per_second": 4.831,
"eval_wer": 0.745446844557391,
"step": 4000
},
{
"epoch": 21.21,
"learning_rate": 0.0002797297297297297,
"loss": 0.121,
"step": 4200
},
{
"epoch": 21.21,
"eval_loss": 0.7714667916297913,
"eval_runtime": 144.4676,
"eval_samples_per_second": 4.541,
"eval_wer": 0.7439644218551461,
"step": 4200
},
{
"epoch": 22.22,
"learning_rate": 0.0002787162162162162,
"loss": 0.1214,
"step": 4400
},
{
"epoch": 22.22,
"eval_loss": 0.6892368197441101,
"eval_runtime": 141.5565,
"eval_samples_per_second": 4.634,
"eval_wer": 0.7246929267259635,
"step": 4400
},
{
"epoch": 23.23,
"learning_rate": 0.00027770270270270267,
"loss": 0.1201,
"step": 4600
},
{
"epoch": 23.23,
"eval_loss": 0.7176805734634399,
"eval_runtime": 136.4081,
"eval_samples_per_second": 4.809,
"eval_wer": 0.7329521389241846,
"step": 4600
},
{
"epoch": 24.24,
"learning_rate": 0.00027668918918918916,
"loss": 0.1144,
"step": 4800
},
{
"epoch": 24.24,
"eval_loss": 0.7144946455955505,
"eval_runtime": 135.6564,
"eval_samples_per_second": 4.836,
"eval_wer": 0.7143159678102499,
"step": 4800
},
{
"epoch": 25.25,
"learning_rate": 0.00027567567567567564,
"loss": 0.1087,
"step": 5000
},
{
"epoch": 25.25,
"eval_loss": 0.6824408769607544,
"eval_runtime": 146.0202,
"eval_samples_per_second": 4.493,
"eval_wer": 0.7551884794578568,
"step": 5000
},
{
"epoch": 26.26,
"learning_rate": 0.0002746621621621621,
"loss": 0.1088,
"step": 5200
},
{
"epoch": 26.26,
"eval_loss": 0.7299026846885681,
"eval_runtime": 136.6707,
"eval_samples_per_second": 4.8,
"eval_wer": 0.7293519695044473,
"step": 5200
},
{
"epoch": 27.27,
"learning_rate": 0.0002736486486486486,
"loss": 0.1033,
"step": 5400
},
{
"epoch": 27.27,
"eval_loss": 0.7187995910644531,
"eval_runtime": 135.6478,
"eval_samples_per_second": 4.836,
"eval_wer": 0.7187632359169843,
"step": 5400
},
{
"epoch": 28.28,
"learning_rate": 0.0002726351351351351,
"loss": 0.1035,
"step": 5600
},
{
"epoch": 28.28,
"eval_loss": 0.7574965953826904,
"eval_runtime": 135.5201,
"eval_samples_per_second": 4.841,
"eval_wer": 0.743117323168149,
"step": 5600
},
{
"epoch": 29.29,
"learning_rate": 0.0002716216216216216,
"loss": 0.1052,
"step": 5800
},
{
"epoch": 29.29,
"eval_loss": 0.7272396683692932,
"eval_runtime": 135.608,
"eval_samples_per_second": 4.837,
"eval_wer": 0.7181279119017365,
"step": 5800
},
{
"epoch": 30.3,
"learning_rate": 0.00027060810810810806,
"loss": 0.1074,
"step": 6000
},
{
"epoch": 30.3,
"eval_loss": 0.7088936567306519,
"eval_runtime": 135.3489,
"eval_samples_per_second": 4.847,
"eval_wer": 0.7011859381617959,
"step": 6000
},
{
"epoch": 31.31,
"learning_rate": 0.0002695945945945946,
"loss": 0.105,
"step": 6200
},
{
"epoch": 31.31,
"eval_loss": 0.7318005561828613,
"eval_runtime": 136.2308,
"eval_samples_per_second": 4.815,
"eval_wer": 0.7157983905124947,
"step": 6200
},
{
"epoch": 32.32,
"learning_rate": 0.0002685810810810811,
"loss": 0.0937,
"step": 6400
},
{
"epoch": 32.32,
"eval_loss": 0.743655264377594,
"eval_runtime": 135.8626,
"eval_samples_per_second": 4.828,
"eval_wer": 0.7115628970775095,
"step": 6400
},
{
"epoch": 33.33,
"learning_rate": 0.00026756756756756756,
"loss": 0.0976,
"step": 6600
},
{
"epoch": 33.33,
"eval_loss": 0.7406659126281738,
"eval_runtime": 136.2332,
"eval_samples_per_second": 4.815,
"eval_wer": 0.7257518000847099,
"step": 6600
},
{
"epoch": 34.34,
"learning_rate": 0.00026655405405405405,
"loss": 0.0961,
"step": 6800
},
{
"epoch": 34.34,
"eval_loss": 0.7474074959754944,
"eval_runtime": 136.361,
"eval_samples_per_second": 4.811,
"eval_wer": 0.729987293519695,
"step": 6800
},
{
"epoch": 35.35,
"learning_rate": 0.0002655405405405405,
"loss": 0.0922,
"step": 7000
},
{
"epoch": 35.35,
"eval_loss": 0.7413117289543152,
"eval_runtime": 137.8262,
"eval_samples_per_second": 4.76,
"eval_wer": 0.7399407030919102,
"step": 7000
},
{
"epoch": 36.36,
"learning_rate": 0.000264527027027027,
"loss": 0.0897,
"step": 7200
},
{
"epoch": 36.36,
"eval_loss": 0.7571277618408203,
"eval_runtime": 135.8962,
"eval_samples_per_second": 4.827,
"eval_wer": 0.7467174925878864,
"step": 7200
},
{
"epoch": 37.37,
"learning_rate": 0.0002635135135135135,
"loss": 0.0936,
"step": 7400
},
{
"epoch": 37.37,
"eval_loss": 0.7212100028991699,
"eval_runtime": 136.3693,
"eval_samples_per_second": 4.81,
"eval_wer": 0.7162219398559933,
"step": 7400
},
{
"epoch": 38.38,
"learning_rate": 0.0002625,
"loss": 0.0898,
"step": 7600
},
{
"epoch": 38.38,
"eval_loss": 0.751598060131073,
"eval_runtime": 138.668,
"eval_samples_per_second": 4.731,
"eval_wer": 0.7210927573062261,
"step": 7600
},
{
"epoch": 39.39,
"learning_rate": 0.00026148648648648647,
"loss": 0.0902,
"step": 7800
},
{
"epoch": 39.39,
"eval_loss": 0.7493733167648315,
"eval_runtime": 136.1591,
"eval_samples_per_second": 4.818,
"eval_wer": 0.7477763659466328,
"step": 7800
},
{
"epoch": 40.4,
"learning_rate": 0.00026047297297297295,
"loss": 0.0847,
"step": 8000
},
{
"epoch": 40.4,
"eval_loss": 0.6728424429893494,
"eval_runtime": 140.5502,
"eval_samples_per_second": 4.667,
"eval_wer": 0.7306226175349428,
"step": 8000
},
{
"epoch": 41.41,
"learning_rate": 0.00025945945945945944,
"loss": 0.0866,
"step": 8200
},
{
"epoch": 41.41,
"eval_loss": 0.749858558177948,
"eval_runtime": 146.7628,
"eval_samples_per_second": 4.47,
"eval_wer": 0.7151630664972469,
"step": 8200
},
{
"epoch": 42.42,
"learning_rate": 0.0002584459459459459,
"loss": 0.0809,
"step": 8400
},
{
"epoch": 42.42,
"eval_loss": 0.7739278078079224,
"eval_runtime": 136.5403,
"eval_samples_per_second": 4.804,
"eval_wer": 0.7429055484963998,
"step": 8400
},
{
"epoch": 43.43,
"learning_rate": 0.0002574324324324324,
"loss": 0.0847,
"step": 8600
},
{
"epoch": 43.43,
"eval_loss": 0.7759637236595154,
"eval_runtime": 136.7555,
"eval_samples_per_second": 4.797,
"eval_wer": 0.7244811520542143,
"step": 8600
},
{
"epoch": 44.44,
"learning_rate": 0.0002564189189189189,
"loss": 0.0852,
"step": 8800
},
{
"epoch": 44.44,
"eval_loss": 0.7829259634017944,
"eval_runtime": 139.6603,
"eval_samples_per_second": 4.697,
"eval_wer": 0.7227869546802203,
"step": 8800
},
{
"epoch": 45.45,
"learning_rate": 0.00025540540540540537,
"loss": 0.0802,
"step": 9000
},
{
"epoch": 45.45,
"eval_loss": 0.7056646347045898,
"eval_runtime": 135.8647,
"eval_samples_per_second": 4.828,
"eval_wer": 0.7100804743752647,
"step": 9000
},
{
"epoch": 46.46,
"learning_rate": 0.0002543918918918919,
"loss": 0.0794,
"step": 9200
},
{
"epoch": 46.46,
"eval_loss": 0.7538515329360962,
"eval_runtime": 140.8763,
"eval_samples_per_second": 4.657,
"eval_wer": 0.7098686997035154,
"step": 9200
},
{
"epoch": 47.47,
"learning_rate": 0.0002533783783783784,
"loss": 0.0827,
"step": 9400
},
{
"epoch": 47.47,
"eval_loss": 0.7439035773277283,
"eval_runtime": 143.0424,
"eval_samples_per_second": 4.586,
"eval_wer": 0.7151630664972469,
"step": 9400
},
{
"epoch": 48.48,
"learning_rate": 0.0002523648648648648,
"loss": 0.0803,
"step": 9600
},
{
"epoch": 48.48,
"eval_loss": 0.7053723335266113,
"eval_runtime": 143.445,
"eval_samples_per_second": 4.573,
"eval_wer": 0.7075391783142736,
"step": 9600
},
{
"epoch": 49.49,
"learning_rate": 0.0002513513513513513,
"loss": 0.0781,
"step": 9800
},
{
"epoch": 49.49,
"eval_loss": 0.8703842163085938,
"eval_runtime": 143.62,
"eval_samples_per_second": 4.568,
"eval_wer": 0.7630241423125794,
"step": 9800
},
{
"epoch": 50.5,
"learning_rate": 0.0002503378378378378,
"loss": 0.0766,
"step": 10000
},
{
"epoch": 50.5,
"eval_loss": 0.7902593612670898,
"eval_runtime": 139.0704,
"eval_samples_per_second": 4.717,
"eval_wer": 0.7130453197797544,
"step": 10000
},
{
"epoch": 51.51,
"learning_rate": 0.0002493243243243243,
"loss": 0.0771,
"step": 10200
},
{
"epoch": 51.51,
"eval_loss": 0.7181321978569031,
"eval_runtime": 138.4984,
"eval_samples_per_second": 4.737,
"eval_wer": 0.7149512918254977,
"step": 10200
},
{
"epoch": 52.52,
"learning_rate": 0.0002483108108108108,
"loss": 0.0713,
"step": 10400
},
{
"epoch": 52.52,
"eval_loss": 0.7941905856132507,
"eval_runtime": 137.9511,
"eval_samples_per_second": 4.755,
"eval_wer": 0.7164337145277425,
"step": 10400
},
{
"epoch": 53.53,
"learning_rate": 0.0002472972972972973,
"loss": 0.0761,
"step": 10600
},
{
"epoch": 53.53,
"eval_loss": 0.8347806334495544,
"eval_runtime": 137.6637,
"eval_samples_per_second": 4.765,
"eval_wer": 0.7100804743752647,
"step": 10600
},
{
"epoch": 54.54,
"learning_rate": 0.0002462837837837838,
"loss": 0.0721,
"step": 10800
},
{
"epoch": 54.54,
"eval_loss": 0.7271831035614014,
"eval_runtime": 137.7418,
"eval_samples_per_second": 4.763,
"eval_wer": 0.7024565861922915,
"step": 10800
},
{
"epoch": 55.55,
"learning_rate": 0.00024527027027027026,
"loss": 0.0684,
"step": 11000
},
{
"epoch": 55.55,
"eval_loss": 0.7921620011329651,
"eval_runtime": 137.9904,
"eval_samples_per_second": 4.754,
"eval_wer": 0.6977975434138077,
"step": 11000
},
{
"epoch": 56.56,
"learning_rate": 0.00024425675675675675,
"loss": 0.0733,
"step": 11200
},
{
"epoch": 56.56,
"eval_loss": 0.782407820224762,
"eval_runtime": 138.0874,
"eval_samples_per_second": 4.751,
"eval_wer": 0.7052096569250318,
"step": 11200
},
{
"epoch": 57.57,
"learning_rate": 0.00024324324324324323,
"loss": 0.0723,
"step": 11400
},
{
"epoch": 57.57,
"eval_loss": 0.7807161211967468,
"eval_runtime": 137.5671,
"eval_samples_per_second": 4.769,
"eval_wer": 0.6994917407878017,
"step": 11400
},
{
"epoch": 58.58,
"learning_rate": 0.00024222972972972971,
"loss": 0.0701,
"step": 11600
},
{
"epoch": 58.58,
"eval_loss": 0.7515387535095215,
"eval_runtime": 138.0585,
"eval_samples_per_second": 4.752,
"eval_wer": 0.7085980516730199,
"step": 11600
},
{
"epoch": 59.59,
"learning_rate": 0.0002412162162162162,
"loss": 0.0687,
"step": 11800
},
{
"epoch": 59.59,
"eval_loss": 0.7535402774810791,
"eval_runtime": 137.596,
"eval_samples_per_second": 4.768,
"eval_wer": 0.688267683185091,
"step": 11800
},
{
"epoch": 60.6,
"learning_rate": 0.00024020270270270268,
"loss": 0.0676,
"step": 12000
},
{
"epoch": 60.6,
"eval_loss": 0.7971649169921875,
"eval_runtime": 138.6186,
"eval_samples_per_second": 4.732,
"eval_wer": 0.7132570944515036,
"step": 12000
},
{
"epoch": 61.61,
"learning_rate": 0.00023918918918918917,
"loss": 0.0733,
"step": 12200
},
{
"epoch": 61.61,
"eval_loss": 0.7672501802444458,
"eval_runtime": 138.3057,
"eval_samples_per_second": 4.743,
"eval_wer": 0.711139347734011,
"step": 12200
},
{
"epoch": 62.62,
"learning_rate": 0.00023817567567567568,
"loss": 0.0661,
"step": 12400
},
{
"epoch": 62.62,
"eval_loss": 0.7474766373634338,
"eval_runtime": 138.3209,
"eval_samples_per_second": 4.743,
"eval_wer": 0.6975857687420585,
"step": 12400
},
{
"epoch": 63.63,
"learning_rate": 0.00023716216216216216,
"loss": 0.0666,
"step": 12600
},
{
"epoch": 63.63,
"eval_loss": 0.7444884181022644,
"eval_runtime": 137.4553,
"eval_samples_per_second": 4.772,
"eval_wer": 0.7083862770012707,
"step": 12600
},
{
"epoch": 64.64,
"learning_rate": 0.00023614864864864862,
"loss": 0.0712,
"step": 12800
},
{
"epoch": 64.64,
"eval_loss": 0.7816994190216064,
"eval_runtime": 138.1127,
"eval_samples_per_second": 4.75,
"eval_wer": 0.7210927573062261,
"step": 12800
},
{
"epoch": 65.65,
"learning_rate": 0.0002351351351351351,
"loss": 0.063,
"step": 13000
},
{
"epoch": 65.65,
"eval_loss": 0.8192810416221619,
"eval_runtime": 137.4083,
"eval_samples_per_second": 4.774,
"eval_wer": 0.7092333756882677,
"step": 13000
},
{
"epoch": 66.66,
"learning_rate": 0.00023412162162162159,
"loss": 0.0681,
"step": 13200
},
{
"epoch": 66.66,
"eval_loss": 0.7333322763442993,
"eval_runtime": 137.9838,
"eval_samples_per_second": 4.754,
"eval_wer": 0.698009318085557,
"step": 13200
},
{
"epoch": 67.68,
"learning_rate": 0.00023310810810810807,
"loss": 0.0642,
"step": 13400
},
{
"epoch": 67.68,
"eval_loss": 0.7417888045310974,
"eval_runtime": 137.6106,
"eval_samples_per_second": 4.767,
"eval_wer": 0.7083862770012707,
"step": 13400
},
{
"epoch": 68.69,
"learning_rate": 0.00023209459459459458,
"loss": 0.0622,
"step": 13600
},
{
"epoch": 68.69,
"eval_loss": 0.7969706654548645,
"eval_runtime": 137.6918,
"eval_samples_per_second": 4.764,
"eval_wer": 0.7329521389241846,
"step": 13600
},
{
"epoch": 69.7,
"learning_rate": 0.00023108108108108106,
"loss": 0.0639,
"step": 13800
},
{
"epoch": 69.7,
"eval_loss": 0.8013876080513,
"eval_runtime": 137.5846,
"eval_samples_per_second": 4.768,
"eval_wer": 0.6988564167725541,
"step": 13800
},
{
"epoch": 70.71,
"learning_rate": 0.00023006756756756755,
"loss": 0.065,
"step": 14000
},
{
"epoch": 70.71,
"eval_loss": 0.7792071104049683,
"eval_runtime": 137.6266,
"eval_samples_per_second": 4.767,
"eval_wer": 0.7043625582380347,
"step": 14000
},
{
"epoch": 71.72,
"learning_rate": 0.00022905405405405403,
"loss": 0.0608,
"step": 14200
},
{
"epoch": 71.72,
"eval_loss": 0.7951736450195312,
"eval_runtime": 138.4177,
"eval_samples_per_second": 4.739,
"eval_wer": 0.6944091486658196,
"step": 14200
},
{
"epoch": 72.73,
"learning_rate": 0.00022804054054054052,
"loss": 0.0557,
"step": 14400
},
{
"epoch": 72.73,
"eval_loss": 0.8266920447349548,
"eval_runtime": 138.5687,
"eval_samples_per_second": 4.734,
"eval_wer": 0.6977975434138077,
"step": 14400
},
{
"epoch": 73.74,
"learning_rate": 0.00022702702702702703,
"loss": 0.0592,
"step": 14600
},
{
"epoch": 73.74,
"eval_loss": 0.8056704998016357,
"eval_runtime": 137.1892,
"eval_samples_per_second": 4.782,
"eval_wer": 0.7075391783142736,
"step": 14600
},
{
"epoch": 74.75,
"learning_rate": 0.0002260135135135135,
"loss": 0.064,
"step": 14800
},
{
"epoch": 74.75,
"eval_loss": 0.815148115158081,
"eval_runtime": 137.9946,
"eval_samples_per_second": 4.754,
"eval_wer": 0.7009741634900466,
"step": 14800
},
{
"epoch": 75.76,
"learning_rate": 0.000225,
"loss": 0.0603,
"step": 15000
},
{
"epoch": 75.76,
"eval_loss": 0.7697699069976807,
"eval_runtime": 138.1754,
"eval_samples_per_second": 4.748,
"eval_wer": 0.7124099957645066,
"step": 15000
},
{
"epoch": 76.77,
"learning_rate": 0.00022398648648648645,
"loss": 0.0613,
"step": 15200
},
{
"epoch": 76.77,
"eval_loss": 0.7657320499420166,
"eval_runtime": 137.8551,
"eval_samples_per_second": 4.759,
"eval_wer": 0.7170690385429903,
"step": 15200
},
{
"epoch": 77.78,
"learning_rate": 0.00022297297297297293,
"loss": 0.0602,
"step": 15400
},
{
"epoch": 77.78,
"eval_loss": 0.7715324759483337,
"eval_runtime": 137.9821,
"eval_samples_per_second": 4.754,
"eval_wer": 0.716857263871241,
"step": 15400
},
{
"epoch": 78.79,
"learning_rate": 0.00022195945945945945,
"loss": 0.0597,
"step": 15600
},
{
"epoch": 78.79,
"eval_loss": 0.7833596467971802,
"eval_runtime": 137.7858,
"eval_samples_per_second": 4.761,
"eval_wer": 0.7132570944515036,
"step": 15600
},
{
"epoch": 79.8,
"learning_rate": 0.00022094594594594593,
"loss": 0.0585,
"step": 15800
},
{
"epoch": 79.8,
"eval_loss": 0.8398387432098389,
"eval_runtime": 137.7412,
"eval_samples_per_second": 4.763,
"eval_wer": 0.7088098263447692,
"step": 15800
},
{
"epoch": 80.81,
"learning_rate": 0.0002199324324324324,
"loss": 0.056,
"step": 16000
},
{
"epoch": 80.81,
"eval_loss": 0.8182487487792969,
"eval_runtime": 137.8628,
"eval_samples_per_second": 4.758,
"eval_wer": 0.7128335451080051,
"step": 16000
},
{
"epoch": 81.82,
"learning_rate": 0.0002189189189189189,
"loss": 0.06,
"step": 16200
},
{
"epoch": 81.82,
"eval_loss": 0.8023802638053894,
"eval_runtime": 137.792,
"eval_samples_per_second": 4.761,
"eval_wer": 0.6918678526048284,
"step": 16200
},
{
"epoch": 82.83,
"learning_rate": 0.00021790540540540538,
"loss": 0.0542,
"step": 16400
},
{
"epoch": 82.83,
"eval_loss": 0.7613797187805176,
"eval_runtime": 138.0605,
"eval_samples_per_second": 4.752,
"eval_wer": 0.6916560779330791,
"step": 16400
},
{
"epoch": 83.84,
"learning_rate": 0.0002168918918918919,
"loss": 0.0565,
"step": 16600
},
{
"epoch": 83.84,
"eval_loss": 0.7780935764312744,
"eval_runtime": 138.2761,
"eval_samples_per_second": 4.744,
"eval_wer": 0.7153748411689962,
"step": 16600
},
{
"epoch": 84.85,
"learning_rate": 0.00021587837837837838,
"loss": 0.0518,
"step": 16800
},
{
"epoch": 84.85,
"eval_loss": 0.8466140031814575,
"eval_runtime": 138.8619,
"eval_samples_per_second": 4.724,
"eval_wer": 0.7475645912748835,
"step": 16800
},
{
"epoch": 85.86,
"learning_rate": 0.00021486486486486486,
"loss": 0.0566,
"step": 17000
},
{
"epoch": 85.86,
"eval_loss": 0.8004465699195862,
"eval_runtime": 137.4262,
"eval_samples_per_second": 4.773,
"eval_wer": 0.7064803049555273,
"step": 17000
},
{
"epoch": 86.87,
"learning_rate": 0.00021385135135135134,
"loss": 0.0535,
"step": 17200
},
{
"epoch": 86.87,
"eval_loss": 0.8326082825660706,
"eval_runtime": 137.6615,
"eval_samples_per_second": 4.765,
"eval_wer": 0.7043625582380347,
"step": 17200
},
{
"epoch": 87.88,
"learning_rate": 0.0002128378378378378,
"loss": 0.0483,
"step": 17400
},
{
"epoch": 87.88,
"eval_loss": 0.7926554083824158,
"eval_runtime": 138.0063,
"eval_samples_per_second": 4.753,
"eval_wer": 0.7251164760694621,
"step": 17400
},
{
"epoch": 88.89,
"learning_rate": 0.00021182432432432428,
"loss": 0.0486,
"step": 17600
},
{
"epoch": 88.89,
"eval_loss": 0.7882806062698364,
"eval_runtime": 138.7006,
"eval_samples_per_second": 4.73,
"eval_wer": 0.6899618805590851,
"step": 17600
},
{
"epoch": 89.9,
"learning_rate": 0.0002108108108108108,
"loss": 0.0504,
"step": 17800
},
{
"epoch": 89.9,
"eval_loss": 0.7685484290122986,
"eval_runtime": 138.3804,
"eval_samples_per_second": 4.741,
"eval_wer": 0.6939855993223211,
"step": 17800
},
{
"epoch": 90.91,
"learning_rate": 0.00020979729729729728,
"loss": 0.056,
"step": 18000
},
{
"epoch": 90.91,
"eval_loss": 0.848064124584198,
"eval_runtime": 137.1191,
"eval_samples_per_second": 4.784,
"eval_wer": 0.7007623888182973,
"step": 18000
},
{
"epoch": 91.92,
"learning_rate": 0.00020878378378378376,
"loss": 0.049,
"step": 18200
},
{
"epoch": 91.92,
"eval_loss": 0.845516562461853,
"eval_runtime": 137.1172,
"eval_samples_per_second": 4.784,
"eval_wer": 0.7119864464210081,
"step": 18200
},
{
"epoch": 92.93,
"learning_rate": 0.00020777027027027025,
"loss": 0.0536,
"step": 18400
},
{
"epoch": 92.93,
"eval_loss": 0.7710561752319336,
"eval_runtime": 138.0433,
"eval_samples_per_second": 4.752,
"eval_wer": 0.6925031766200762,
"step": 18400
},
{
"epoch": 93.94,
"learning_rate": 0.00020675675675675673,
"loss": 0.0503,
"step": 18600
},
{
"epoch": 93.94,
"eval_loss": 0.8255069851875305,
"eval_runtime": 137.6117,
"eval_samples_per_second": 4.767,
"eval_wer": 0.7174925878864887,
"step": 18600
},
{
"epoch": 94.95,
"learning_rate": 0.00020574324324324324,
"loss": 0.0488,
"step": 18800
},
{
"epoch": 94.95,
"eval_loss": 0.8600437641143799,
"eval_runtime": 137.4326,
"eval_samples_per_second": 4.773,
"eval_wer": 0.7246929267259635,
"step": 18800
},
{
"epoch": 95.96,
"learning_rate": 0.00020472972972972972,
"loss": 0.0468,
"step": 19000
},
{
"epoch": 95.96,
"eval_loss": 0.7781614661216736,
"eval_runtime": 137.8454,
"eval_samples_per_second": 4.759,
"eval_wer": 0.7001270648030495,
"step": 19000
},
{
"epoch": 96.97,
"learning_rate": 0.0002037162162162162,
"loss": 0.0486,
"step": 19200
},
{
"epoch": 96.97,
"eval_loss": 0.7687584161758423,
"eval_runtime": 137.2673,
"eval_samples_per_second": 4.779,
"eval_wer": 0.7054214315967811,
"step": 19200
},
{
"epoch": 97.98,
"learning_rate": 0.0002027027027027027,
"loss": 0.0523,
"step": 19400
},
{
"epoch": 97.98,
"eval_loss": 0.8229833245277405,
"eval_runtime": 137.1013,
"eval_samples_per_second": 4.785,
"eval_wer": 0.7066920796272765,
"step": 19400
},
{
"epoch": 98.99,
"learning_rate": 0.00020168918918918915,
"loss": 0.0507,
"step": 19600
},
{
"epoch": 98.99,
"eval_loss": 0.761595606803894,
"eval_runtime": 137.3405,
"eval_samples_per_second": 4.776,
"eval_wer": 0.6910207539178315,
"step": 19600
},
{
"epoch": 100.0,
"learning_rate": 0.00020067567567567566,
"loss": 0.049,
"step": 19800
},
{
"epoch": 100.0,
"eval_loss": 0.8465907573699951,
"eval_runtime": 136.8552,
"eval_samples_per_second": 4.793,
"eval_wer": 0.704574332909784,
"step": 19800
},
{
"epoch": 101.01,
"learning_rate": 0.00019966216216216214,
"loss": 0.0502,
"step": 20000
},
{
"epoch": 101.01,
"eval_loss": 0.8005170226097107,
"eval_runtime": 137.3151,
"eval_samples_per_second": 4.777,
"eval_wer": 0.6925031766200762,
"step": 20000
},
{
"epoch": 102.02,
"learning_rate": 0.00019864864864864863,
"loss": 0.0443,
"step": 20200
},
{
"epoch": 102.02,
"eval_loss": 0.8749315142631531,
"eval_runtime": 137.9488,
"eval_samples_per_second": 4.755,
"eval_wer": 0.6927149512918255,
"step": 20200
},
{
"epoch": 103.03,
"learning_rate": 0.0001976351351351351,
"loss": 0.0486,
"step": 20400
},
{
"epoch": 103.03,
"eval_loss": 0.7846581339836121,
"eval_runtime": 136.7448,
"eval_samples_per_second": 4.797,
"eval_wer": 0.7124099957645066,
"step": 20400
},
{
"epoch": 104.04,
"learning_rate": 0.0001966216216216216,
"loss": 0.0455,
"step": 20600
},
{
"epoch": 104.04,
"eval_loss": 0.842466413974762,
"eval_runtime": 137.1975,
"eval_samples_per_second": 4.781,
"eval_wer": 0.7189750105887336,
"step": 20600
},
{
"epoch": 105.05,
"learning_rate": 0.00019560810810810808,
"loss": 0.0435,
"step": 20800
},
{
"epoch": 105.05,
"eval_loss": 0.8235080242156982,
"eval_runtime": 137.1509,
"eval_samples_per_second": 4.783,
"eval_wer": 0.6927149512918255,
"step": 20800
},
{
"epoch": 106.06,
"learning_rate": 0.0001945945945945946,
"loss": 0.0452,
"step": 21000
},
{
"epoch": 106.06,
"eval_loss": 0.7949621677398682,
"eval_runtime": 137.8819,
"eval_samples_per_second": 4.758,
"eval_wer": 0.6891147818720881,
"step": 21000
},
{
"epoch": 107.07,
"learning_rate": 0.00019358108108108107,
"loss": 0.0441,
"step": 21200
},
{
"epoch": 107.07,
"eval_loss": 0.8163775205612183,
"eval_runtime": 136.9828,
"eval_samples_per_second": 4.789,
"eval_wer": 0.6992799661160525,
"step": 21200
},
{
"epoch": 108.08,
"learning_rate": 0.00019256756756756756,
"loss": 0.0433,
"step": 21400
},
{
"epoch": 108.08,
"eval_loss": 0.9103622436523438,
"eval_runtime": 138.0294,
"eval_samples_per_second": 4.753,
"eval_wer": 0.7009741634900466,
"step": 21400
},
{
"epoch": 109.09,
"learning_rate": 0.00019155405405405404,
"loss": 0.0423,
"step": 21600
},
{
"epoch": 109.09,
"eval_loss": 0.8365850448608398,
"eval_runtime": 137.9595,
"eval_samples_per_second": 4.755,
"eval_wer": 0.6954680220245658,
"step": 21600
},
{
"epoch": 110.1,
"learning_rate": 0.0001905405405405405,
"loss": 0.0428,
"step": 21800
},
{
"epoch": 110.1,
"eval_loss": 0.9046308994293213,
"eval_runtime": 137.2986,
"eval_samples_per_second": 4.778,
"eval_wer": 0.6863617111393477,
"step": 21800
},
{
"epoch": 111.11,
"learning_rate": 0.00018952702702702704,
"loss": 0.0389,
"step": 22000
},
{
"epoch": 111.11,
"eval_loss": 0.8430789709091187,
"eval_runtime": 137.4909,
"eval_samples_per_second": 4.771,
"eval_wer": 0.6869970351545955,
"step": 22000
},
{
"epoch": 112.12,
"learning_rate": 0.0001885135135135135,
"loss": 0.0388,
"step": 22200
},
{
"epoch": 112.12,
"eval_loss": 0.8418474793434143,
"eval_runtime": 138.0347,
"eval_samples_per_second": 4.752,
"eval_wer": 0.6990681914443032,
"step": 22200
}
],
"max_steps": 59400,
"num_train_epochs": 300,
"total_flos": 3.071129167748675e+19,
"trial_name": null,
"trial_params": null
}