|
{ |
|
"best_metric": 0.5485906004905701, |
|
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-17/checkpoint-1358", |
|
"epoch": 117.0, |
|
"global_step": 1638, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 0.0, |
|
"loss": 38.4208, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 1.2145950864422201, |
|
"eval_loss": 41.80952453613281, |
|
"eval_per": 1.0056887444128404, |
|
"eval_runtime": 16.4211, |
|
"eval_samples_per_second": 33.006, |
|
"eval_steps_per_second": 4.141, |
|
"eval_wer": 1.0056887444128404, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 12.287281036376953, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.3942, |
|
"eval_samples_per_second": 33.06, |
|
"eval_steps_per_second": 4.148, |
|
"eval_wer": 1.0, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 4.809342861175537, |
|
"eval_per": 1.0, |
|
"eval_runtime": 17.8009, |
|
"eval_samples_per_second": 30.448, |
|
"eval_steps_per_second": 3.82, |
|
"eval_wer": 1.0, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.9737813472747803, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1587, |
|
"eval_samples_per_second": 33.542, |
|
"eval_steps_per_second": 4.208, |
|
"eval_wer": 1.0, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.6683900356292725, |
|
"eval_per": 1.0, |
|
"eval_runtime": 17.3608, |
|
"eval_samples_per_second": 31.22, |
|
"eval_steps_per_second": 3.917, |
|
"eval_wer": 1.0, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.5007262229919434, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.8377, |
|
"eval_samples_per_second": 32.19, |
|
"eval_steps_per_second": 4.039, |
|
"eval_wer": 1.0, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.3854148387908936, |
|
"eval_per": 1.0, |
|
"eval_runtime": 15.8896, |
|
"eval_samples_per_second": 34.11, |
|
"eval_steps_per_second": 4.28, |
|
"eval_wer": 1.0, |
|
"step": 98 |
|
}, |
|
{ |
|
"epoch": 7.14, |
|
"learning_rate": 3.853775853775854e-05, |
|
"loss": 11.8009, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.450645923614502, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.3597, |
|
"eval_samples_per_second": 33.13, |
|
"eval_steps_per_second": 4.157, |
|
"eval_wer": 1.0, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.178906202316284, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1702, |
|
"eval_samples_per_second": 33.519, |
|
"eval_steps_per_second": 4.205, |
|
"eval_wer": 1.0, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1274373531341553, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.9804, |
|
"eval_samples_per_second": 31.919, |
|
"eval_steps_per_second": 4.005, |
|
"eval_wer": 1.0, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1624248027801514, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.0626, |
|
"eval_samples_per_second": 33.743, |
|
"eval_steps_per_second": 4.233, |
|
"eval_wer": 1.0, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1065869331359863, |
|
"eval_per": 1.0, |
|
"eval_runtime": 15.7377, |
|
"eval_samples_per_second": 34.44, |
|
"eval_steps_per_second": 4.321, |
|
"eval_wer": 1.0, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0579798221588135, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1086, |
|
"eval_samples_per_second": 33.647, |
|
"eval_steps_per_second": 4.221, |
|
"eval_wer": 1.0, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0477194786071777, |
|
"eval_per": 1.0, |
|
"eval_runtime": 17.7392, |
|
"eval_samples_per_second": 30.554, |
|
"eval_steps_per_second": 3.833, |
|
"eval_wer": 1.0, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 3.6613756613756616e-05, |
|
"loss": 3.0395, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.051933526992798, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.5102, |
|
"eval_samples_per_second": 32.828, |
|
"eval_steps_per_second": 4.119, |
|
"eval_wer": 1.0, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0363881587982178, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.6774, |
|
"eval_samples_per_second": 32.499, |
|
"eval_steps_per_second": 4.077, |
|
"eval_wer": 1.0, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.015160083770752, |
|
"eval_per": 1.0, |
|
"eval_runtime": 17.0522, |
|
"eval_samples_per_second": 31.785, |
|
"eval_steps_per_second": 3.988, |
|
"eval_wer": 1.0, |
|
"step": 238 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0166876316070557, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1958, |
|
"eval_samples_per_second": 33.465, |
|
"eval_steps_per_second": 4.199, |
|
"eval_wer": 1.0, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0129683017730713, |
|
"eval_per": 1.0, |
|
"eval_runtime": 17.0594, |
|
"eval_samples_per_second": 31.771, |
|
"eval_steps_per_second": 3.986, |
|
"eval_wer": 1.0, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0103399753570557, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.6483, |
|
"eval_samples_per_second": 32.556, |
|
"eval_steps_per_second": 4.084, |
|
"eval_wer": 1.0, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9993834495544434, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1419, |
|
"eval_samples_per_second": 33.577, |
|
"eval_steps_per_second": 4.213, |
|
"eval_wer": 1.0, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 21.43, |
|
"learning_rate": 3.468975468975469e-05, |
|
"loss": 2.9424, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.999858856201172, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.4633, |
|
"eval_samples_per_second": 32.922, |
|
"eval_steps_per_second": 4.13, |
|
"eval_wer": 1.0, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.000885486602783, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.4157, |
|
"eval_samples_per_second": 33.017, |
|
"eval_steps_per_second": 4.142, |
|
"eval_wer": 1.0, |
|
"step": 322 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.002438545227051, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.3396, |
|
"eval_samples_per_second": 33.171, |
|
"eval_steps_per_second": 4.162, |
|
"eval_wer": 1.0, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.000091552734375, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.2524, |
|
"eval_samples_per_second": 33.349, |
|
"eval_steps_per_second": 4.184, |
|
"eval_wer": 1.0, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.989057779312134, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.9129, |
|
"eval_samples_per_second": 32.047, |
|
"eval_steps_per_second": 4.021, |
|
"eval_wer": 1.0, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.988072633743286, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.8979, |
|
"eval_samples_per_second": 32.075, |
|
"eval_steps_per_second": 4.024, |
|
"eval_wer": 1.0, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.97031569480896, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.5706, |
|
"eval_samples_per_second": 32.708, |
|
"eval_steps_per_second": 4.104, |
|
"eval_wer": 1.0, |
|
"step": 392 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 3.276575276575277e-05, |
|
"loss": 2.9154, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9531471729278564, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.0162, |
|
"eval_samples_per_second": 33.841, |
|
"eval_steps_per_second": 4.246, |
|
"eval_wer": 1.0, |
|
"step": 406 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.920755624771118, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.2922, |
|
"eval_samples_per_second": 33.267, |
|
"eval_steps_per_second": 4.174, |
|
"eval_wer": 1.0, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.898137331008911, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1037, |
|
"eval_samples_per_second": 33.657, |
|
"eval_steps_per_second": 4.223, |
|
"eval_wer": 1.0, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.8320581912994385, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1007, |
|
"eval_samples_per_second": 33.663, |
|
"eval_steps_per_second": 4.223, |
|
"eval_wer": 1.0, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.7583184242248535, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.3232, |
|
"eval_samples_per_second": 33.204, |
|
"eval_steps_per_second": 4.166, |
|
"eval_wer": 1.0, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_cer": 0.9616014558689718, |
|
"eval_loss": 2.6405322551727295, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.4064, |
|
"eval_samples_per_second": 33.036, |
|
"eval_steps_per_second": 4.145, |
|
"eval_wer": 1.0, |
|
"step": 476 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_cer": 0.8832029117379436, |
|
"eval_loss": 2.5071756839752197, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.3137, |
|
"eval_samples_per_second": 33.224, |
|
"eval_steps_per_second": 4.168, |
|
"eval_wer": 1.0, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 35.71, |
|
"learning_rate": 3.0841750841750846e-05, |
|
"loss": 2.7552, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_cer": 0.6144131028207461, |
|
"eval_loss": 2.1546847820281982, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.1444, |
|
"eval_samples_per_second": 33.572, |
|
"eval_steps_per_second": 4.212, |
|
"eval_wer": 1.0, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_cer": 0.49958143767060964, |
|
"eval_loss": 1.7564772367477417, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.6494, |
|
"eval_samples_per_second": 32.554, |
|
"eval_steps_per_second": 4.084, |
|
"eval_wer": 1.0, |
|
"step": 518 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_cer": 0.40651501364877163, |
|
"eval_loss": 1.460233211517334, |
|
"eval_per": 1.0, |
|
"eval_runtime": 16.6864, |
|
"eval_samples_per_second": 32.482, |
|
"eval_steps_per_second": 4.075, |
|
"eval_wer": 1.0, |
|
"step": 532 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_cer": 0.36578707916287534, |
|
"eval_loss": 1.2268937826156616, |
|
"eval_per": 0.9892320195042665, |
|
"eval_runtime": 16.8505, |
|
"eval_samples_per_second": 32.165, |
|
"eval_steps_per_second": 4.035, |
|
"eval_wer": 0.989638358390898, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.3204731574158326, |
|
"eval_loss": 1.0905884504318237, |
|
"eval_per": 0.8833807395367737, |
|
"eval_runtime": 16.8204, |
|
"eval_samples_per_second": 32.223, |
|
"eval_steps_per_second": 4.043, |
|
"eval_wer": 0.8880536367330354, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_cer": 0.26314831665150135, |
|
"eval_loss": 0.9941390752792358, |
|
"eval_per": 0.6603006907761073, |
|
"eval_runtime": 16.4361, |
|
"eval_samples_per_second": 32.976, |
|
"eval_steps_per_second": 4.137, |
|
"eval_wer": 0.6771637545713125, |
|
"step": 574 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_cer": 0.23221110100090991, |
|
"eval_loss": 0.9132717847824097, |
|
"eval_per": 0.5154408776919951, |
|
"eval_runtime": 16.9668, |
|
"eval_samples_per_second": 31.945, |
|
"eval_steps_per_second": 4.008, |
|
"eval_wer": 0.5422592442096709, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"learning_rate": 2.8917748917748916e-05, |
|
"loss": 1.4599, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_cer": 0.22413102820746134, |
|
"eval_loss": 0.8487069010734558, |
|
"eval_per": 0.48821617228768793, |
|
"eval_runtime": 16.6557, |
|
"eval_samples_per_second": 32.541, |
|
"eval_steps_per_second": 4.083, |
|
"eval_wer": 0.5142218610321008, |
|
"step": 602 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_cer": 0.22074613284804367, |
|
"eval_loss": 0.8211185336112976, |
|
"eval_per": 0.46261682242990654, |
|
"eval_runtime": 16.0355, |
|
"eval_samples_per_second": 33.8, |
|
"eval_steps_per_second": 4.241, |
|
"eval_wer": 0.48984152783421375, |
|
"step": 616 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_cer": 0.214049135577798, |
|
"eval_loss": 0.7671909332275391, |
|
"eval_per": 0.4518488419341731, |
|
"eval_runtime": 16.1929, |
|
"eval_samples_per_second": 33.471, |
|
"eval_steps_per_second": 4.199, |
|
"eval_wer": 0.48029256399837467, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_cer": 0.2092083712465878, |
|
"eval_loss": 0.7431579828262329, |
|
"eval_per": 0.44453474197480697, |
|
"eval_runtime": 16.359, |
|
"eval_samples_per_second": 33.132, |
|
"eval_steps_per_second": 4.157, |
|
"eval_wer": 0.4707436001625356, |
|
"step": 644 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_cer": 0.2059326660600546, |
|
"eval_loss": 0.7389556765556335, |
|
"eval_per": 0.42624949207639173, |
|
"eval_runtime": 16.6785, |
|
"eval_samples_per_second": 32.497, |
|
"eval_steps_per_second": 4.077, |
|
"eval_wer": 0.44920763917106865, |
|
"step": 658 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_cer": 0.2011282984531392, |
|
"eval_loss": 0.699397087097168, |
|
"eval_per": 0.41060544494108087, |
|
"eval_runtime": 16.5887, |
|
"eval_samples_per_second": 32.673, |
|
"eval_steps_per_second": 4.099, |
|
"eval_wer": 0.43478260869565216, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_cer": 0.19909008189262967, |
|
"eval_loss": 0.6998735070228577, |
|
"eval_per": 0.3998374644453474, |
|
"eval_runtime": 16.3728, |
|
"eval_samples_per_second": 33.104, |
|
"eval_steps_per_second": 4.153, |
|
"eval_wer": 0.4229987809833401, |
|
"step": 686 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 2.6993746993746993e-05, |
|
"loss": 0.7585, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.19588717015468607, |
|
"eval_loss": 0.6737520098686218, |
|
"eval_per": 0.38825680617635105, |
|
"eval_runtime": 16.7385, |
|
"eval_samples_per_second": 32.38, |
|
"eval_steps_per_second": 4.062, |
|
"eval_wer": 0.4122308004876067, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_cer": 0.19628753412192904, |
|
"eval_loss": 0.6696569919586182, |
|
"eval_per": 0.38581877285656235, |
|
"eval_runtime": 16.5913, |
|
"eval_samples_per_second": 32.668, |
|
"eval_steps_per_second": 4.099, |
|
"eval_wer": 0.4093864282811865, |
|
"step": 714 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_cer": 0.19963603275705186, |
|
"eval_loss": 0.6706883907318115, |
|
"eval_per": 0.39536773669240144, |
|
"eval_runtime": 18.473, |
|
"eval_samples_per_second": 29.34, |
|
"eval_steps_per_second": 3.681, |
|
"eval_wer": 0.41629418935392115, |
|
"step": 728 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_cer": 0.19417652411282985, |
|
"eval_loss": 0.6397454738616943, |
|
"eval_per": 0.38317757009345793, |
|
"eval_runtime": 16.3057, |
|
"eval_samples_per_second": 33.24, |
|
"eval_steps_per_second": 4.17, |
|
"eval_wer": 0.40308817553839904, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_cer": 0.19388535031847134, |
|
"eval_loss": 0.6293218731880188, |
|
"eval_per": 0.38358390898008937, |
|
"eval_runtime": 16.6245, |
|
"eval_samples_per_second": 32.603, |
|
"eval_steps_per_second": 4.09, |
|
"eval_wer": 0.4039008533116619, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_cer": 0.19457688808007279, |
|
"eval_loss": 0.6479354500770569, |
|
"eval_per": 0.3852092645266152, |
|
"eval_runtime": 17.0356, |
|
"eval_samples_per_second": 31.816, |
|
"eval_steps_per_second": 3.992, |
|
"eval_wer": 0.4026818366517676, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_cer": 0.19344858962693356, |
|
"eval_loss": 0.6307466626167297, |
|
"eval_per": 0.38216172287687933, |
|
"eval_runtime": 15.9943, |
|
"eval_samples_per_second": 33.887, |
|
"eval_steps_per_second": 4.252, |
|
"eval_wer": 0.39821210889882164, |
|
"step": 784 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_cer": 0.190828025477707, |
|
"eval_loss": 0.6166068911552429, |
|
"eval_per": 0.36733035351483134, |
|
"eval_runtime": 18.3763, |
|
"eval_samples_per_second": 29.495, |
|
"eval_steps_per_second": 3.7, |
|
"eval_wer": 0.3843965867533523, |
|
"step": 798 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"learning_rate": 2.506974506974507e-05, |
|
"loss": 0.5473, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_cer": 0.19064604185623293, |
|
"eval_loss": 0.6098698377609253, |
|
"eval_per": 0.3707842340511987, |
|
"eval_runtime": 17.7821, |
|
"eval_samples_per_second": 30.48, |
|
"eval_steps_per_second": 3.824, |
|
"eval_wer": 0.3860219422998781, |
|
"step": 812 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_cer": 0.19039126478616925, |
|
"eval_loss": 0.6007358431816101, |
|
"eval_per": 0.3730190979276717, |
|
"eval_runtime": 17.0728, |
|
"eval_samples_per_second": 31.746, |
|
"eval_steps_per_second": 3.983, |
|
"eval_wer": 0.386834620073141, |
|
"step": 826 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_cer": 0.19275705186533212, |
|
"eval_loss": 0.6191249489784241, |
|
"eval_per": 0.3744412840308818, |
|
"eval_runtime": 16.4977, |
|
"eval_samples_per_second": 32.853, |
|
"eval_steps_per_second": 4.122, |
|
"eval_wer": 0.3884599756196668, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_cer": 0.1891901728844404, |
|
"eval_loss": 0.6014622449874878, |
|
"eval_per": 0.3732222673709874, |
|
"eval_runtime": 16.6101, |
|
"eval_samples_per_second": 32.631, |
|
"eval_steps_per_second": 4.094, |
|
"eval_wer": 0.3884599756196668, |
|
"step": 854 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_cer": 0.19017288444040037, |
|
"eval_loss": 0.5964884757995605, |
|
"eval_per": 0.36875253961804144, |
|
"eval_runtime": 17.8493, |
|
"eval_samples_per_second": 30.365, |
|
"eval_steps_per_second": 3.81, |
|
"eval_wer": 0.3837870784234051, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_cer": 0.19042766151046406, |
|
"eval_loss": 0.5926450490951538, |
|
"eval_per": 0.3667208451848842, |
|
"eval_runtime": 17.884, |
|
"eval_samples_per_second": 30.306, |
|
"eval_steps_per_second": 3.802, |
|
"eval_wer": 0.38256806176351077, |
|
"step": 882 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_cer": 0.19210191082802547, |
|
"eval_loss": 0.6187658905982971, |
|
"eval_per": 0.376472978464039, |
|
"eval_runtime": 17.0859, |
|
"eval_samples_per_second": 31.722, |
|
"eval_steps_per_second": 3.98, |
|
"eval_wer": 0.39211702559934986, |
|
"step": 896 |
|
}, |
|
{ |
|
"epoch": 64.29, |
|
"learning_rate": 2.3145743145743147e-05, |
|
"loss": 0.443, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_cer": 0.1891537761601456, |
|
"eval_loss": 0.5834715366363525, |
|
"eval_per": 0.36895570906135716, |
|
"eval_runtime": 16.6058, |
|
"eval_samples_per_second": 32.639, |
|
"eval_steps_per_second": 4.095, |
|
"eval_wer": 0.3829744006501422, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_cer": 0.1902820746132848, |
|
"eval_loss": 0.5914222598075867, |
|
"eval_per": 0.3722064201544088, |
|
"eval_runtime": 17.2325, |
|
"eval_samples_per_second": 31.452, |
|
"eval_steps_per_second": 3.946, |
|
"eval_wer": 0.38703778951645673, |
|
"step": 924 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_cer": 0.1875523202911738, |
|
"eval_loss": 0.582801878452301, |
|
"eval_per": 0.36265745631856966, |
|
"eval_runtime": 16.3441, |
|
"eval_samples_per_second": 33.162, |
|
"eval_steps_per_second": 4.161, |
|
"eval_wer": 0.3778951645672491, |
|
"step": 938 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_cer": 0.1857324840764331, |
|
"eval_loss": 0.5744664072990417, |
|
"eval_per": 0.35757822023567654, |
|
"eval_runtime": 17.4764, |
|
"eval_samples_per_second": 31.013, |
|
"eval_steps_per_second": 3.891, |
|
"eval_wer": 0.3722064201544088, |
|
"step": 952 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_cer": 0.18817106460418562, |
|
"eval_loss": 0.5785911083221436, |
|
"eval_per": 0.3632669646485169, |
|
"eval_runtime": 16.8602, |
|
"eval_samples_per_second": 32.147, |
|
"eval_steps_per_second": 4.033, |
|
"eval_wer": 0.3795205201137749, |
|
"step": 966 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_cer": 0.1884258416742493, |
|
"eval_loss": 0.5868948698043823, |
|
"eval_per": 0.36042259244209673, |
|
"eval_runtime": 16.384, |
|
"eval_samples_per_second": 33.081, |
|
"eval_steps_per_second": 4.15, |
|
"eval_wer": 0.37505079236082894, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_cer": 0.18878980891719746, |
|
"eval_loss": 0.592288076877594, |
|
"eval_per": 0.3596099146688338, |
|
"eval_runtime": 16.4263, |
|
"eval_samples_per_second": 32.996, |
|
"eval_steps_per_second": 4.14, |
|
"eval_wer": 0.37525396180414466, |
|
"step": 994 |
|
}, |
|
{ |
|
"epoch": 71.43, |
|
"learning_rate": 2.1221741221741224e-05, |
|
"loss": 0.3564, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_cer": 0.18587807097361236, |
|
"eval_loss": 0.5706638097763062, |
|
"eval_per": 0.35778138967899226, |
|
"eval_runtime": 16.3727, |
|
"eval_samples_per_second": 33.104, |
|
"eval_steps_per_second": 4.153, |
|
"eval_wer": 0.37139374238114586, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_cer": 0.1856960873521383, |
|
"eval_loss": 0.5733203887939453, |
|
"eval_per": 0.35514018691588783, |
|
"eval_runtime": 16.1456, |
|
"eval_samples_per_second": 33.569, |
|
"eval_steps_per_second": 4.212, |
|
"eval_wer": 0.3699715562779358, |
|
"step": 1022 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_cer": 0.1854413102820746, |
|
"eval_loss": 0.5731407403945923, |
|
"eval_per": 0.35656237301909793, |
|
"eval_runtime": 16.2817, |
|
"eval_samples_per_second": 33.289, |
|
"eval_steps_per_second": 4.176, |
|
"eval_wer": 0.370581064607883, |
|
"step": 1036 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_cer": 0.18467697907188352, |
|
"eval_loss": 0.5643908381462097, |
|
"eval_per": 0.3531084924827306, |
|
"eval_runtime": 16.6661, |
|
"eval_samples_per_second": 32.521, |
|
"eval_steps_per_second": 4.08, |
|
"eval_wer": 0.3669240146281999, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_cer": 0.18522292993630574, |
|
"eval_loss": 0.5660921335220337, |
|
"eval_per": 0.3555465258025193, |
|
"eval_runtime": 16.5118, |
|
"eval_samples_per_second": 32.825, |
|
"eval_steps_per_second": 4.118, |
|
"eval_wer": 0.37017472572125154, |
|
"step": 1064 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_cer": 0.18474977252047317, |
|
"eval_loss": 0.5705360174179077, |
|
"eval_per": 0.3512799674928891, |
|
"eval_runtime": 17.1186, |
|
"eval_samples_per_second": 31.661, |
|
"eval_steps_per_second": 3.972, |
|
"eval_wer": 0.3675335229581471, |
|
"step": 1078 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_cer": 0.1835122838944495, |
|
"eval_loss": 0.5630640983581543, |
|
"eval_per": 0.35270215359609913, |
|
"eval_runtime": 17.2728, |
|
"eval_samples_per_second": 31.379, |
|
"eval_steps_per_second": 3.937, |
|
"eval_wer": 0.3671271840715156, |
|
"step": 1092 |
|
}, |
|
{ |
|
"epoch": 78.57, |
|
"learning_rate": 1.92977392977393e-05, |
|
"loss": 0.3456, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_cer": 0.18311191992720655, |
|
"eval_loss": 0.5674863457679749, |
|
"eval_per": 0.35026412027631043, |
|
"eval_runtime": 16.31, |
|
"eval_samples_per_second": 33.231, |
|
"eval_steps_per_second": 4.169, |
|
"eval_wer": 0.3650954896383584, |
|
"step": 1106 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_cer": 0.1846041856232939, |
|
"eval_loss": 0.5696778297424316, |
|
"eval_per": 0.35067045916294187, |
|
"eval_runtime": 16.3755, |
|
"eval_samples_per_second": 33.098, |
|
"eval_steps_per_second": 4.153, |
|
"eval_wer": 0.3644859813084112, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_cer": 0.18409463148316652, |
|
"eval_loss": 0.5643677711486816, |
|
"eval_per": 0.34924827305973183, |
|
"eval_runtime": 16.3983, |
|
"eval_samples_per_second": 33.052, |
|
"eval_steps_per_second": 4.147, |
|
"eval_wer": 0.36306379520520116, |
|
"step": 1134 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_cer": 0.1843494085532302, |
|
"eval_loss": 0.56571364402771, |
|
"eval_per": 0.34802925639983745, |
|
"eval_runtime": 16.5291, |
|
"eval_samples_per_second": 32.791, |
|
"eval_steps_per_second": 4.114, |
|
"eval_wer": 0.36265745631856966, |
|
"step": 1148 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_cer": 0.1875523202911738, |
|
"eval_loss": 0.5830783247947693, |
|
"eval_per": 0.3522958147094677, |
|
"eval_runtime": 16.4238, |
|
"eval_samples_per_second": 33.001, |
|
"eval_steps_per_second": 4.14, |
|
"eval_wer": 0.36793986184477856, |
|
"step": 1162 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_cer": 0.1861692447679709, |
|
"eval_loss": 0.5823647975921631, |
|
"eval_per": 0.3522958147094677, |
|
"eval_runtime": 17.5122, |
|
"eval_samples_per_second": 30.95, |
|
"eval_steps_per_second": 3.883, |
|
"eval_wer": 0.3659081674116213, |
|
"step": 1176 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_cer": 0.18333030027297542, |
|
"eval_loss": 0.5567490458488464, |
|
"eval_per": 0.3508736286062576, |
|
"eval_runtime": 16.4517, |
|
"eval_samples_per_second": 32.945, |
|
"eval_steps_per_second": 4.133, |
|
"eval_wer": 0.36529865908167414, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 85.71, |
|
"learning_rate": 1.7373737373737375e-05, |
|
"loss": 0.3073, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_cer": 0.1851501364877161, |
|
"eval_loss": 0.5755050778388977, |
|
"eval_per": 0.35067045916294187, |
|
"eval_runtime": 17.6602, |
|
"eval_samples_per_second": 30.691, |
|
"eval_steps_per_second": 3.85, |
|
"eval_wer": 0.36489232019504264, |
|
"step": 1204 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_cer": 0.18289353958143767, |
|
"eval_loss": 0.5590367913246155, |
|
"eval_per": 0.3449817147501016, |
|
"eval_runtime": 16.7556, |
|
"eval_samples_per_second": 32.347, |
|
"eval_steps_per_second": 4.058, |
|
"eval_wer": 0.3585940674522552, |
|
"step": 1218 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_cer": 0.18347588717015467, |
|
"eval_loss": 0.5662943720817566, |
|
"eval_per": 0.34802925639983745, |
|
"eval_runtime": 16.6011, |
|
"eval_samples_per_second": 32.649, |
|
"eval_steps_per_second": 4.096, |
|
"eval_wer": 0.3610321007720439, |
|
"step": 1232 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_cer": 0.18507734303912649, |
|
"eval_loss": 0.5733785629272461, |
|
"eval_per": 0.3468102397399431, |
|
"eval_runtime": 16.1986, |
|
"eval_samples_per_second": 33.46, |
|
"eval_steps_per_second": 4.198, |
|
"eval_wer": 0.3618447785453068, |
|
"step": 1246 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_cer": 0.18303912647861692, |
|
"eval_loss": 0.5656831860542297, |
|
"eval_per": 0.34579439252336447, |
|
"eval_runtime": 16.3772, |
|
"eval_samples_per_second": 33.095, |
|
"eval_steps_per_second": 4.152, |
|
"eval_wer": 0.36021942299878096, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_cer": 0.18278434940855323, |
|
"eval_loss": 0.5650802850723267, |
|
"eval_per": 0.3441690369768387, |
|
"eval_runtime": 17.4779, |
|
"eval_samples_per_second": 31.011, |
|
"eval_steps_per_second": 3.891, |
|
"eval_wer": 0.35778138967899226, |
|
"step": 1274 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_cer": 0.18202001819836214, |
|
"eval_loss": 0.5608470439910889, |
|
"eval_per": 0.3415278342137342, |
|
"eval_runtime": 16.5014, |
|
"eval_samples_per_second": 32.846, |
|
"eval_steps_per_second": 4.121, |
|
"eval_wer": 0.35574969524583505, |
|
"step": 1288 |
|
}, |
|
{ |
|
"epoch": 92.86, |
|
"learning_rate": 1.544973544973545e-05, |
|
"loss": 0.2836, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_cer": 0.18067333939945404, |
|
"eval_loss": 0.5504541993141174, |
|
"eval_per": 0.3388866314506298, |
|
"eval_runtime": 16.701, |
|
"eval_samples_per_second": 32.453, |
|
"eval_steps_per_second": 4.072, |
|
"eval_wer": 0.3524989841527834, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_cer": 0.17979981801637854, |
|
"eval_loss": 0.5494620203971863, |
|
"eval_per": 0.33746444534741976, |
|
"eval_runtime": 17.2521, |
|
"eval_samples_per_second": 31.416, |
|
"eval_steps_per_second": 3.942, |
|
"eval_wer": 0.3500609508329947, |
|
"step": 1316 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_cer": 0.1816196542311192, |
|
"eval_loss": 0.5693331360816956, |
|
"eval_per": 0.34315318976026005, |
|
"eval_runtime": 16.3033, |
|
"eval_samples_per_second": 33.245, |
|
"eval_steps_per_second": 4.171, |
|
"eval_wer": 0.35574969524583505, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_cer": 0.1822020018198362, |
|
"eval_loss": 0.5638025999069214, |
|
"eval_per": 0.34173100365705, |
|
"eval_runtime": 16.8945, |
|
"eval_samples_per_second": 32.081, |
|
"eval_steps_per_second": 4.025, |
|
"eval_wer": 0.3563592035757822, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_cer": 0.17969062784349407, |
|
"eval_loss": 0.5485906004905701, |
|
"eval_per": 0.3386834620073141, |
|
"eval_runtime": 16.6823, |
|
"eval_samples_per_second": 32.489, |
|
"eval_steps_per_second": 4.076, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1358 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_cer": 0.18096451319381257, |
|
"eval_loss": 0.5618489980697632, |
|
"eval_per": 0.3415278342137342, |
|
"eval_runtime": 16.6547, |
|
"eval_samples_per_second": 32.543, |
|
"eval_steps_per_second": 4.083, |
|
"eval_wer": 0.3545306785859407, |
|
"step": 1372 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_cer": 0.1799818016378526, |
|
"eval_loss": 0.5637105703353882, |
|
"eval_per": 0.33990247866720846, |
|
"eval_runtime": 16.8199, |
|
"eval_samples_per_second": 32.224, |
|
"eval_steps_per_second": 4.043, |
|
"eval_wer": 0.3514831369362048, |
|
"step": 1386 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"learning_rate": 1.3525733525733527e-05, |
|
"loss": 0.2502, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_cer": 0.1810373066424022, |
|
"eval_loss": 0.5658114552497864, |
|
"eval_per": 0.3437626980902072, |
|
"eval_runtime": 16.859, |
|
"eval_samples_per_second": 32.149, |
|
"eval_steps_per_second": 4.033, |
|
"eval_wer": 0.3555465258025193, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 101.0, |
|
"eval_cer": 0.17954504094631482, |
|
"eval_loss": 0.552661657333374, |
|
"eval_per": 0.3411214953271028, |
|
"eval_runtime": 17.0552, |
|
"eval_samples_per_second": 31.779, |
|
"eval_steps_per_second": 3.987, |
|
"eval_wer": 0.3524989841527834, |
|
"step": 1414 |
|
}, |
|
{ |
|
"epoch": 102.0, |
|
"eval_cer": 0.18067333939945404, |
|
"eval_loss": 0.5701059699058533, |
|
"eval_per": 0.343965867533523, |
|
"eval_runtime": 17.649, |
|
"eval_samples_per_second": 30.71, |
|
"eval_steps_per_second": 3.853, |
|
"eval_wer": 0.3561560341324665, |
|
"step": 1428 |
|
}, |
|
{ |
|
"epoch": 103.0, |
|
"eval_cer": 0.17936305732484076, |
|
"eval_loss": 0.554296612739563, |
|
"eval_per": 0.3388866314506298, |
|
"eval_runtime": 16.2178, |
|
"eval_samples_per_second": 33.42, |
|
"eval_steps_per_second": 4.193, |
|
"eval_wer": 0.34965461194636327, |
|
"step": 1442 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_cer": 0.18034576888080073, |
|
"eval_loss": 0.5659683346748352, |
|
"eval_per": 0.33990247866720846, |
|
"eval_runtime": 16.8247, |
|
"eval_samples_per_second": 32.214, |
|
"eval_steps_per_second": 4.042, |
|
"eval_wer": 0.3508736286062576, |
|
"step": 1456 |
|
}, |
|
{ |
|
"epoch": 105.0, |
|
"eval_cer": 0.17950864422202, |
|
"eval_loss": 0.5542871952056885, |
|
"eval_per": 0.33990247866720846, |
|
"eval_runtime": 16.8641, |
|
"eval_samples_per_second": 32.139, |
|
"eval_steps_per_second": 4.032, |
|
"eval_wer": 0.3500609508329947, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 106.0, |
|
"eval_cer": 0.181656050955414, |
|
"eval_loss": 0.5742031931877136, |
|
"eval_per": 0.34315318976026005, |
|
"eval_runtime": 16.2772, |
|
"eval_samples_per_second": 33.298, |
|
"eval_steps_per_second": 4.178, |
|
"eval_wer": 0.3547338480292564, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 107.0, |
|
"eval_cer": 0.178926296633303, |
|
"eval_loss": 0.5526788830757141, |
|
"eval_per": 0.33502641202763106, |
|
"eval_runtime": 16.3123, |
|
"eval_samples_per_second": 33.227, |
|
"eval_steps_per_second": 4.169, |
|
"eval_wer": 0.34538805363673303, |
|
"step": 1498 |
|
}, |
|
{ |
|
"epoch": 107.14, |
|
"learning_rate": 1.1601731601731604e-05, |
|
"loss": 0.2368, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 108.0, |
|
"eval_cer": 0.178926296633303, |
|
"eval_loss": 0.5576502084732056, |
|
"eval_per": 0.3378707842340512, |
|
"eval_runtime": 16.2769, |
|
"eval_samples_per_second": 33.299, |
|
"eval_steps_per_second": 4.178, |
|
"eval_wer": 0.34965461194636327, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 109.0, |
|
"eval_cer": 0.1788898999090082, |
|
"eval_loss": 0.5539444088935852, |
|
"eval_per": 0.3356359203575782, |
|
"eval_runtime": 17.6723, |
|
"eval_samples_per_second": 30.669, |
|
"eval_steps_per_second": 3.848, |
|
"eval_wer": 0.3451848841934173, |
|
"step": 1526 |
|
}, |
|
{ |
|
"epoch": 110.0, |
|
"eval_cer": 0.18020018198362148, |
|
"eval_loss": 0.5699580311775208, |
|
"eval_per": 0.34173100365705, |
|
"eval_runtime": 16.5072, |
|
"eval_samples_per_second": 32.834, |
|
"eval_steps_per_second": 4.119, |
|
"eval_wer": 0.35168630637952053, |
|
"step": 1540 |
|
}, |
|
{ |
|
"epoch": 111.0, |
|
"eval_cer": 0.17939945404913557, |
|
"eval_loss": 0.5626676678657532, |
|
"eval_per": 0.33969930922389274, |
|
"eval_runtime": 16.5149, |
|
"eval_samples_per_second": 32.819, |
|
"eval_steps_per_second": 4.117, |
|
"eval_wer": 0.3500609508329947, |
|
"step": 1554 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_cer": 0.17965423111919926, |
|
"eval_loss": 0.5622020363807678, |
|
"eval_per": 0.3405119869971556, |
|
"eval_runtime": 18.514, |
|
"eval_samples_per_second": 29.275, |
|
"eval_steps_per_second": 3.673, |
|
"eval_wer": 0.34965461194636327, |
|
"step": 1568 |
|
}, |
|
{ |
|
"epoch": 113.0, |
|
"eval_cer": 0.18005459508644223, |
|
"eval_loss": 0.570824146270752, |
|
"eval_per": 0.3403088175538399, |
|
"eval_runtime": 16.7958, |
|
"eval_samples_per_second": 32.27, |
|
"eval_steps_per_second": 4.049, |
|
"eval_wer": 0.34945144250304755, |
|
"step": 1582 |
|
}, |
|
{ |
|
"epoch": 114.0, |
|
"eval_cer": 0.18045495905368517, |
|
"eval_loss": 0.5732950568199158, |
|
"eval_per": 0.3401056481105242, |
|
"eval_runtime": 17.5602, |
|
"eval_samples_per_second": 30.865, |
|
"eval_steps_per_second": 3.872, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1596 |
|
}, |
|
{ |
|
"epoch": 114.29, |
|
"learning_rate": 9.677729677729679e-06, |
|
"loss": 0.2288, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 115.0, |
|
"eval_cer": 0.17950864422202, |
|
"eval_loss": 0.5614627599716187, |
|
"eval_per": 0.3386834620073141, |
|
"eval_runtime": 18.0091, |
|
"eval_samples_per_second": 30.096, |
|
"eval_steps_per_second": 3.776, |
|
"eval_wer": 0.34863876472978467, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 116.0, |
|
"eval_cer": 0.1808553230209281, |
|
"eval_loss": 0.5741183757781982, |
|
"eval_per": 0.33969930922389274, |
|
"eval_runtime": 16.588, |
|
"eval_samples_per_second": 32.674, |
|
"eval_steps_per_second": 4.099, |
|
"eval_wer": 0.34965461194636327, |
|
"step": 1624 |
|
}, |
|
{ |
|
"epoch": 117.0, |
|
"eval_cer": 0.17958143767060963, |
|
"eval_loss": 0.5609710812568665, |
|
"eval_per": 0.33726127590410404, |
|
"eval_runtime": 16.4333, |
|
"eval_samples_per_second": 32.982, |
|
"eval_steps_per_second": 4.138, |
|
"eval_wer": 0.3459975619666802, |
|
"step": 1638 |
|
}, |
|
{ |
|
"epoch": 117.0, |
|
"step": 1638, |
|
"total_flos": 1.462030946643386e+19, |
|
"train_loss": 1.771814914558979, |
|
"train_runtime": 12938.9921, |
|
"train_samples_per_second": 5.194, |
|
"train_steps_per_second": 0.162 |
|
} |
|
], |
|
"max_steps": 2100, |
|
"num_train_epochs": 150, |
|
"total_flos": 1.462030946643386e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|