|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 60.0, |
|
"global_step": 7440, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.81, |
|
"learning_rate": 3.3333333333333335e-05, |
|
"loss": 12.2551, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"eval_loss": 4.356050968170166, |
|
"eval_runtime": 197.2044, |
|
"eval_samples_per_second": 9.351, |
|
"eval_wer": 1.0, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.61, |
|
"learning_rate": 6.666666666666667e-05, |
|
"loss": 3.2085, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.61, |
|
"eval_loss": 2.925891876220703, |
|
"eval_runtime": 199.5724, |
|
"eval_samples_per_second": 9.24, |
|
"eval_wer": 1.0, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.42, |
|
"learning_rate": 0.0001, |
|
"loss": 2.8642, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.42, |
|
"eval_loss": 2.8566176891326904, |
|
"eval_runtime": 201.2361, |
|
"eval_samples_per_second": 9.163, |
|
"eval_wer": 1.0, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.23, |
|
"learning_rate": 9.859943977591037e-05, |
|
"loss": 2.7372, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.23, |
|
"eval_loss": 2.3264265060424805, |
|
"eval_runtime": 202.5449, |
|
"eval_samples_per_second": 9.104, |
|
"eval_wer": 1.0, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"learning_rate": 9.719887955182073e-05, |
|
"loss": 1.4523, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"eval_loss": 0.6223726868629456, |
|
"eval_runtime": 203.3756, |
|
"eval_samples_per_second": 9.067, |
|
"eval_wer": 0.7100503449561812, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.84, |
|
"learning_rate": 9.579831932773111e-05, |
|
"loss": 0.7072, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.84, |
|
"eval_loss": 0.4705396890640259, |
|
"eval_runtime": 205.0375, |
|
"eval_samples_per_second": 8.993, |
|
"eval_wer": 0.5925787805332836, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 5.65, |
|
"learning_rate": 9.439775910364146e-05, |
|
"loss": 0.5552, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 5.65, |
|
"eval_loss": 0.39274999499320984, |
|
"eval_runtime": 205.4744, |
|
"eval_samples_per_second": 8.974, |
|
"eval_wer": 0.536826403132575, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 6.45, |
|
"learning_rate": 9.299719887955183e-05, |
|
"loss": 0.4751, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 6.45, |
|
"eval_loss": 0.36413395404815674, |
|
"eval_runtime": 206.0611, |
|
"eval_samples_per_second": 8.949, |
|
"eval_wer": 0.5096960656349059, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 7.26, |
|
"learning_rate": 9.159663865546218e-05, |
|
"loss": 0.4116, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 7.26, |
|
"eval_loss": 0.34078019857406616, |
|
"eval_runtime": 206.851, |
|
"eval_samples_per_second": 8.915, |
|
"eval_wer": 0.4906768599664367, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 8.06, |
|
"learning_rate": 9.019607843137255e-05, |
|
"loss": 0.3737, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 8.06, |
|
"eval_loss": 0.3288322687149048, |
|
"eval_runtime": 207.383, |
|
"eval_samples_per_second": 8.892, |
|
"eval_wer": 0.4697930262912549, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 8.87, |
|
"learning_rate": 8.879551820728292e-05, |
|
"loss": 0.338, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 8.87, |
|
"eval_loss": 0.3296125531196594, |
|
"eval_runtime": 207.5205, |
|
"eval_samples_per_second": 8.886, |
|
"eval_wer": 0.4619615886630617, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 9.68, |
|
"learning_rate": 8.739495798319329e-05, |
|
"loss": 0.3154, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 9.68, |
|
"eval_loss": 0.34391966462135315, |
|
"eval_runtime": 207.9354, |
|
"eval_samples_per_second": 8.868, |
|
"eval_wer": 0.4543166138355398, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 10.48, |
|
"learning_rate": 8.599439775910365e-05, |
|
"loss": 0.3054, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 10.48, |
|
"eval_loss": 0.3120010197162628, |
|
"eval_runtime": 206.6673, |
|
"eval_samples_per_second": 8.923, |
|
"eval_wer": 0.44173037479022936, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 11.29, |
|
"learning_rate": 8.4593837535014e-05, |
|
"loss": 0.2766, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 11.29, |
|
"eval_loss": 0.3251303434371948, |
|
"eval_runtime": 208.2654, |
|
"eval_samples_per_second": 8.854, |
|
"eval_wer": 0.439026664180496, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 12.1, |
|
"learning_rate": 8.319327731092437e-05, |
|
"loss": 0.2743, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 12.1, |
|
"eval_loss": 0.31674692034721375, |
|
"eval_runtime": 207.1288, |
|
"eval_samples_per_second": 8.903, |
|
"eval_wer": 0.43361924296102927, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 12.9, |
|
"learning_rate": 8.179271708683474e-05, |
|
"loss": 0.2615, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 12.9, |
|
"eval_loss": 0.31189170479774475, |
|
"eval_runtime": 206.6256, |
|
"eval_samples_per_second": 8.924, |
|
"eval_wer": 0.43492448256572813, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 13.71, |
|
"learning_rate": 8.039215686274511e-05, |
|
"loss": 0.2349, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 13.71, |
|
"eval_loss": 0.3296045660972595, |
|
"eval_runtime": 208.4817, |
|
"eval_samples_per_second": 8.845, |
|
"eval_wer": 0.42988998694760394, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 14.52, |
|
"learning_rate": 7.899159663865546e-05, |
|
"loss": 0.228, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 14.52, |
|
"eval_loss": 0.30033424496650696, |
|
"eval_runtime": 207.6073, |
|
"eval_samples_per_second": 8.882, |
|
"eval_wer": 0.4192616073093418, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 15.32, |
|
"learning_rate": 7.759103641456583e-05, |
|
"loss": 0.2243, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 15.32, |
|
"eval_loss": 0.3134298026561737, |
|
"eval_runtime": 207.5471, |
|
"eval_samples_per_second": 8.885, |
|
"eval_wer": 0.4184225247063211, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 16.13, |
|
"learning_rate": 7.619047619047618e-05, |
|
"loss": 0.2078, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 16.13, |
|
"eval_loss": 0.3405207097530365, |
|
"eval_runtime": 208.3189, |
|
"eval_samples_per_second": 8.852, |
|
"eval_wer": 0.4215923923177326, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 16.94, |
|
"learning_rate": 7.478991596638657e-05, |
|
"loss": 0.2127, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 16.94, |
|
"eval_loss": 0.31670939922332764, |
|
"eval_runtime": 207.0917, |
|
"eval_samples_per_second": 8.904, |
|
"eval_wer": 0.4139474174902107, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 17.74, |
|
"learning_rate": 7.338935574229692e-05, |
|
"loss": 0.2032, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 17.74, |
|
"eval_loss": 0.30317744612693787, |
|
"eval_runtime": 207.7221, |
|
"eval_samples_per_second": 8.877, |
|
"eval_wer": 0.4090993846727578, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 18.55, |
|
"learning_rate": 7.198879551820729e-05, |
|
"loss": 0.1853, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 18.55, |
|
"eval_loss": 0.3155224025249481, |
|
"eval_runtime": 207.5316, |
|
"eval_samples_per_second": 8.885, |
|
"eval_wer": 0.40471750885698304, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 19.35, |
|
"learning_rate": 7.058823529411765e-05, |
|
"loss": 0.1844, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 19.35, |
|
"eval_loss": 0.3215440511703491, |
|
"eval_runtime": 207.3486, |
|
"eval_samples_per_second": 8.893, |
|
"eval_wer": 0.4049972030579899, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 20.16, |
|
"learning_rate": 6.918767507002801e-05, |
|
"loss": 0.1871, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 20.16, |
|
"eval_loss": 0.30251652002334595, |
|
"eval_runtime": 207.2199, |
|
"eval_samples_per_second": 8.899, |
|
"eval_wer": 0.3992168562371807, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 20.97, |
|
"learning_rate": 6.778711484593838e-05, |
|
"loss": 0.1896, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 20.97, |
|
"eval_loss": 0.3048883080482483, |
|
"eval_runtime": 207.9453, |
|
"eval_samples_per_second": 8.868, |
|
"eval_wer": 0.39996270743986573, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 21.77, |
|
"learning_rate": 6.638655462184874e-05, |
|
"loss": 0.1775, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 21.77, |
|
"eval_loss": 0.32283803820610046, |
|
"eval_runtime": 209.0912, |
|
"eval_samples_per_second": 8.819, |
|
"eval_wer": 0.40564982286033935, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 22.58, |
|
"learning_rate": 6.498599439775911e-05, |
|
"loss": 0.1667, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 22.58, |
|
"eval_loss": 0.31883877515792847, |
|
"eval_runtime": 207.5813, |
|
"eval_samples_per_second": 8.883, |
|
"eval_wer": 0.4055565914600037, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 23.39, |
|
"learning_rate": 6.358543417366946e-05, |
|
"loss": 0.1714, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 23.39, |
|
"eval_loss": 0.32032692432403564, |
|
"eval_runtime": 208.3503, |
|
"eval_samples_per_second": 8.85, |
|
"eval_wer": 0.3992168562371807, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 24.19, |
|
"learning_rate": 6.218487394957983e-05, |
|
"loss": 0.1692, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 24.19, |
|
"eval_loss": 0.33072519302368164, |
|
"eval_runtime": 208.6398, |
|
"eval_samples_per_second": 8.838, |
|
"eval_wer": 0.40369196345329106, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 6.078431372549019e-05, |
|
"loss": 0.1759, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_loss": 0.3215318024158478, |
|
"eval_runtime": 207.9891, |
|
"eval_samples_per_second": 8.866, |
|
"eval_wer": 0.39912362483684505, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 25.81, |
|
"learning_rate": 5.938375350140056e-05, |
|
"loss": 0.1561, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 25.81, |
|
"eval_loss": 0.32872405648231506, |
|
"eval_runtime": 208.2303, |
|
"eval_samples_per_second": 8.856, |
|
"eval_wer": 0.40164087264590714, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 26.61, |
|
"learning_rate": 5.7983193277310935e-05, |
|
"loss": 0.1459, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 26.61, |
|
"eval_loss": 0.3299988806247711, |
|
"eval_runtime": 208.2294, |
|
"eval_samples_per_second": 8.856, |
|
"eval_wer": 0.40173410404624277, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 27.42, |
|
"learning_rate": 5.658263305322129e-05, |
|
"loss": 0.1489, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 27.42, |
|
"eval_loss": 0.3266052305698395, |
|
"eval_runtime": 207.8609, |
|
"eval_samples_per_second": 8.871, |
|
"eval_wer": 0.3958605258250979, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 28.23, |
|
"learning_rate": 5.5182072829131656e-05, |
|
"loss": 0.1526, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 28.23, |
|
"eval_loss": 0.35196033120155334, |
|
"eval_runtime": 208.9297, |
|
"eval_samples_per_second": 8.826, |
|
"eval_wer": 0.39800484803281744, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 29.03, |
|
"learning_rate": 5.378151260504202e-05, |
|
"loss": 0.1533, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 29.03, |
|
"eval_loss": 0.3176701068878174, |
|
"eval_runtime": 208.8703, |
|
"eval_samples_per_second": 8.828, |
|
"eval_wer": 0.39567406302442665, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 29.84, |
|
"learning_rate": 5.2380952380952384e-05, |
|
"loss": 0.1396, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 29.84, |
|
"eval_loss": 0.32652196288108826, |
|
"eval_runtime": 208.1553, |
|
"eval_samples_per_second": 8.859, |
|
"eval_wer": 0.3936229722170427, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 30.65, |
|
"learning_rate": 5.0980392156862745e-05, |
|
"loss": 0.1392, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 30.65, |
|
"eval_loss": 0.31360137462615967, |
|
"eval_runtime": 209.7641, |
|
"eval_samples_per_second": 8.791, |
|
"eval_wer": 0.39119895580831626, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 31.45, |
|
"learning_rate": 4.957983193277311e-05, |
|
"loss": 0.1358, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 31.45, |
|
"eval_loss": 0.31799858808517456, |
|
"eval_runtime": 209.0208, |
|
"eval_samples_per_second": 8.822, |
|
"eval_wer": 0.3893343278016036, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 32.26, |
|
"learning_rate": 4.817927170868347e-05, |
|
"loss": 0.1401, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 32.26, |
|
"eval_loss": 0.3084213137626648, |
|
"eval_runtime": 209.0337, |
|
"eval_samples_per_second": 8.822, |
|
"eval_wer": 0.38607122878985645, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 33.06, |
|
"learning_rate": 4.677871148459384e-05, |
|
"loss": 0.1327, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 33.06, |
|
"eval_loss": 0.3314739763736725, |
|
"eval_runtime": 209.2003, |
|
"eval_samples_per_second": 8.815, |
|
"eval_wer": 0.3857915345888495, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 33.87, |
|
"learning_rate": 4.53781512605042e-05, |
|
"loss": 0.1273, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 33.87, |
|
"eval_loss": 0.32433462142944336, |
|
"eval_runtime": 208.6782, |
|
"eval_samples_per_second": 8.837, |
|
"eval_wer": 0.388215550997576, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 34.68, |
|
"learning_rate": 4.397759103641457e-05, |
|
"loss": 2.8674, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 34.68, |
|
"eval_loss": 0.4206547737121582, |
|
"eval_runtime": 255.7774, |
|
"eval_samples_per_second": 7.209, |
|
"eval_wer": 0.2714898377773634, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 35.48, |
|
"learning_rate": 4.257703081232493e-05, |
|
"loss": 0.2443, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 35.48, |
|
"eval_loss": 0.3481670320034027, |
|
"eval_runtime": 258.3191, |
|
"eval_samples_per_second": 7.138, |
|
"eval_wer": 0.2341972776431102, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 36.29, |
|
"learning_rate": 4.11764705882353e-05, |
|
"loss": 0.1918, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 36.29, |
|
"eval_loss": 0.35066932439804077, |
|
"eval_runtime": 260.0692, |
|
"eval_samples_per_second": 7.09, |
|
"eval_wer": 0.23074771583069179, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 37.1, |
|
"learning_rate": 3.977591036414566e-05, |
|
"loss": 0.1678, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 37.1, |
|
"eval_loss": 0.3326978087425232, |
|
"eval_runtime": 260.7521, |
|
"eval_samples_per_second": 7.072, |
|
"eval_wer": 0.22673876561625955, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 37.9, |
|
"learning_rate": 3.8375350140056026e-05, |
|
"loss": 0.1544, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 37.9, |
|
"eval_loss": 0.3412529230117798, |
|
"eval_runtime": 260.8062, |
|
"eval_samples_per_second": 7.07, |
|
"eval_wer": 0.22440798060786873, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 38.71, |
|
"learning_rate": 3.697478991596639e-05, |
|
"loss": 0.1475, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 38.71, |
|
"eval_loss": 0.33288225531578064, |
|
"eval_runtime": 262.5936, |
|
"eval_samples_per_second": 7.022, |
|
"eval_wer": 0.22077195599477903, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 39.52, |
|
"learning_rate": 3.5574229691876754e-05, |
|
"loss": 0.1447, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 39.52, |
|
"eval_loss": 0.3270339071750641, |
|
"eval_runtime": 262.0824, |
|
"eval_samples_per_second": 7.036, |
|
"eval_wer": 0.21909379078873764, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 40.32, |
|
"learning_rate": 3.4173669467787114e-05, |
|
"loss": 0.1402, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 40.32, |
|
"eval_loss": 0.3369254171848297, |
|
"eval_runtime": 263.645, |
|
"eval_samples_per_second": 6.994, |
|
"eval_wer": 0.2214245757971285, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 41.13, |
|
"learning_rate": 3.277310924369748e-05, |
|
"loss": 0.1413, |
|
"step": 5100 |
|
}, |
|
{ |
|
"epoch": 41.13, |
|
"eval_loss": 0.3336828649044037, |
|
"eval_runtime": 263.0331, |
|
"eval_samples_per_second": 7.011, |
|
"eval_wer": 0.21946671639008017, |
|
"step": 5100 |
|
}, |
|
{ |
|
"epoch": 41.94, |
|
"learning_rate": 3.137254901960784e-05, |
|
"loss": 0.1381, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 41.94, |
|
"eval_loss": 0.323373407125473, |
|
"eval_runtime": 262.7696, |
|
"eval_samples_per_second": 7.018, |
|
"eval_wer": 0.214432220771956, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 42.74, |
|
"learning_rate": 2.9971988795518207e-05, |
|
"loss": 0.1257, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 42.74, |
|
"eval_loss": 0.32813942432403564, |
|
"eval_runtime": 262.9096, |
|
"eval_samples_per_second": 7.014, |
|
"eval_wer": 0.21629684877866864, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 43.55, |
|
"learning_rate": 2.857142857142857e-05, |
|
"loss": 0.1276, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 43.55, |
|
"eval_loss": 0.3204418420791626, |
|
"eval_runtime": 262.6036, |
|
"eval_samples_per_second": 7.022, |
|
"eval_wer": 0.21946671639008017, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 44.35, |
|
"learning_rate": 2.7170868347338935e-05, |
|
"loss": 0.1248, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 44.35, |
|
"eval_loss": 0.3329363465309143, |
|
"eval_runtime": 273.4973, |
|
"eval_samples_per_second": 6.742, |
|
"eval_wer": 0.21722916278202498, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 45.16, |
|
"learning_rate": 2.57703081232493e-05, |
|
"loss": 0.1287, |
|
"step": 5600 |
|
}, |
|
{ |
|
"epoch": 45.16, |
|
"eval_loss": 0.31906744837760925, |
|
"eval_runtime": 274.362, |
|
"eval_samples_per_second": 6.721, |
|
"eval_wer": 0.21284728696625024, |
|
"step": 5600 |
|
}, |
|
{ |
|
"epoch": 45.97, |
|
"learning_rate": 2.4369747899159663e-05, |
|
"loss": 0.1215, |
|
"step": 5700 |
|
}, |
|
{ |
|
"epoch": 45.97, |
|
"eval_loss": 0.3277473747730255, |
|
"eval_runtime": 273.8431, |
|
"eval_samples_per_second": 6.734, |
|
"eval_wer": 0.21517807197464106, |
|
"step": 5700 |
|
}, |
|
{ |
|
"epoch": 46.77, |
|
"learning_rate": 2.2969187675070027e-05, |
|
"loss": 0.1219, |
|
"step": 5800 |
|
}, |
|
{ |
|
"epoch": 46.77, |
|
"eval_loss": 0.3112068772315979, |
|
"eval_runtime": 272.6473, |
|
"eval_samples_per_second": 6.763, |
|
"eval_wer": 0.20995711355584562, |
|
"step": 5800 |
|
}, |
|
{ |
|
"epoch": 47.58, |
|
"learning_rate": 2.1568627450980395e-05, |
|
"loss": 0.1179, |
|
"step": 5900 |
|
}, |
|
{ |
|
"epoch": 47.58, |
|
"eval_loss": 0.3236621618270874, |
|
"eval_runtime": 264.1309, |
|
"eval_samples_per_second": 6.981, |
|
"eval_wer": 0.21461868357262726, |
|
"step": 5900 |
|
}, |
|
{ |
|
"epoch": 48.39, |
|
"learning_rate": 2.016806722689076e-05, |
|
"loss": 0.1188, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 48.39, |
|
"eval_loss": 0.3213033080101013, |
|
"eval_runtime": 263.9442, |
|
"eval_samples_per_second": 6.986, |
|
"eval_wer": 0.21126235316054448, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 49.19, |
|
"learning_rate": 1.876750700280112e-05, |
|
"loss": 0.1243, |
|
"step": 6100 |
|
}, |
|
{ |
|
"epoch": 49.19, |
|
"eval_loss": 0.32063964009284973, |
|
"eval_runtime": 265.6074, |
|
"eval_samples_per_second": 6.943, |
|
"eval_wer": 0.21368636956927092, |
|
"step": 6100 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 1.7366946778711484e-05, |
|
"loss": 0.1162, |
|
"step": 6200 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_loss": 0.31902745366096497, |
|
"eval_runtime": 264.7304, |
|
"eval_samples_per_second": 6.966, |
|
"eval_wer": 0.20949095655416744, |
|
"step": 6200 |
|
}, |
|
{ |
|
"epoch": 50.81, |
|
"learning_rate": 1.5966386554621848e-05, |
|
"loss": 0.1274, |
|
"step": 6300 |
|
}, |
|
{ |
|
"epoch": 50.81, |
|
"eval_loss": 0.3174721896648407, |
|
"eval_runtime": 265.1372, |
|
"eval_samples_per_second": 6.955, |
|
"eval_wer": 0.21070296475853068, |
|
"step": 6300 |
|
}, |
|
{ |
|
"epoch": 51.61, |
|
"learning_rate": 1.4565826330532215e-05, |
|
"loss": 0.1179, |
|
"step": 6400 |
|
}, |
|
{ |
|
"epoch": 51.61, |
|
"eval_loss": 0.32639437913894653, |
|
"eval_runtime": 264.7128, |
|
"eval_samples_per_second": 6.966, |
|
"eval_wer": 0.2127540555659146, |
|
"step": 6400 |
|
}, |
|
{ |
|
"epoch": 52.42, |
|
"learning_rate": 1.3165266106442578e-05, |
|
"loss": 0.1084, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 52.42, |
|
"eval_loss": 0.3261864185333252, |
|
"eval_runtime": 265.2652, |
|
"eval_samples_per_second": 6.952, |
|
"eval_wer": 0.211635278761887, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 53.23, |
|
"learning_rate": 1.1764705882352942e-05, |
|
"loss": 0.123, |
|
"step": 6600 |
|
}, |
|
{ |
|
"epoch": 53.23, |
|
"eval_loss": 0.31353211402893066, |
|
"eval_runtime": 265.8012, |
|
"eval_samples_per_second": 6.938, |
|
"eval_wer": 0.2119149729628939, |
|
"step": 6600 |
|
}, |
|
{ |
|
"epoch": 54.03, |
|
"learning_rate": 1.0364145658263306e-05, |
|
"loss": 0.1077, |
|
"step": 6700 |
|
}, |
|
{ |
|
"epoch": 54.03, |
|
"eval_loss": 0.31938183307647705, |
|
"eval_runtime": 265.3957, |
|
"eval_samples_per_second": 6.948, |
|
"eval_wer": 0.21060973335819505, |
|
"step": 6700 |
|
}, |
|
{ |
|
"epoch": 54.84, |
|
"learning_rate": 8.96358543417367e-06, |
|
"loss": 0.1088, |
|
"step": 6800 |
|
}, |
|
{ |
|
"epoch": 54.84, |
|
"eval_loss": 0.3212938904762268, |
|
"eval_runtime": 266.6583, |
|
"eval_samples_per_second": 6.915, |
|
"eval_wer": 0.21088942755920195, |
|
"step": 6800 |
|
}, |
|
{ |
|
"epoch": 55.65, |
|
"learning_rate": 7.563025210084033e-06, |
|
"loss": 0.1085, |
|
"step": 6900 |
|
}, |
|
{ |
|
"epoch": 55.65, |
|
"eval_loss": 0.320252925157547, |
|
"eval_runtime": 266.7391, |
|
"eval_samples_per_second": 6.913, |
|
"eval_wer": 0.21060973335819505, |
|
"step": 6900 |
|
}, |
|
{ |
|
"epoch": 56.45, |
|
"learning_rate": 6.162464985994398e-06, |
|
"loss": 0.1084, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 56.45, |
|
"eval_loss": 0.32074451446533203, |
|
"eval_runtime": 265.9571, |
|
"eval_samples_per_second": 6.933, |
|
"eval_wer": 0.2093044937534962, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 57.26, |
|
"learning_rate": 4.7619047619047615e-06, |
|
"loss": 0.1086, |
|
"step": 7100 |
|
}, |
|
{ |
|
"epoch": 57.26, |
|
"eval_loss": 0.3232016861438751, |
|
"eval_runtime": 267.1546, |
|
"eval_samples_per_second": 6.902, |
|
"eval_wer": 0.20874510535148239, |
|
"step": 7100 |
|
}, |
|
{ |
|
"epoch": 58.06, |
|
"learning_rate": 3.361344537815126e-06, |
|
"loss": 0.106, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 58.06, |
|
"eval_loss": 0.3231372535228729, |
|
"eval_runtime": 266.9142, |
|
"eval_samples_per_second": 6.909, |
|
"eval_wer": 0.2093044937534962, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 58.87, |
|
"learning_rate": 1.96078431372549e-06, |
|
"loss": 0.1097, |
|
"step": 7300 |
|
}, |
|
{ |
|
"epoch": 58.87, |
|
"eval_loss": 0.32339319586753845, |
|
"eval_runtime": 270.5457, |
|
"eval_samples_per_second": 6.816, |
|
"eval_wer": 0.208838336751818, |
|
"step": 7300 |
|
}, |
|
{ |
|
"epoch": 59.68, |
|
"learning_rate": 5.602240896358544e-07, |
|
"loss": 0.1033, |
|
"step": 7400 |
|
}, |
|
{ |
|
"epoch": 59.68, |
|
"eval_loss": 0.32322752475738525, |
|
"eval_runtime": 275.739, |
|
"eval_samples_per_second": 6.687, |
|
"eval_wer": 0.208838336751818, |
|
"step": 7400 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"step": 7440, |
|
"total_flos": 2.7385342136046084e+19, |
|
"train_runtime": 22157.5951, |
|
"train_samples_per_second": 0.336 |
|
} |
|
], |
|
"max_steps": 7440, |
|
"num_train_epochs": 60, |
|
"total_flos": 2.7385342136046084e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|