|
{ |
|
"best_metric": 0.13642320036888123, |
|
"best_model_checkpoint": "wav2vec2-large-xlsr-mecita-coraa-portuguese-random-all-03/checkpoint-3182", |
|
"epoch": 57.0, |
|
"global_step": 4902, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"learning_rate": 3e-05, |
|
"loss": 29.1535, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 3.1676151752471924, |
|
"eval_runtime": 5.9631, |
|
"eval_samples_per_second": 57.185, |
|
"eval_steps_per_second": 7.211, |
|
"eval_wer": 1.0, |
|
"step": 86 |
|
}, |
|
{ |
|
"epoch": 1.16, |
|
"learning_rate": 2.9661627906976745e-05, |
|
"loss": 7.924, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.9288899898529053, |
|
"eval_runtime": 6.0836, |
|
"eval_samples_per_second": 56.053, |
|
"eval_steps_per_second": 7.068, |
|
"eval_wer": 1.0, |
|
"step": 172 |
|
}, |
|
{ |
|
"epoch": 2.33, |
|
"learning_rate": 2.931279069767442e-05, |
|
"loss": 3.0115, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.8972272872924805, |
|
"eval_runtime": 6.4814, |
|
"eval_samples_per_second": 52.612, |
|
"eval_steps_per_second": 6.634, |
|
"eval_wer": 1.0, |
|
"step": 258 |
|
}, |
|
{ |
|
"epoch": 3.49, |
|
"learning_rate": 2.8963953488372093e-05, |
|
"loss": 2.9304, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.887695550918579, |
|
"eval_runtime": 6.205, |
|
"eval_samples_per_second": 54.956, |
|
"eval_steps_per_second": 6.93, |
|
"eval_wer": 1.0, |
|
"step": 344 |
|
}, |
|
{ |
|
"epoch": 4.65, |
|
"learning_rate": 2.861511627906977e-05, |
|
"loss": 2.9073, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.857363224029541, |
|
"eval_runtime": 5.8413, |
|
"eval_samples_per_second": 58.377, |
|
"eval_steps_per_second": 7.361, |
|
"eval_wer": 1.0, |
|
"step": 430 |
|
}, |
|
{ |
|
"epoch": 5.81, |
|
"learning_rate": 2.8266279069767444e-05, |
|
"loss": 2.7919, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.674222480032127, |
|
"eval_loss": 1.9143861532211304, |
|
"eval_runtime": 6.2962, |
|
"eval_samples_per_second": 54.159, |
|
"eval_steps_per_second": 6.829, |
|
"eval_wer": 1.0, |
|
"step": 516 |
|
}, |
|
{ |
|
"epoch": 6.98, |
|
"learning_rate": 2.7917441860465118e-05, |
|
"loss": 1.6061, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.07661416268796573, |
|
"eval_loss": 0.543914258480072, |
|
"eval_runtime": 5.8137, |
|
"eval_samples_per_second": 58.654, |
|
"eval_steps_per_second": 7.396, |
|
"eval_wer": 0.2885666745899691, |
|
"step": 602 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.055776181339520774, |
|
"eval_loss": 0.37258943915367126, |
|
"eval_runtime": 6.0487, |
|
"eval_samples_per_second": 56.376, |
|
"eval_steps_per_second": 7.109, |
|
"eval_wer": 0.19491323983836464, |
|
"step": 688 |
|
}, |
|
{ |
|
"epoch": 8.14, |
|
"learning_rate": 2.7568604651162792e-05, |
|
"loss": 0.7808, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.05167105439293204, |
|
"eval_loss": 0.2959502637386322, |
|
"eval_runtime": 5.8892, |
|
"eval_samples_per_second": 57.902, |
|
"eval_steps_per_second": 7.301, |
|
"eval_wer": 0.18183979082481577, |
|
"step": 774 |
|
}, |
|
{ |
|
"epoch": 9.3, |
|
"learning_rate": 2.7219767441860466e-05, |
|
"loss": 0.5543, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.04774441122662978, |
|
"eval_loss": 0.259117066860199, |
|
"eval_runtime": 5.9755, |
|
"eval_samples_per_second": 57.066, |
|
"eval_steps_per_second": 7.196, |
|
"eval_wer": 0.16876634181126693, |
|
"step": 860 |
|
}, |
|
{ |
|
"epoch": 10.47, |
|
"learning_rate": 2.6870930232558143e-05, |
|
"loss": 0.4721, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.04265762348846549, |
|
"eval_loss": 0.23672477900981903, |
|
"eval_runtime": 6.0691, |
|
"eval_samples_per_second": 56.186, |
|
"eval_steps_per_second": 7.085, |
|
"eval_wer": 0.14452103636795816, |
|
"step": 946 |
|
}, |
|
{ |
|
"epoch": 11.63, |
|
"learning_rate": 2.6522093023255817e-05, |
|
"loss": 0.414, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.037615456695372806, |
|
"eval_loss": 0.21672293543815613, |
|
"eval_runtime": 6.2518, |
|
"eval_samples_per_second": 54.545, |
|
"eval_steps_per_second": 6.878, |
|
"eval_wer": 0.12598050867601615, |
|
"step": 1032 |
|
}, |
|
{ |
|
"epoch": 12.79, |
|
"learning_rate": 2.617325581395349e-05, |
|
"loss": 0.3819, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.03502744188121904, |
|
"eval_loss": 0.1979241967201233, |
|
"eval_runtime": 5.8651, |
|
"eval_samples_per_second": 58.141, |
|
"eval_steps_per_second": 7.332, |
|
"eval_wer": 0.11504635131922986, |
|
"step": 1118 |
|
}, |
|
{ |
|
"epoch": 13.95, |
|
"learning_rate": 2.5824418604651165e-05, |
|
"loss": 0.3376, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.03462585337557449, |
|
"eval_loss": 0.1877206414937973, |
|
"eval_runtime": 6.3492, |
|
"eval_samples_per_second": 53.708, |
|
"eval_steps_per_second": 6.773, |
|
"eval_wer": 0.11694794390301878, |
|
"step": 1204 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.03346570880371246, |
|
"eval_loss": 0.17655867338180542, |
|
"eval_runtime": 6.0868, |
|
"eval_samples_per_second": 56.023, |
|
"eval_steps_per_second": 7.065, |
|
"eval_wer": 0.10839077727596863, |
|
"step": 1290 |
|
}, |
|
{ |
|
"epoch": 15.12, |
|
"learning_rate": 2.547558139534884e-05, |
|
"loss": 0.3199, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.032260943286778816, |
|
"eval_loss": 0.175409734249115, |
|
"eval_runtime": 6.3852, |
|
"eval_samples_per_second": 53.405, |
|
"eval_steps_per_second": 6.734, |
|
"eval_wer": 0.10316139767054909, |
|
"step": 1376 |
|
}, |
|
{ |
|
"epoch": 16.28, |
|
"learning_rate": 2.512674418604651e-05, |
|
"loss": 0.3174, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.031547008165632946, |
|
"eval_loss": 0.1697303056716919, |
|
"eval_runtime": 6.098, |
|
"eval_samples_per_second": 55.92, |
|
"eval_steps_per_second": 7.051, |
|
"eval_wer": 0.10173520323270739, |
|
"step": 1462 |
|
}, |
|
{ |
|
"epoch": 17.44, |
|
"learning_rate": 2.4777906976744186e-05, |
|
"loss": 0.2747, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.030788452099415466, |
|
"eval_loss": 0.1668318510055542, |
|
"eval_runtime": 6.0816, |
|
"eval_samples_per_second": 56.071, |
|
"eval_steps_per_second": 7.071, |
|
"eval_wer": 0.09626812455431424, |
|
"step": 1548 |
|
}, |
|
{ |
|
"epoch": 18.6, |
|
"learning_rate": 2.442906976744186e-05, |
|
"loss": 0.2618, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.0300745169782696, |
|
"eval_loss": 0.16257551312446594, |
|
"eval_runtime": 5.9751, |
|
"eval_samples_per_second": 57.07, |
|
"eval_steps_per_second": 7.197, |
|
"eval_wer": 0.09365343475160447, |
|
"step": 1634 |
|
}, |
|
{ |
|
"epoch": 19.77, |
|
"learning_rate": 2.4080232558139534e-05, |
|
"loss": 0.2557, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.029851412252911515, |
|
"eval_loss": 0.15971209108829498, |
|
"eval_runtime": 6.1983, |
|
"eval_samples_per_second": 55.015, |
|
"eval_steps_per_second": 6.937, |
|
"eval_wer": 0.09460423104349892, |
|
"step": 1720 |
|
}, |
|
{ |
|
"epoch": 20.93, |
|
"learning_rate": 2.3731395348837208e-05, |
|
"loss": 0.2578, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_cer": 0.029628307527553435, |
|
"eval_loss": 0.15854881703853607, |
|
"eval_runtime": 6.6998, |
|
"eval_samples_per_second": 50.897, |
|
"eval_steps_per_second": 6.418, |
|
"eval_wer": 0.09436653197052532, |
|
"step": 1806 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.030163758868412834, |
|
"eval_loss": 0.15489967167377472, |
|
"eval_runtime": 5.8895, |
|
"eval_samples_per_second": 57.899, |
|
"eval_steps_per_second": 7.301, |
|
"eval_wer": 0.09650582362728785, |
|
"step": 1892 |
|
}, |
|
{ |
|
"epoch": 22.09, |
|
"learning_rate": 2.3382558139534882e-05, |
|
"loss": 0.2288, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_cer": 0.02837892106554817, |
|
"eval_loss": 0.15013234317302704, |
|
"eval_runtime": 5.9578, |
|
"eval_samples_per_second": 57.236, |
|
"eval_steps_per_second": 7.217, |
|
"eval_wer": 0.09389113382457809, |
|
"step": 1978 |
|
}, |
|
{ |
|
"epoch": 23.26, |
|
"learning_rate": 2.303372093023256e-05, |
|
"loss": 0.2269, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.029092856186694036, |
|
"eval_loss": 0.15236006677150726, |
|
"eval_runtime": 6.4802, |
|
"eval_samples_per_second": 52.622, |
|
"eval_steps_per_second": 6.636, |
|
"eval_wer": 0.09436653197052532, |
|
"step": 2064 |
|
}, |
|
{ |
|
"epoch": 24.42, |
|
"learning_rate": 2.2684883720930233e-05, |
|
"loss": 0.2327, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 0.028111195395118468, |
|
"eval_loss": 0.14761987328529358, |
|
"eval_runtime": 5.9425, |
|
"eval_samples_per_second": 57.383, |
|
"eval_steps_per_second": 7.236, |
|
"eval_wer": 0.09032564772997385, |
|
"step": 2150 |
|
}, |
|
{ |
|
"epoch": 25.58, |
|
"learning_rate": 2.2336046511627907e-05, |
|
"loss": 0.2024, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.028423542010619786, |
|
"eval_loss": 0.14807896316051483, |
|
"eval_runtime": 6.0178, |
|
"eval_samples_per_second": 56.665, |
|
"eval_steps_per_second": 7.145, |
|
"eval_wer": 0.09032564772997385, |
|
"step": 2236 |
|
}, |
|
{ |
|
"epoch": 26.74, |
|
"learning_rate": 2.198720930232558e-05, |
|
"loss": 0.2056, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_cer": 0.02837892106554817, |
|
"eval_loss": 0.1433907002210617, |
|
"eval_runtime": 6.0685, |
|
"eval_samples_per_second": 56.192, |
|
"eval_steps_per_second": 7.086, |
|
"eval_wer": 0.09246493938673639, |
|
"step": 2322 |
|
}, |
|
{ |
|
"epoch": 27.91, |
|
"learning_rate": 2.1638372093023255e-05, |
|
"loss": 0.2097, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.028021953504975234, |
|
"eval_loss": 0.1468418389558792, |
|
"eval_runtime": 7.6911, |
|
"eval_samples_per_second": 44.337, |
|
"eval_steps_per_second": 5.591, |
|
"eval_wer": 0.0893748514380794, |
|
"step": 2408 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_cer": 0.02730801838382937, |
|
"eval_loss": 0.14347784221172333, |
|
"eval_runtime": 6.2489, |
|
"eval_samples_per_second": 54.569, |
|
"eval_steps_per_second": 6.881, |
|
"eval_wer": 0.08604706441644877, |
|
"step": 2494 |
|
}, |
|
{ |
|
"epoch": 29.07, |
|
"learning_rate": 2.128953488372093e-05, |
|
"loss": 0.2177, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.028111195395118468, |
|
"eval_loss": 0.14982478320598602, |
|
"eval_runtime": 6.7618, |
|
"eval_samples_per_second": 50.43, |
|
"eval_steps_per_second": 6.359, |
|
"eval_wer": 0.08771095792726408, |
|
"step": 2580 |
|
}, |
|
{ |
|
"epoch": 30.23, |
|
"learning_rate": 2.0940697674418606e-05, |
|
"loss": 0.1935, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_cer": 0.027798848779617153, |
|
"eval_loss": 0.14517097175121307, |
|
"eval_runtime": 5.9019, |
|
"eval_samples_per_second": 57.778, |
|
"eval_steps_per_second": 7.286, |
|
"eval_wer": 0.08913715236510578, |
|
"step": 2666 |
|
}, |
|
{ |
|
"epoch": 31.4, |
|
"learning_rate": 2.059186046511628e-05, |
|
"loss": 0.1918, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.027486502164115835, |
|
"eval_loss": 0.14662335813045502, |
|
"eval_runtime": 6.9556, |
|
"eval_samples_per_second": 49.026, |
|
"eval_steps_per_second": 6.182, |
|
"eval_wer": 0.08485856905158069, |
|
"step": 2752 |
|
}, |
|
{ |
|
"epoch": 32.56, |
|
"learning_rate": 2.0243023255813954e-05, |
|
"loss": 0.1805, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_cer": 0.028155816340190085, |
|
"eval_loss": 0.14373721182346344, |
|
"eval_runtime": 6.2565, |
|
"eval_samples_per_second": 54.504, |
|
"eval_steps_per_second": 6.873, |
|
"eval_wer": 0.08889945329213216, |
|
"step": 2838 |
|
}, |
|
{ |
|
"epoch": 33.72, |
|
"learning_rate": 1.9894186046511628e-05, |
|
"loss": 0.1805, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_cer": 0.027441881219044218, |
|
"eval_loss": 0.14093732833862305, |
|
"eval_runtime": 6.6898, |
|
"eval_samples_per_second": 50.973, |
|
"eval_steps_per_second": 6.428, |
|
"eval_wer": 0.08699786070834324, |
|
"step": 2924 |
|
}, |
|
{ |
|
"epoch": 34.88, |
|
"learning_rate": 1.9545348837209302e-05, |
|
"loss": 0.1835, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_cer": 0.027129534603542903, |
|
"eval_loss": 0.14223171770572662, |
|
"eval_runtime": 6.4219, |
|
"eval_samples_per_second": 53.099, |
|
"eval_steps_per_second": 6.696, |
|
"eval_wer": 0.08557166627050154, |
|
"step": 3010 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_cer": 0.026415599482397037, |
|
"eval_loss": 0.13766661286354065, |
|
"eval_runtime": 7.5399, |
|
"eval_samples_per_second": 45.226, |
|
"eval_steps_per_second": 5.703, |
|
"eval_wer": 0.08509626812455431, |
|
"step": 3096 |
|
}, |
|
{ |
|
"epoch": 36.05, |
|
"learning_rate": 1.919651162790698e-05, |
|
"loss": 0.1787, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_cer": 0.026683325152826738, |
|
"eval_loss": 0.13642320036888123, |
|
"eval_runtime": 6.5226, |
|
"eval_samples_per_second": 52.28, |
|
"eval_steps_per_second": 6.592, |
|
"eval_wer": 0.08438317090563346, |
|
"step": 3182 |
|
}, |
|
{ |
|
"epoch": 37.21, |
|
"learning_rate": 1.8847674418604653e-05, |
|
"loss": 0.1695, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_cer": 0.02677256704296997, |
|
"eval_loss": 0.14176321029663086, |
|
"eval_runtime": 6.3748, |
|
"eval_samples_per_second": 53.492, |
|
"eval_steps_per_second": 6.745, |
|
"eval_wer": 0.08485856905158069, |
|
"step": 3268 |
|
}, |
|
{ |
|
"epoch": 38.37, |
|
"learning_rate": 1.8498837209302327e-05, |
|
"loss": 0.1775, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_cer": 0.02704029271339967, |
|
"eval_loss": 0.1400807499885559, |
|
"eval_runtime": 6.1197, |
|
"eval_samples_per_second": 55.721, |
|
"eval_steps_per_second": 7.026, |
|
"eval_wer": 0.08438317090563346, |
|
"step": 3354 |
|
}, |
|
{ |
|
"epoch": 39.53, |
|
"learning_rate": 1.815e-05, |
|
"loss": 0.1763, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.02650484137254027, |
|
"eval_loss": 0.14022426307201385, |
|
"eval_runtime": 5.9433, |
|
"eval_samples_per_second": 57.375, |
|
"eval_steps_per_second": 7.235, |
|
"eval_wer": 0.08153078202995008, |
|
"step": 3440 |
|
}, |
|
{ |
|
"epoch": 40.7, |
|
"learning_rate": 1.7801162790697675e-05, |
|
"loss": 0.1702, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_cer": 0.026415599482397037, |
|
"eval_loss": 0.14177961647510529, |
|
"eval_runtime": 6.7266, |
|
"eval_samples_per_second": 50.694, |
|
"eval_steps_per_second": 6.393, |
|
"eval_wer": 0.08295697646779178, |
|
"step": 3526 |
|
}, |
|
{ |
|
"epoch": 41.86, |
|
"learning_rate": 1.7452325581395352e-05, |
|
"loss": 0.1569, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_cer": 0.02583552719646602, |
|
"eval_loss": 0.13996584713459015, |
|
"eval_runtime": 5.888, |
|
"eval_samples_per_second": 57.914, |
|
"eval_steps_per_second": 7.303, |
|
"eval_wer": 0.08248157832184455, |
|
"step": 3612 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_cer": 0.026192494757038953, |
|
"eval_loss": 0.14005370438098907, |
|
"eval_runtime": 5.8324, |
|
"eval_samples_per_second": 58.466, |
|
"eval_steps_per_second": 7.373, |
|
"eval_wer": 0.08153078202995008, |
|
"step": 3698 |
|
}, |
|
{ |
|
"epoch": 43.02, |
|
"learning_rate": 1.7103488372093026e-05, |
|
"loss": 0.1617, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_cer": 0.026192494757038953, |
|
"eval_loss": 0.14058516919612885, |
|
"eval_runtime": 6.1068, |
|
"eval_samples_per_second": 55.839, |
|
"eval_steps_per_second": 7.041, |
|
"eval_wer": 0.07915379130021392, |
|
"step": 3784 |
|
}, |
|
{ |
|
"epoch": 44.19, |
|
"learning_rate": 1.67546511627907e-05, |
|
"loss": 0.1596, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_cer": 0.02637097853732542, |
|
"eval_loss": 0.1394573301076889, |
|
"eval_runtime": 6.5093, |
|
"eval_samples_per_second": 52.386, |
|
"eval_steps_per_second": 6.606, |
|
"eval_wer": 0.0817684811029237, |
|
"step": 3870 |
|
}, |
|
{ |
|
"epoch": 45.35, |
|
"learning_rate": 1.6405813953488374e-05, |
|
"loss": 0.1431, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_cer": 0.026192494757038953, |
|
"eval_loss": 0.13823828101158142, |
|
"eval_runtime": 6.0067, |
|
"eval_samples_per_second": 56.77, |
|
"eval_steps_per_second": 7.159, |
|
"eval_wer": 0.08153078202995008, |
|
"step": 3956 |
|
}, |
|
{ |
|
"epoch": 46.51, |
|
"learning_rate": 1.6056976744186047e-05, |
|
"loss": 0.158, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_cer": 0.02650484137254027, |
|
"eval_loss": 0.13912436366081238, |
|
"eval_runtime": 6.0425, |
|
"eval_samples_per_second": 56.433, |
|
"eval_steps_per_second": 7.116, |
|
"eval_wer": 0.08129308295697647, |
|
"step": 4042 |
|
}, |
|
{ |
|
"epoch": 47.67, |
|
"learning_rate": 1.570813953488372e-05, |
|
"loss": 0.1552, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_cer": 0.026594083262683504, |
|
"eval_loss": 0.13926950097084045, |
|
"eval_runtime": 6.5183, |
|
"eval_samples_per_second": 52.314, |
|
"eval_steps_per_second": 6.597, |
|
"eval_wer": 0.08248157832184455, |
|
"step": 4128 |
|
}, |
|
{ |
|
"epoch": 48.84, |
|
"learning_rate": 1.5359302325581395e-05, |
|
"loss": 0.1379, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_cer": 0.025612422471107937, |
|
"eval_loss": 0.13708749413490295, |
|
"eval_runtime": 6.0023, |
|
"eval_samples_per_second": 56.811, |
|
"eval_steps_per_second": 7.164, |
|
"eval_wer": 0.08105538388400285, |
|
"step": 4214 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 1.5010465116279071e-05, |
|
"loss": 0.145, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.02556780152603632, |
|
"eval_loss": 0.1392103135585785, |
|
"eval_runtime": 7.2777, |
|
"eval_samples_per_second": 46.855, |
|
"eval_steps_per_second": 5.908, |
|
"eval_wer": 0.0801045875921084, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_cer": 0.02623711570211057, |
|
"eval_loss": 0.14161016047000885, |
|
"eval_runtime": 6.4267, |
|
"eval_samples_per_second": 53.06, |
|
"eval_steps_per_second": 6.691, |
|
"eval_wer": 0.08200618017589731, |
|
"step": 4386 |
|
}, |
|
{ |
|
"epoch": 51.16, |
|
"learning_rate": 1.4661627906976745e-05, |
|
"loss": 0.1647, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_cer": 0.02556780152603632, |
|
"eval_loss": 0.13915704190731049, |
|
"eval_runtime": 6.1093, |
|
"eval_samples_per_second": 55.816, |
|
"eval_steps_per_second": 7.038, |
|
"eval_wer": 0.07891609222724032, |
|
"step": 4472 |
|
}, |
|
{ |
|
"epoch": 52.33, |
|
"learning_rate": 1.4312790697674419e-05, |
|
"loss": 0.1493, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_cer": 0.02570166436125117, |
|
"eval_loss": 0.14251555502414703, |
|
"eval_runtime": 6.4895, |
|
"eval_samples_per_second": 52.546, |
|
"eval_steps_per_second": 6.626, |
|
"eval_wer": 0.07939149037318755, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 53.49, |
|
"learning_rate": 1.3963953488372094e-05, |
|
"loss": 0.1492, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_cer": 0.025746285306322787, |
|
"eval_loss": 0.1419229656457901, |
|
"eval_runtime": 5.9077, |
|
"eval_samples_per_second": 57.721, |
|
"eval_steps_per_second": 7.279, |
|
"eval_wer": 0.07962918944616117, |
|
"step": 4644 |
|
}, |
|
{ |
|
"epoch": 54.65, |
|
"learning_rate": 1.3615116279069768e-05, |
|
"loss": 0.139, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_cer": 0.024987729240105304, |
|
"eval_loss": 0.13996940851211548, |
|
"eval_runtime": 5.9605, |
|
"eval_samples_per_second": 57.21, |
|
"eval_steps_per_second": 7.214, |
|
"eval_wer": 0.07582600427858331, |
|
"step": 4730 |
|
}, |
|
{ |
|
"epoch": 55.81, |
|
"learning_rate": 1.3266279069767444e-05, |
|
"loss": 0.1385, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_cer": 0.02534469680067824, |
|
"eval_loss": 0.1423511654138565, |
|
"eval_runtime": 6.5323, |
|
"eval_samples_per_second": 52.203, |
|
"eval_steps_per_second": 6.583, |
|
"eval_wer": 0.07915379130021392, |
|
"step": 4816 |
|
}, |
|
{ |
|
"epoch": 56.98, |
|
"learning_rate": 1.2917441860465116e-05, |
|
"loss": 0.128, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_cer": 0.025255454910535005, |
|
"eval_loss": 0.1403101086616516, |
|
"eval_runtime": 6.4807, |
|
"eval_samples_per_second": 52.618, |
|
"eval_steps_per_second": 6.635, |
|
"eval_wer": 0.08057998573805562, |
|
"step": 4902 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"step": 4902, |
|
"total_flos": 4.0970110980881424e+19, |
|
"train_loss": 0.6410711561475954, |
|
"train_runtime": 7770.6868, |
|
"train_samples_per_second": 35.299, |
|
"train_steps_per_second": 1.107 |
|
} |
|
], |
|
"max_steps": 8600, |
|
"num_train_epochs": 100, |
|
"total_flos": 4.0970110980881424e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|