|
{ |
|
"best_metric": 11.954752604166668, |
|
"best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/Whisper/NB-02.06/checkpoint-609", |
|
"epoch": 6.920454545454545, |
|
"eval_steps": 21, |
|
"global_step": 609, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.24, |
|
"eval_rundkast_loss": 1.514348030090332, |
|
"eval_rundkast_runtime": 267.2294, |
|
"eval_rundkast_samples_per_second": 5.011, |
|
"eval_rundkast_steps_per_second": 0.105, |
|
"eval_rundkast_wer": 17.877139657654777, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_nb_samtale_loss": 1.4326682090759277, |
|
"eval_nb_samtale_runtime": 128.5326, |
|
"eval_nb_samtale_samples_per_second": 4.147, |
|
"eval_nb_samtale_steps_per_second": 0.093, |
|
"eval_nb_samtale_wer": 16.89453125, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_bigbrother_loss": 2.1967878341674805, |
|
"eval_bigbrother_runtime": 274.0177, |
|
"eval_bigbrother_samples_per_second": 5.0, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 37.10625956658342, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_rundkast_loss": 1.4300581216812134, |
|
"eval_rundkast_runtime": 263.2899, |
|
"eval_rundkast_samples_per_second": 5.086, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 17.789153735402337, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_nb_samtale_loss": 1.3351885080337524, |
|
"eval_nb_samtale_runtime": 127.9406, |
|
"eval_nb_samtale_samples_per_second": 4.166, |
|
"eval_nb_samtale_steps_per_second": 0.094, |
|
"eval_nb_samtale_wer": 16.935221354166664, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_bigbrother_loss": 2.0810060501098633, |
|
"eval_bigbrother_runtime": 273.3743, |
|
"eval_bigbrother_samples_per_second": 5.011, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 36.81624103762185, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"eval_rundkast_loss": 1.298883080482483, |
|
"eval_rundkast_runtime": 264.443, |
|
"eval_rundkast_samples_per_second": 5.063, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 17.757158854583267, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"eval_nb_samtale_loss": 1.1716408729553223, |
|
"eval_nb_samtale_runtime": 128.1882, |
|
"eval_nb_samtale_samples_per_second": 4.158, |
|
"eval_nb_samtale_steps_per_second": 0.094, |
|
"eval_nb_samtale_wer": 17.024739583333336, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"eval_bigbrother_loss": 1.9180413484573364, |
|
"eval_bigbrother_runtime": 274.3045, |
|
"eval_bigbrother_samples_per_second": 4.994, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 36.67928784338999, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"eval_rundkast_loss": 1.1174129247665405, |
|
"eval_rundkast_runtime": 266.1387, |
|
"eval_rundkast_samples_per_second": 5.031, |
|
"eval_rundkast_steps_per_second": 0.105, |
|
"eval_rundkast_wer": 17.765157574788034, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"eval_nb_samtale_loss": 0.95993971824646, |
|
"eval_nb_samtale_runtime": 128.381, |
|
"eval_nb_samtale_samples_per_second": 4.152, |
|
"eval_nb_samtale_steps_per_second": 0.093, |
|
"eval_nb_samtale_wer": 17.635091145833336, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"eval_bigbrother_loss": 1.7143659591674805, |
|
"eval_bigbrother_runtime": 275.348, |
|
"eval_bigbrother_samples_per_second": 4.976, |
|
"eval_bigbrother_steps_per_second": 0.105, |
|
"eval_bigbrother_wer": 36.69539998388786, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"grad_norm": 12.247305870056152, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 1.2113, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_rundkast_loss": 0.920071542263031, |
|
"eval_rundkast_runtime": 265.1068, |
|
"eval_rundkast_samples_per_second": 5.051, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 17.653175491921292, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_nb_samtale_loss": 0.777379035949707, |
|
"eval_nb_samtale_runtime": 128.2654, |
|
"eval_nb_samtale_samples_per_second": 4.155, |
|
"eval_nb_samtale_steps_per_second": 0.094, |
|
"eval_nb_samtale_wer": 17.195638020833336, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_bigbrother_loss": 1.4940869808197021, |
|
"eval_bigbrother_runtime": 273.3462, |
|
"eval_bigbrother_samples_per_second": 5.012, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 36.85652138886651, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"eval_rundkast_loss": 0.7526112794876099, |
|
"eval_rundkast_runtime": 263.7468, |
|
"eval_rundkast_samples_per_second": 5.077, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 17.325227963525837, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"eval_nb_samtale_loss": 0.6493657231330872, |
|
"eval_nb_samtale_runtime": 128.8699, |
|
"eval_nb_samtale_samples_per_second": 4.136, |
|
"eval_nb_samtale_steps_per_second": 0.093, |
|
"eval_nb_samtale_wer": 16.162109375, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"eval_bigbrother_loss": 1.2856446504592896, |
|
"eval_bigbrother_runtime": 274.6648, |
|
"eval_bigbrother_samples_per_second": 4.988, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 35.73672762426489, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"eval_rundkast_loss": 0.6184744238853455, |
|
"eval_rundkast_runtime": 264.7084, |
|
"eval_rundkast_samples_per_second": 5.058, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 17.04527275635898, |
|
"step": 147 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"eval_nb_samtale_loss": 0.55622398853302, |
|
"eval_nb_samtale_runtime": 128.1926, |
|
"eval_nb_samtale_samples_per_second": 4.158, |
|
"eval_nb_samtale_steps_per_second": 0.094, |
|
"eval_nb_samtale_wer": 15.388997395833334, |
|
"step": 147 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"eval_bigbrother_loss": 1.117920994758606, |
|
"eval_bigbrother_runtime": 275.1798, |
|
"eval_bigbrother_samples_per_second": 4.979, |
|
"eval_bigbrother_steps_per_second": 0.105, |
|
"eval_bigbrother_wer": 35.688391202771285, |
|
"step": 147 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"eval_rundkast_loss": 0.5196747779846191, |
|
"eval_rundkast_runtime": 264.025, |
|
"eval_rundkast_samples_per_second": 5.071, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 16.73332266837306, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"eval_nb_samtale_loss": 0.48537084460258484, |
|
"eval_nb_samtale_runtime": 130.6175, |
|
"eval_nb_samtale_samples_per_second": 4.081, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 15.087890625, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"eval_bigbrother_loss": 0.993186891078949, |
|
"eval_bigbrother_runtime": 272.8105, |
|
"eval_bigbrother_samples_per_second": 5.022, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 35.42254088455651, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 2.15, |
|
"eval_rundkast_loss": 0.46956706047058105, |
|
"eval_rundkast_runtime": 265.2136, |
|
"eval_rundkast_samples_per_second": 5.049, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 16.309390497520397, |
|
"step": 189 |
|
}, |
|
{ |
|
"epoch": 2.15, |
|
"eval_nb_samtale_loss": 0.43936076760292053, |
|
"eval_nb_samtale_runtime": 130.644, |
|
"eval_nb_samtale_samples_per_second": 4.08, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 14.925130208333334, |
|
"step": 189 |
|
}, |
|
{ |
|
"epoch": 2.15, |
|
"eval_bigbrother_loss": 0.9301990866661072, |
|
"eval_bigbrother_runtime": 274.7257, |
|
"eval_bigbrother_samples_per_second": 4.987, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 35.237251268831066, |
|
"step": 189 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"grad_norm": 3.6259799003601074, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.5775, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"eval_rundkast_loss": 0.4360753893852234, |
|
"eval_rundkast_runtime": 264.6712, |
|
"eval_rundkast_samples_per_second": 5.059, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 16.061430171172614, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"eval_nb_samtale_loss": 0.40685713291168213, |
|
"eval_nb_samtale_runtime": 131.2828, |
|
"eval_nb_samtale_samples_per_second": 4.06, |
|
"eval_nb_samtale_steps_per_second": 0.091, |
|
"eval_nb_samtale_wer": 14.640299479166666, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"eval_bigbrother_loss": 0.8864747881889343, |
|
"eval_bigbrother_runtime": 276.0432, |
|
"eval_bigbrother_samples_per_second": 4.963, |
|
"eval_bigbrother_steps_per_second": 0.105, |
|
"eval_bigbrother_wer": 36.30065254169016, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 2.62, |
|
"eval_rundkast_loss": 0.4100657105445862, |
|
"eval_rundkast_runtime": 262.8044, |
|
"eval_rundkast_samples_per_second": 5.095, |
|
"eval_rundkast_steps_per_second": 0.107, |
|
"eval_rundkast_wer": 15.877459606462965, |
|
"step": 231 |
|
}, |
|
{ |
|
"epoch": 2.62, |
|
"eval_nb_samtale_loss": 0.3821322023868561, |
|
"eval_nb_samtale_runtime": 130.922, |
|
"eval_nb_samtale_samples_per_second": 4.071, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 14.420572916666666, |
|
"step": 231 |
|
}, |
|
{ |
|
"epoch": 2.62, |
|
"eval_bigbrother_loss": 0.8451758027076721, |
|
"eval_bigbrother_runtime": 280.5265, |
|
"eval_bigbrother_samples_per_second": 4.884, |
|
"eval_bigbrother_steps_per_second": 0.103, |
|
"eval_bigbrother_wer": 41.01345363731571, |
|
"step": 231 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"eval_rundkast_loss": 0.3871939480304718, |
|
"eval_rundkast_runtime": 263.4938, |
|
"eval_rundkast_samples_per_second": 5.082, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.66949288113902, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"eval_nb_samtale_loss": 0.3619038164615631, |
|
"eval_nb_samtale_runtime": 131.3433, |
|
"eval_nb_samtale_samples_per_second": 4.058, |
|
"eval_nb_samtale_steps_per_second": 0.091, |
|
"eval_nb_samtale_wer": 13.7939453125, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"eval_bigbrother_loss": 0.8229660987854004, |
|
"eval_bigbrother_runtime": 274.5883, |
|
"eval_bigbrother_samples_per_second": 4.989, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 35.42254088455651, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 3.1, |
|
"eval_rundkast_loss": 0.3819302022457123, |
|
"eval_rundkast_runtime": 264.1232, |
|
"eval_rundkast_samples_per_second": 5.07, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.62949928011518, |
|
"step": 273 |
|
}, |
|
{ |
|
"epoch": 3.1, |
|
"eval_nb_samtale_loss": 0.3480302095413208, |
|
"eval_nb_samtale_runtime": 131.3337, |
|
"eval_nb_samtale_samples_per_second": 4.058, |
|
"eval_nb_samtale_steps_per_second": 0.091, |
|
"eval_nb_samtale_wer": 13.6962890625, |
|
"step": 273 |
|
}, |
|
{ |
|
"epoch": 3.1, |
|
"eval_bigbrother_loss": 0.7991706728935242, |
|
"eval_bigbrother_runtime": 275.8969, |
|
"eval_bigbrother_samples_per_second": 4.966, |
|
"eval_bigbrother_steps_per_second": 0.105, |
|
"eval_bigbrother_wer": 36.510110368162415, |
|
"step": 273 |
|
}, |
|
{ |
|
"epoch": 3.34, |
|
"eval_rundkast_loss": 0.373095840215683, |
|
"eval_rundkast_runtime": 263.7758, |
|
"eval_rundkast_samples_per_second": 5.076, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.54951207806751, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 3.34, |
|
"eval_nb_samtale_loss": 0.33873096108436584, |
|
"eval_nb_samtale_runtime": 130.9933, |
|
"eval_nb_samtale_samples_per_second": 4.069, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 13.37890625, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 3.34, |
|
"eval_bigbrother_loss": 0.7896400690078735, |
|
"eval_bigbrother_runtime": 278.8566, |
|
"eval_bigbrother_samples_per_second": 4.913, |
|
"eval_bigbrother_steps_per_second": 0.104, |
|
"eval_bigbrother_wer": 37.299605252557804, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 3.41, |
|
"grad_norm": 2.6569244861602783, |
|
"learning_rate": 3e-06, |
|
"loss": 0.3439, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.58, |
|
"eval_rundkast_loss": 0.36107075214385986, |
|
"eval_rundkast_runtime": 264.3342, |
|
"eval_rundkast_samples_per_second": 5.066, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.469524876019836, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 3.58, |
|
"eval_nb_samtale_loss": 0.3277055621147156, |
|
"eval_nb_samtale_runtime": 130.9603, |
|
"eval_nb_samtale_samples_per_second": 4.07, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 13.191731770833334, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 3.58, |
|
"eval_bigbrother_loss": 0.7788997292518616, |
|
"eval_bigbrother_runtime": 274.084, |
|
"eval_bigbrother_samples_per_second": 4.998, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 34.92306452912269, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 3.82, |
|
"eval_rundkast_loss": 0.36361250281333923, |
|
"eval_rundkast_runtime": 261.275, |
|
"eval_rundkast_samples_per_second": 5.125, |
|
"eval_rundkast_steps_per_second": 0.107, |
|
"eval_rundkast_wer": 15.413533834586465, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 3.82, |
|
"eval_nb_samtale_loss": 0.32056552171707153, |
|
"eval_nb_samtale_runtime": 129.8079, |
|
"eval_nb_samtale_samples_per_second": 4.106, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 13.053385416666666, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 3.82, |
|
"eval_bigbrother_loss": 0.7767297029495239, |
|
"eval_bigbrother_runtime": 272.9633, |
|
"eval_bigbrother_samples_per_second": 5.019, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 35.22919519858213, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 4.06, |
|
"eval_rundkast_loss": 0.36683785915374756, |
|
"eval_rundkast_runtime": 265.3797, |
|
"eval_rundkast_samples_per_second": 5.046, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.173572228443449, |
|
"step": 357 |
|
}, |
|
{ |
|
"epoch": 4.06, |
|
"eval_nb_samtale_loss": 0.31466686725616455, |
|
"eval_nb_samtale_runtime": 129.9464, |
|
"eval_nb_samtale_samples_per_second": 4.102, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 12.996419270833334, |
|
"step": 357 |
|
}, |
|
{ |
|
"epoch": 4.06, |
|
"eval_bigbrother_loss": 0.7835009098052979, |
|
"eval_bigbrother_runtime": 277.5736, |
|
"eval_bigbrother_samples_per_second": 4.936, |
|
"eval_bigbrother_steps_per_second": 0.104, |
|
"eval_bigbrother_wer": 37.06597921533876, |
|
"step": 357 |
|
}, |
|
{ |
|
"epoch": 4.3, |
|
"eval_rundkast_loss": 0.3616587817668915, |
|
"eval_rundkast_runtime": 263.8209, |
|
"eval_rundkast_samples_per_second": 5.075, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.149576067829148, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 4.3, |
|
"eval_nb_samtale_loss": 0.31130969524383545, |
|
"eval_nb_samtale_runtime": 132.0306, |
|
"eval_nb_samtale_samples_per_second": 4.037, |
|
"eval_nb_samtale_steps_per_second": 0.091, |
|
"eval_nb_samtale_wer": 12.923177083333334, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 4.3, |
|
"eval_bigbrother_loss": 0.795174241065979, |
|
"eval_bigbrother_runtime": 277.1352, |
|
"eval_bigbrother_samples_per_second": 4.943, |
|
"eval_bigbrother_steps_per_second": 0.105, |
|
"eval_bigbrother_wer": 37.17070812857488, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 4.53, |
|
"eval_rundkast_loss": 0.36144548654556274, |
|
"eval_rundkast_runtime": 263.0031, |
|
"eval_rundkast_samples_per_second": 5.091, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.381538953767398, |
|
"step": 399 |
|
}, |
|
{ |
|
"epoch": 4.53, |
|
"eval_nb_samtale_loss": 0.30702516436576843, |
|
"eval_nb_samtale_runtime": 129.1297, |
|
"eval_nb_samtale_samples_per_second": 4.128, |
|
"eval_nb_samtale_steps_per_second": 0.093, |
|
"eval_nb_samtale_wer": 12.703450520833334, |
|
"step": 399 |
|
}, |
|
{ |
|
"epoch": 4.53, |
|
"eval_bigbrother_loss": 0.7950104475021362, |
|
"eval_bigbrother_runtime": 274.4695, |
|
"eval_bigbrother_samples_per_second": 4.991, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 34.74583098364617, |
|
"step": 399 |
|
}, |
|
{ |
|
"epoch": 4.55, |
|
"grad_norm": 3.0804500579833984, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.2472, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 4.77, |
|
"eval_rundkast_loss": 0.362693190574646, |
|
"eval_rundkast_runtime": 262.0631, |
|
"eval_rundkast_samples_per_second": 5.109, |
|
"eval_rundkast_steps_per_second": 0.107, |
|
"eval_rundkast_wer": 15.22956326987682, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 4.77, |
|
"eval_nb_samtale_loss": 0.30581969022750854, |
|
"eval_nb_samtale_runtime": 129.8604, |
|
"eval_nb_samtale_samples_per_second": 4.104, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 12.548828125, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 4.77, |
|
"eval_bigbrother_loss": 0.7997460961341858, |
|
"eval_bigbrother_runtime": 272.793, |
|
"eval_bigbrother_samples_per_second": 5.022, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 34.74583098364617, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 5.01, |
|
"eval_rundkast_loss": 0.3545509874820709, |
|
"eval_rundkast_runtime": 263.7902, |
|
"eval_rundkast_samples_per_second": 5.076, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.325547912334025, |
|
"step": 441 |
|
}, |
|
{ |
|
"epoch": 5.01, |
|
"eval_nb_samtale_loss": 0.3055456578731537, |
|
"eval_nb_samtale_runtime": 130.0706, |
|
"eval_nb_samtale_samples_per_second": 4.098, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 12.386067708333332, |
|
"step": 441 |
|
}, |
|
{ |
|
"epoch": 5.01, |
|
"eval_bigbrother_loss": 0.7725541591644287, |
|
"eval_bigbrother_runtime": 279.7798, |
|
"eval_bigbrother_samples_per_second": 4.897, |
|
"eval_bigbrother_steps_per_second": 0.104, |
|
"eval_bigbrother_wer": 37.6701844840087, |
|
"step": 441 |
|
}, |
|
{ |
|
"epoch": 5.25, |
|
"eval_rundkast_loss": 0.3629949688911438, |
|
"eval_rundkast_runtime": 261.4464, |
|
"eval_rundkast_samples_per_second": 5.122, |
|
"eval_rundkast_steps_per_second": 0.107, |
|
"eval_rundkast_wer": 15.30955047192449, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 5.25, |
|
"eval_nb_samtale_loss": 0.3084648847579956, |
|
"eval_nb_samtale_runtime": 128.7883, |
|
"eval_nb_samtale_samples_per_second": 4.139, |
|
"eval_nb_samtale_steps_per_second": 0.093, |
|
"eval_nb_samtale_wer": 12.3779296875, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 5.25, |
|
"eval_bigbrother_loss": 0.8035539388656616, |
|
"eval_bigbrother_runtime": 271.0588, |
|
"eval_bigbrother_samples_per_second": 5.054, |
|
"eval_bigbrother_steps_per_second": 0.107, |
|
"eval_bigbrother_wer": 34.43970031418674, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 5.49, |
|
"eval_rundkast_loss": 0.3648250699043274, |
|
"eval_rundkast_runtime": 264.7567, |
|
"eval_rundkast_samples_per_second": 5.057, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.189569668852984, |
|
"step": 483 |
|
}, |
|
{ |
|
"epoch": 5.49, |
|
"eval_nb_samtale_loss": 0.30580607056617737, |
|
"eval_nb_samtale_runtime": 130.4573, |
|
"eval_nb_samtale_samples_per_second": 4.086, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 12.288411458333332, |
|
"step": 483 |
|
}, |
|
{ |
|
"epoch": 5.49, |
|
"eval_bigbrother_loss": 0.8111706376075745, |
|
"eval_bigbrother_runtime": 273.5914, |
|
"eval_bigbrother_samples_per_second": 5.007, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 34.34302747119955, |
|
"step": 483 |
|
}, |
|
{ |
|
"epoch": 5.68, |
|
"grad_norm": 2.708979368209839, |
|
"learning_rate": 5e-06, |
|
"loss": 0.1864, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 5.73, |
|
"eval_rundkast_loss": 0.3714243173599243, |
|
"eval_rundkast_runtime": 264.8889, |
|
"eval_rundkast_samples_per_second": 5.055, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.213565829467285, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 5.73, |
|
"eval_nb_samtale_loss": 0.30661869049072266, |
|
"eval_nb_samtale_runtime": 129.9332, |
|
"eval_nb_samtale_samples_per_second": 4.102, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 12.3291015625, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 5.73, |
|
"eval_bigbrother_loss": 0.8136927485466003, |
|
"eval_bigbrother_runtime": 272.3894, |
|
"eval_bigbrother_samples_per_second": 5.03, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 34.5041488761782, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 5.97, |
|
"eval_rundkast_loss": 0.3704493045806885, |
|
"eval_rundkast_runtime": 263.3704, |
|
"eval_rundkast_samples_per_second": 5.084, |
|
"eval_rundkast_steps_per_second": 0.106, |
|
"eval_rundkast_wer": 15.261558150695889, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 5.97, |
|
"eval_nb_samtale_loss": 0.3032839298248291, |
|
"eval_nb_samtale_runtime": 128.4216, |
|
"eval_nb_samtale_samples_per_second": 4.15, |
|
"eval_nb_samtale_steps_per_second": 0.093, |
|
"eval_nb_samtale_wer": 12.3779296875, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 5.97, |
|
"eval_bigbrother_loss": 0.8149410486221313, |
|
"eval_bigbrother_runtime": 272.1944, |
|
"eval_bigbrother_samples_per_second": 5.033, |
|
"eval_bigbrother_steps_per_second": 0.107, |
|
"eval_bigbrother_wer": 34.81027954563764, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 6.2, |
|
"eval_rundkast_loss": 0.3849130868911743, |
|
"eval_rundkast_runtime": 261.0506, |
|
"eval_rundkast_samples_per_second": 5.129, |
|
"eval_rundkast_steps_per_second": 0.107, |
|
"eval_rundkast_wer": 15.061590145576709, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 6.2, |
|
"eval_nb_samtale_loss": 0.3138934373855591, |
|
"eval_nb_samtale_runtime": 130.4524, |
|
"eval_nb_samtale_samples_per_second": 4.086, |
|
"eval_nb_samtale_steps_per_second": 0.092, |
|
"eval_nb_samtale_wer": 12.052408854166668, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 6.2, |
|
"eval_bigbrother_loss": 0.8786391615867615, |
|
"eval_bigbrother_runtime": 271.5141, |
|
"eval_bigbrother_samples_per_second": 5.046, |
|
"eval_bigbrother_steps_per_second": 0.107, |
|
"eval_bigbrother_wer": 34.72166277289938, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 6.44, |
|
"eval_rundkast_loss": 0.38933807611465454, |
|
"eval_rundkast_runtime": 257.6232, |
|
"eval_rundkast_samples_per_second": 5.198, |
|
"eval_rundkast_steps_per_second": 0.109, |
|
"eval_rundkast_wer": 15.20556710926252, |
|
"step": 567 |
|
}, |
|
{ |
|
"epoch": 6.44, |
|
"eval_nb_samtale_loss": 0.3130148649215698, |
|
"eval_nb_samtale_runtime": 126.9397, |
|
"eval_nb_samtale_samples_per_second": 4.199, |
|
"eval_nb_samtale_steps_per_second": 0.095, |
|
"eval_nb_samtale_wer": 12.239583333333332, |
|
"step": 567 |
|
}, |
|
{ |
|
"epoch": 6.44, |
|
"eval_bigbrother_loss": 0.885236382484436, |
|
"eval_bigbrother_runtime": 274.5244, |
|
"eval_bigbrother_samples_per_second": 4.99, |
|
"eval_bigbrother_steps_per_second": 0.106, |
|
"eval_bigbrother_wer": 37.001530653347295, |
|
"step": 567 |
|
}, |
|
{ |
|
"epoch": 6.68, |
|
"eval_rundkast_loss": 0.38271185755729675, |
|
"eval_rundkast_runtime": 256.838, |
|
"eval_rundkast_samples_per_second": 5.213, |
|
"eval_rundkast_steps_per_second": 0.109, |
|
"eval_rundkast_wer": 15.16557350823868, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 6.68, |
|
"eval_nb_samtale_loss": 0.3086356222629547, |
|
"eval_nb_samtale_runtime": 128.1513, |
|
"eval_nb_samtale_samples_per_second": 4.159, |
|
"eval_nb_samtale_steps_per_second": 0.094, |
|
"eval_nb_samtale_wer": 12.190755208333332, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 6.68, |
|
"eval_bigbrother_loss": 0.8816072344779968, |
|
"eval_bigbrother_runtime": 275.8579, |
|
"eval_bigbrother_samples_per_second": 4.966, |
|
"eval_bigbrother_steps_per_second": 0.105, |
|
"eval_bigbrother_wer": 37.581567711270445, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 6.82, |
|
"grad_norm": 2.3564608097076416, |
|
"learning_rate": 6e-06, |
|
"loss": 0.135, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 6.92, |
|
"eval_rundkast_loss": 0.38250651955604553, |
|
"eval_rundkast_runtime": 256.6014, |
|
"eval_rundkast_samples_per_second": 5.218, |
|
"eval_rundkast_steps_per_second": 0.109, |
|
"eval_rundkast_wer": 14.901615741481363, |
|
"step": 609 |
|
}, |
|
{ |
|
"epoch": 6.92, |
|
"eval_nb_samtale_loss": 0.31294992566108704, |
|
"eval_nb_samtale_runtime": 127.0511, |
|
"eval_nb_samtale_samples_per_second": 4.195, |
|
"eval_nb_samtale_steps_per_second": 0.094, |
|
"eval_nb_samtale_wer": 11.954752604166668, |
|
"step": 609 |
|
}, |
|
{ |
|
"epoch": 6.92, |
|
"eval_bigbrother_loss": 0.8941463828086853, |
|
"eval_bigbrother_runtime": 267.477, |
|
"eval_bigbrother_samples_per_second": 5.122, |
|
"eval_bigbrother_steps_per_second": 0.108, |
|
"eval_bigbrother_wer": 34.520261016676066, |
|
"step": 609 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 1056, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 12, |
|
"save_steps": 21, |
|
"total_flos": 8.4324653973504e+18, |
|
"train_batch_size": 48, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|