Whisper-small-NB / checkpoint-3520 /trainer_state.json
Tflatval's picture
Upload folder using huggingface_hub
d78950e verified
raw
history blame contribute delete
No virus
41.8 kB
{
"best_metric": 0.17350260416666666,
"best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/single/NB/30.05/checkpoint-3344",
"epoch": 40.0,
"eval_steps": 500,
"global_step": 3520,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 3.9170310497283936,
"learning_rate": 5.8e-06,
"loss": 0.9591,
"step": 88
},
{
"epoch": 1.0,
"eval_rundkast_loss": 0.5365053415298462,
"eval_rundkast_runtime": 35.6704,
"eval_rundkast_samples_per_second": 37.706,
"eval_rundkast_steps_per_second": 1.205,
"eval_rundkast_wer": 0.23027362392618517,
"step": 88
},
{
"epoch": 1.0,
"eval_nb_samtale_loss": 0.67843097448349,
"eval_nb_samtale_runtime": 39.2213,
"eval_nb_samtale_samples_per_second": 13.59,
"eval_nb_samtale_steps_per_second": 0.433,
"eval_nb_samtale_wer": 0.24666341145833334,
"step": 88
},
{
"epoch": 1.0,
"eval_bigbrother_loss": 2.74082612991333,
"eval_bigbrother_runtime": 41.8079,
"eval_bigbrother_samples_per_second": 32.769,
"eval_bigbrother_steps_per_second": 1.029,
"eval_bigbrother_wer": 0.6191089986304681,
"step": 88
},
{
"epoch": 2.0,
"grad_norm": 4.4212822914123535,
"learning_rate": 1.1666666666666668e-05,
"loss": 0.8123,
"step": 176
},
{
"epoch": 2.0,
"eval_rundkast_loss": 0.4252748191356659,
"eval_rundkast_runtime": 33.6441,
"eval_rundkast_samples_per_second": 39.977,
"eval_rundkast_steps_per_second": 1.278,
"eval_rundkast_wer": 0.2241489023226217,
"step": 176
},
{
"epoch": 2.0,
"eval_nb_samtale_loss": 0.5754267573356628,
"eval_nb_samtale_runtime": 38.5834,
"eval_nb_samtale_samples_per_second": 13.814,
"eval_nb_samtale_steps_per_second": 0.441,
"eval_nb_samtale_wer": 0.23527018229166666,
"step": 176
},
{
"epoch": 2.0,
"eval_bigbrother_loss": 2.240948438644409,
"eval_bigbrother_runtime": 41.5488,
"eval_bigbrother_samples_per_second": 32.973,
"eval_bigbrother_steps_per_second": 1.035,
"eval_bigbrother_wer": 0.6037219044550068,
"step": 176
},
{
"epoch": 3.0,
"grad_norm": 3.1233577728271484,
"learning_rate": 1.7533333333333334e-05,
"loss": 0.7517,
"step": 264
},
{
"epoch": 3.0,
"eval_rundkast_loss": 0.419950932264328,
"eval_rundkast_runtime": 33.5339,
"eval_rundkast_samples_per_second": 40.109,
"eval_rundkast_steps_per_second": 1.282,
"eval_rundkast_wer": 0.2205695195672924,
"step": 264
},
{
"epoch": 3.0,
"eval_nb_samtale_loss": 0.5531216263771057,
"eval_nb_samtale_runtime": 38.5893,
"eval_nb_samtale_samples_per_second": 13.812,
"eval_nb_samtale_steps_per_second": 0.441,
"eval_nb_samtale_wer": 0.22932942708333334,
"step": 264
},
{
"epoch": 3.0,
"eval_bigbrother_loss": 2.1344377994537354,
"eval_bigbrother_runtime": 41.2938,
"eval_bigbrother_samples_per_second": 33.177,
"eval_bigbrother_steps_per_second": 1.041,
"eval_bigbrother_wer": 0.5964714412309675,
"step": 264
},
{
"epoch": 4.0,
"grad_norm": 3.1834347248077393,
"learning_rate": 2.3400000000000003e-05,
"loss": 0.7074,
"step": 352
},
{
"epoch": 4.0,
"eval_rundkast_loss": 0.4088253676891327,
"eval_rundkast_runtime": 33.3755,
"eval_rundkast_samples_per_second": 40.299,
"eval_rundkast_steps_per_second": 1.288,
"eval_rundkast_wer": 0.22009226853324848,
"step": 352
},
{
"epoch": 4.0,
"eval_nb_samtale_loss": 0.5255401134490967,
"eval_nb_samtale_runtime": 38.2361,
"eval_nb_samtale_samples_per_second": 13.94,
"eval_nb_samtale_steps_per_second": 0.445,
"eval_nb_samtale_wer": 0.22696940104166666,
"step": 352
},
{
"epoch": 4.0,
"eval_bigbrother_loss": 2.036323070526123,
"eval_bigbrother_runtime": 41.2821,
"eval_bigbrother_samples_per_second": 33.186,
"eval_bigbrother_steps_per_second": 1.042,
"eval_bigbrother_wer": 0.5905099492467575,
"step": 352
},
{
"epoch": 5.0,
"grad_norm": 1.5792173147201538,
"learning_rate": 2.926666666666667e-05,
"loss": 0.6874,
"step": 440
},
{
"epoch": 5.0,
"eval_rundkast_loss": 0.40116986632347107,
"eval_rundkast_runtime": 33.3522,
"eval_rundkast_samples_per_second": 40.327,
"eval_rundkast_steps_per_second": 1.289,
"eval_rundkast_wer": 0.21985364301622654,
"step": 440
},
{
"epoch": 5.0,
"eval_nb_samtale_loss": 0.5132110714912415,
"eval_nb_samtale_runtime": 38.393,
"eval_nb_samtale_samples_per_second": 13.883,
"eval_nb_samtale_steps_per_second": 0.443,
"eval_nb_samtale_wer": 0.224365234375,
"step": 440
},
{
"epoch": 5.0,
"eval_bigbrother_loss": 1.9978336095809937,
"eval_bigbrother_runtime": 41.45,
"eval_bigbrother_samples_per_second": 33.052,
"eval_bigbrother_steps_per_second": 1.037,
"eval_bigbrother_wer": 0.5905099492467575,
"step": 440
},
{
"epoch": 6.0,
"grad_norm": 2.002620220184326,
"learning_rate": 3.513333333333334e-05,
"loss": 0.6548,
"step": 528
},
{
"epoch": 6.0,
"eval_rundkast_loss": 0.4032253921031952,
"eval_rundkast_runtime": 33.4235,
"eval_rundkast_samples_per_second": 40.241,
"eval_rundkast_steps_per_second": 1.287,
"eval_rundkast_wer": 0.217467387846007,
"step": 528
},
{
"epoch": 6.0,
"eval_nb_samtale_loss": 0.5047765374183655,
"eval_nb_samtale_runtime": 38.2135,
"eval_nb_samtale_samples_per_second": 13.948,
"eval_nb_samtale_steps_per_second": 0.445,
"eval_nb_samtale_wer": 0.220947265625,
"step": 528
},
{
"epoch": 6.0,
"eval_bigbrother_loss": 1.9670743942260742,
"eval_bigbrother_runtime": 41.4322,
"eval_bigbrother_samples_per_second": 33.066,
"eval_bigbrother_steps_per_second": 1.038,
"eval_bigbrother_wer": 0.5801176186256344,
"step": 528
},
{
"epoch": 7.0,
"grad_norm": 1.4368079900741577,
"learning_rate": 4.1e-05,
"loss": 0.6439,
"step": 616
},
{
"epoch": 7.0,
"eval_rundkast_loss": 0.39594346284866333,
"eval_rundkast_runtime": 33.337,
"eval_rundkast_samples_per_second": 40.346,
"eval_rundkast_steps_per_second": 1.29,
"eval_rundkast_wer": 0.22009226853324848,
"step": 616
},
{
"epoch": 7.0,
"eval_nb_samtale_loss": 0.48273980617523193,
"eval_nb_samtale_runtime": 38.0773,
"eval_nb_samtale_samples_per_second": 13.998,
"eval_nb_samtale_steps_per_second": 0.446,
"eval_nb_samtale_wer": 0.21964518229166666,
"step": 616
},
{
"epoch": 7.0,
"eval_bigbrother_loss": 1.921434998512268,
"eval_bigbrother_runtime": 41.5595,
"eval_bigbrother_samples_per_second": 32.965,
"eval_bigbrother_steps_per_second": 1.035,
"eval_bigbrother_wer": 0.5865624748247805,
"step": 616
},
{
"epoch": 8.0,
"grad_norm": 1.1675041913986206,
"learning_rate": 4.686666666666667e-05,
"loss": 0.6158,
"step": 704
},
{
"epoch": 8.0,
"eval_rundkast_loss": 0.40993189811706543,
"eval_rundkast_runtime": 33.4667,
"eval_rundkast_samples_per_second": 40.189,
"eval_rundkast_steps_per_second": 1.285,
"eval_rundkast_wer": 0.22128539611835826,
"step": 704
},
{
"epoch": 8.0,
"eval_nb_samtale_loss": 0.494111031293869,
"eval_nb_samtale_runtime": 38.0186,
"eval_nb_samtale_samples_per_second": 14.019,
"eval_nb_samtale_steps_per_second": 0.447,
"eval_nb_samtale_wer": 0.21712239583333334,
"step": 704
},
{
"epoch": 8.0,
"eval_bigbrother_loss": 1.9780834913253784,
"eval_bigbrother_runtime": 41.757,
"eval_bigbrother_samples_per_second": 32.809,
"eval_bigbrother_steps_per_second": 1.03,
"eval_bigbrother_wer": 0.5809232256505277,
"step": 704
},
{
"epoch": 9.0,
"grad_norm": 2.030735731124878,
"learning_rate": 5.273333333333333e-05,
"loss": 0.6041,
"step": 792
},
{
"epoch": 9.0,
"eval_rundkast_loss": 0.3950729966163635,
"eval_rundkast_runtime": 33.5538,
"eval_rundkast_samples_per_second": 40.085,
"eval_rundkast_steps_per_second": 1.282,
"eval_rundkast_wer": 0.21762647152402165,
"step": 792
},
{
"epoch": 9.0,
"eval_nb_samtale_loss": 0.45818740129470825,
"eval_nb_samtale_runtime": 37.9662,
"eval_nb_samtale_samples_per_second": 14.039,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.21183268229166666,
"step": 792
},
{
"epoch": 9.0,
"eval_bigbrother_loss": 1.8719202280044556,
"eval_bigbrother_runtime": 42.0553,
"eval_bigbrother_samples_per_second": 32.576,
"eval_bigbrother_steps_per_second": 1.022,
"eval_bigbrother_wer": 0.5723032304841699,
"step": 792
},
{
"epoch": 10.0,
"grad_norm": 1.995400071144104,
"learning_rate": 5.86e-05,
"loss": 0.586,
"step": 880
},
{
"epoch": 10.0,
"eval_rundkast_loss": 0.39550164341926575,
"eval_rundkast_runtime": 33.4182,
"eval_rundkast_samples_per_second": 40.248,
"eval_rundkast_steps_per_second": 1.287,
"eval_rundkast_wer": 0.21762647152402165,
"step": 880
},
{
"epoch": 10.0,
"eval_nb_samtale_loss": 0.46760231256484985,
"eval_nb_samtale_runtime": 38.1072,
"eval_nb_samtale_samples_per_second": 13.987,
"eval_nb_samtale_steps_per_second": 0.446,
"eval_nb_samtale_wer": 0.208251953125,
"step": 880
},
{
"epoch": 10.0,
"eval_bigbrother_loss": 1.8893344402313232,
"eval_bigbrother_runtime": 41.5152,
"eval_bigbrother_samples_per_second": 33.0,
"eval_bigbrother_steps_per_second": 1.036,
"eval_bigbrother_wer": 0.5765729477161041,
"step": 880
},
{
"epoch": 11.0,
"grad_norm": 1.3565304279327393,
"learning_rate": 6.446666666666667e-05,
"loss": 0.5779,
"step": 968
},
{
"epoch": 11.0,
"eval_rundkast_loss": 0.39460697770118713,
"eval_rundkast_runtime": 33.627,
"eval_rundkast_samples_per_second": 39.998,
"eval_rundkast_steps_per_second": 1.279,
"eval_rundkast_wer": 0.21810372255806554,
"step": 968
},
{
"epoch": 11.0,
"eval_nb_samtale_loss": 0.45650386810302734,
"eval_nb_samtale_runtime": 37.9631,
"eval_nb_samtale_samples_per_second": 14.04,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.20613606770833334,
"step": 968
},
{
"epoch": 11.0,
"eval_bigbrother_loss": 1.9142467975616455,
"eval_bigbrother_runtime": 41.4099,
"eval_bigbrother_samples_per_second": 33.084,
"eval_bigbrother_steps_per_second": 1.038,
"eval_bigbrother_wer": 0.5729477161040845,
"step": 968
},
{
"epoch": 12.0,
"grad_norm": 1.7810662984848022,
"learning_rate": 7.033333333333334e-05,
"loss": 0.5375,
"step": 1056
},
{
"epoch": 12.0,
"eval_rundkast_loss": 0.40589994192123413,
"eval_rundkast_runtime": 33.6087,
"eval_rundkast_samples_per_second": 40.019,
"eval_rundkast_steps_per_second": 1.279,
"eval_rundkast_wer": 0.2184218899140948,
"step": 1056
},
{
"epoch": 12.0,
"eval_nb_samtale_loss": 0.46365875005722046,
"eval_nb_samtale_runtime": 38.2581,
"eval_nb_samtale_samples_per_second": 13.932,
"eval_nb_samtale_steps_per_second": 0.444,
"eval_nb_samtale_wer": 0.201171875,
"step": 1056
},
{
"epoch": 12.0,
"eval_bigbrother_loss": 1.9760468006134033,
"eval_bigbrother_runtime": 42.201,
"eval_bigbrother_samples_per_second": 32.464,
"eval_bigbrother_steps_per_second": 1.019,
"eval_bigbrother_wer": 0.5706920164343833,
"step": 1056
},
{
"epoch": 13.0,
"grad_norm": 1.9388726949691772,
"learning_rate": 7.620000000000001e-05,
"loss": 0.5238,
"step": 1144
},
{
"epoch": 13.0,
"eval_rundkast_loss": 0.4222950339317322,
"eval_rundkast_runtime": 33.5989,
"eval_rundkast_samples_per_second": 40.031,
"eval_rundkast_steps_per_second": 1.28,
"eval_rundkast_wer": 0.21945593382118994,
"step": 1144
},
{
"epoch": 13.0,
"eval_nb_samtale_loss": 0.47446364164352417,
"eval_nb_samtale_runtime": 37.9325,
"eval_nb_samtale_samples_per_second": 14.051,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.20345052083333334,
"step": 1144
},
{
"epoch": 13.0,
"eval_bigbrother_loss": 1.956613540649414,
"eval_bigbrother_runtime": 41.6064,
"eval_bigbrother_samples_per_second": 32.928,
"eval_bigbrother_steps_per_second": 1.033,
"eval_bigbrother_wer": 0.564408281640216,
"step": 1144
},
{
"epoch": 14.0,
"grad_norm": 1.7794352769851685,
"learning_rate": 8.206666666666666e-05,
"loss": 0.5002,
"step": 1232
},
{
"epoch": 14.0,
"eval_rundkast_loss": 0.40369686484336853,
"eval_rundkast_runtime": 33.4225,
"eval_rundkast_samples_per_second": 40.242,
"eval_rundkast_steps_per_second": 1.287,
"eval_rundkast_wer": 0.2170696786509704,
"step": 1232
},
{
"epoch": 14.0,
"eval_nb_samtale_loss": 0.4533463418483734,
"eval_nb_samtale_runtime": 38.1602,
"eval_nb_samtale_samples_per_second": 13.967,
"eval_nb_samtale_steps_per_second": 0.445,
"eval_nb_samtale_wer": 0.19881184895833334,
"step": 1232
},
{
"epoch": 14.0,
"eval_bigbrother_loss": 1.9202650785446167,
"eval_bigbrother_runtime": 41.8647,
"eval_bigbrother_samples_per_second": 32.724,
"eval_bigbrother_steps_per_second": 1.027,
"eval_bigbrother_wer": 0.5650527672601305,
"step": 1232
},
{
"epoch": 15.0,
"grad_norm": 2.007899284362793,
"learning_rate": 8.793333333333333e-05,
"loss": 0.4939,
"step": 1320
},
{
"epoch": 15.0,
"eval_rundkast_loss": 0.39848214387893677,
"eval_rundkast_runtime": 33.4922,
"eval_rundkast_samples_per_second": 40.159,
"eval_rundkast_steps_per_second": 1.284,
"eval_rundkast_wer": 0.21794463888005092,
"step": 1320
},
{
"epoch": 15.0,
"eval_nb_samtale_loss": 0.43362265825271606,
"eval_nb_samtale_runtime": 37.9431,
"eval_nb_samtale_samples_per_second": 14.047,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.20182291666666666,
"step": 1320
},
{
"epoch": 15.0,
"eval_bigbrother_loss": 1.824406385421753,
"eval_bigbrother_runtime": 41.6014,
"eval_bigbrother_samples_per_second": 32.932,
"eval_bigbrother_steps_per_second": 1.034,
"eval_bigbrother_wer": 0.5605413679207283,
"step": 1320
},
{
"epoch": 16.0,
"grad_norm": 1.890428066253662,
"learning_rate": 9.38e-05,
"loss": 0.493,
"step": 1408
},
{
"epoch": 16.0,
"eval_rundkast_loss": 0.42038509249687195,
"eval_rundkast_runtime": 33.8742,
"eval_rundkast_samples_per_second": 39.706,
"eval_rundkast_steps_per_second": 1.269,
"eval_rundkast_wer": 0.22009226853324848,
"step": 1408
},
{
"epoch": 16.0,
"eval_nb_samtale_loss": 0.4756682515144348,
"eval_nb_samtale_runtime": 38.2223,
"eval_nb_samtale_samples_per_second": 13.945,
"eval_nb_samtale_steps_per_second": 0.445,
"eval_nb_samtale_wer": 0.20003255208333334,
"step": 1408
},
{
"epoch": 16.0,
"eval_bigbrother_loss": 2.017906665802002,
"eval_bigbrother_runtime": 41.7123,
"eval_bigbrother_samples_per_second": 32.844,
"eval_bigbrother_steps_per_second": 1.031,
"eval_bigbrother_wer": 0.5624748247804721,
"step": 1408
},
{
"epoch": 17.0,
"grad_norm": 1.8507376909255981,
"learning_rate": 9.966666666666667e-05,
"loss": 0.4734,
"step": 1496
},
{
"epoch": 17.0,
"eval_rundkast_loss": 0.4344000518321991,
"eval_rundkast_runtime": 34.0756,
"eval_rundkast_samples_per_second": 39.471,
"eval_rundkast_steps_per_second": 1.262,
"eval_rundkast_wer": 0.21699013681196308,
"step": 1496
},
{
"epoch": 17.0,
"eval_nb_samtale_loss": 0.4668411314487457,
"eval_nb_samtale_runtime": 37.9422,
"eval_nb_samtale_samples_per_second": 14.048,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.19694010416666666,
"step": 1496
},
{
"epoch": 17.0,
"eval_bigbrother_loss": 1.9858715534210205,
"eval_bigbrother_runtime": 41.6236,
"eval_bigbrother_samples_per_second": 32.914,
"eval_bigbrother_steps_per_second": 1.033,
"eval_bigbrother_wer": 0.5611052928381536,
"step": 1496
},
{
"epoch": 18.0,
"grad_norm": 1.6648415327072144,
"learning_rate": 9.589108910891089e-05,
"loss": 0.4444,
"step": 1584
},
{
"epoch": 18.0,
"eval_rundkast_loss": 0.459636926651001,
"eval_rundkast_runtime": 33.6234,
"eval_rundkast_samples_per_second": 40.002,
"eval_rundkast_steps_per_second": 1.279,
"eval_rundkast_wer": 0.2184218899140948,
"step": 1584
},
{
"epoch": 18.0,
"eval_nb_samtale_loss": 0.4778790771961212,
"eval_nb_samtale_runtime": 37.93,
"eval_nb_samtale_samples_per_second": 14.052,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.19482421875,
"step": 1584
},
{
"epoch": 18.0,
"eval_bigbrother_loss": 2.19545316696167,
"eval_bigbrother_runtime": 41.4756,
"eval_bigbrother_samples_per_second": 33.031,
"eval_bigbrother_steps_per_second": 1.037,
"eval_bigbrother_wer": 0.5647305244501732,
"step": 1584
},
{
"epoch": 19.0,
"grad_norm": 2.001049041748047,
"learning_rate": 9.153465346534654e-05,
"loss": 0.4535,
"step": 1672
},
{
"epoch": 19.0,
"eval_rundkast_loss": 0.4358086585998535,
"eval_rundkast_runtime": 33.8712,
"eval_rundkast_samples_per_second": 39.709,
"eval_rundkast_steps_per_second": 1.27,
"eval_rundkast_wer": 0.21317212853961184,
"step": 1672
},
{
"epoch": 19.0,
"eval_nb_samtale_loss": 0.4770139157772064,
"eval_nb_samtale_runtime": 38.0225,
"eval_nb_samtale_samples_per_second": 14.018,
"eval_nb_samtale_steps_per_second": 0.447,
"eval_nb_samtale_wer": 0.19514973958333334,
"step": 1672
},
{
"epoch": 19.0,
"eval_bigbrother_loss": 2.057053804397583,
"eval_bigbrother_runtime": 41.9595,
"eval_bigbrother_samples_per_second": 32.651,
"eval_bigbrother_steps_per_second": 1.025,
"eval_bigbrother_wer": 0.5624748247804721,
"step": 1672
},
{
"epoch": 20.0,
"grad_norm": 1.6764415502548218,
"learning_rate": 8.717821782178219e-05,
"loss": 0.4231,
"step": 1760
},
{
"epoch": 20.0,
"eval_rundkast_loss": 0.41307970881462097,
"eval_rundkast_runtime": 34.1234,
"eval_rundkast_samples_per_second": 39.416,
"eval_rundkast_steps_per_second": 1.26,
"eval_rundkast_wer": 0.21603563474387527,
"step": 1760
},
{
"epoch": 20.0,
"eval_nb_samtale_loss": 0.43975648283958435,
"eval_nb_samtale_runtime": 37.7496,
"eval_nb_samtale_samples_per_second": 14.119,
"eval_nb_samtale_steps_per_second": 0.45,
"eval_nb_samtale_wer": 0.18717447916666666,
"step": 1760
},
{
"epoch": 20.0,
"eval_bigbrother_loss": 1.9533370733261108,
"eval_bigbrother_runtime": 41.7155,
"eval_bigbrother_samples_per_second": 32.842,
"eval_bigbrother_steps_per_second": 1.031,
"eval_bigbrother_wer": 0.5524852976717957,
"step": 1760
},
{
"epoch": 21.0,
"grad_norm": 1.599152684211731,
"learning_rate": 8.282178217821782e-05,
"loss": 0.4086,
"step": 1848
},
{
"epoch": 21.0,
"eval_rundkast_loss": 0.4404522776603699,
"eval_rundkast_runtime": 33.7971,
"eval_rundkast_samples_per_second": 39.796,
"eval_rundkast_steps_per_second": 1.272,
"eval_rundkast_wer": 0.2138880050906777,
"step": 1848
},
{
"epoch": 21.0,
"eval_nb_samtale_loss": 0.4675068259239197,
"eval_nb_samtale_runtime": 37.8694,
"eval_nb_samtale_samples_per_second": 14.075,
"eval_nb_samtale_steps_per_second": 0.449,
"eval_nb_samtale_wer": 0.19132486979166666,
"step": 1848
},
{
"epoch": 21.0,
"eval_bigbrother_loss": 2.153977632522583,
"eval_bigbrother_runtime": 41.6263,
"eval_bigbrother_samples_per_second": 32.912,
"eval_bigbrother_steps_per_second": 1.033,
"eval_bigbrother_wer": 0.5508740836220092,
"step": 1848
},
{
"epoch": 22.0,
"grad_norm": 2.0951850414276123,
"learning_rate": 7.846534653465347e-05,
"loss": 0.3963,
"step": 1936
},
{
"epoch": 22.0,
"eval_rundkast_loss": 0.455175518989563,
"eval_rundkast_runtime": 33.5764,
"eval_rundkast_samples_per_second": 40.058,
"eval_rundkast_steps_per_second": 1.281,
"eval_rundkast_wer": 0.21643334393891187,
"step": 1936
},
{
"epoch": 22.0,
"eval_nb_samtale_loss": 0.4630807340145111,
"eval_nb_samtale_runtime": 37.7668,
"eval_nb_samtale_samples_per_second": 14.113,
"eval_nb_samtale_steps_per_second": 0.45,
"eval_nb_samtale_wer": 0.18977864583333334,
"step": 1936
},
{
"epoch": 22.0,
"eval_bigbrother_loss": 2.1877636909484863,
"eval_bigbrother_runtime": 41.6656,
"eval_bigbrother_samples_per_second": 32.881,
"eval_bigbrother_steps_per_second": 1.032,
"eval_bigbrother_wer": 0.5527269797792637,
"step": 1936
},
{
"epoch": 23.0,
"grad_norm": 1.5935795307159424,
"learning_rate": 7.410891089108911e-05,
"loss": 0.3858,
"step": 2024
},
{
"epoch": 23.0,
"eval_rundkast_loss": 0.46708443760871887,
"eval_rundkast_runtime": 33.6671,
"eval_rundkast_samples_per_second": 39.95,
"eval_rundkast_steps_per_second": 1.277,
"eval_rundkast_wer": 0.2152402163538021,
"step": 2024
},
{
"epoch": 23.0,
"eval_nb_samtale_loss": 0.4683707356452942,
"eval_nb_samtale_runtime": 37.9855,
"eval_nb_samtale_samples_per_second": 14.032,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.185791015625,
"step": 2024
},
{
"epoch": 23.0,
"eval_bigbrother_loss": 2.148423910140991,
"eval_bigbrother_runtime": 41.6837,
"eval_bigbrother_samples_per_second": 32.867,
"eval_bigbrother_steps_per_second": 1.032,
"eval_bigbrother_wer": 0.5511157657294772,
"step": 2024
},
{
"epoch": 24.0,
"grad_norm": 2.292874813079834,
"learning_rate": 6.975247524752476e-05,
"loss": 0.3763,
"step": 2112
},
{
"epoch": 24.0,
"eval_rundkast_loss": 0.47619959712028503,
"eval_rundkast_runtime": 33.4679,
"eval_rundkast_samples_per_second": 40.188,
"eval_rundkast_steps_per_second": 1.285,
"eval_rundkast_wer": 0.21810372255806554,
"step": 2112
},
{
"epoch": 24.0,
"eval_nb_samtale_loss": 0.47193431854248047,
"eval_nb_samtale_runtime": 37.7044,
"eval_nb_samtale_samples_per_second": 14.136,
"eval_nb_samtale_steps_per_second": 0.451,
"eval_nb_samtale_wer": 0.18709309895833334,
"step": 2112
},
{
"epoch": 24.0,
"eval_bigbrother_loss": 2.1468334197998047,
"eval_bigbrother_runtime": 41.3571,
"eval_bigbrother_samples_per_second": 33.126,
"eval_bigbrother_steps_per_second": 1.04,
"eval_bigbrother_wer": 0.559735760895835,
"step": 2112
},
{
"epoch": 25.0,
"grad_norm": 2.466032028198242,
"learning_rate": 6.53960396039604e-05,
"loss": 0.3741,
"step": 2200
},
{
"epoch": 25.0,
"eval_rundkast_loss": 0.4504246711730957,
"eval_rundkast_runtime": 33.5467,
"eval_rundkast_samples_per_second": 40.093,
"eval_rundkast_steps_per_second": 1.282,
"eval_rundkast_wer": 0.2134107540566338,
"step": 2200
},
{
"epoch": 25.0,
"eval_nb_samtale_loss": 0.4489670693874359,
"eval_nb_samtale_runtime": 37.6649,
"eval_nb_samtale_samples_per_second": 14.151,
"eval_nb_samtale_steps_per_second": 0.451,
"eval_nb_samtale_wer": 0.185546875,
"step": 2200
},
{
"epoch": 25.0,
"eval_bigbrother_loss": 2.1423308849334717,
"eval_bigbrother_runtime": 41.5117,
"eval_bigbrother_samples_per_second": 33.003,
"eval_bigbrother_steps_per_second": 1.036,
"eval_bigbrother_wer": 0.553290904696689,
"step": 2200
},
{
"epoch": 26.0,
"grad_norm": 1.5329217910766602,
"learning_rate": 6.103960396039604e-05,
"loss": 0.3723,
"step": 2288
},
{
"epoch": 26.0,
"eval_rundkast_loss": 0.4836730659008026,
"eval_rundkast_runtime": 33.6087,
"eval_rundkast_samples_per_second": 40.019,
"eval_rundkast_steps_per_second": 1.279,
"eval_rundkast_wer": 0.2152402163538021,
"step": 2288
},
{
"epoch": 26.0,
"eval_nb_samtale_loss": 0.4578171968460083,
"eval_nb_samtale_runtime": 37.9306,
"eval_nb_samtale_samples_per_second": 14.052,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.18424479166666666,
"step": 2288
},
{
"epoch": 26.0,
"eval_bigbrother_loss": 2.1947550773620605,
"eval_bigbrother_runtime": 41.8164,
"eval_bigbrother_samples_per_second": 32.762,
"eval_bigbrother_steps_per_second": 1.028,
"eval_bigbrother_wer": 0.549101748167244,
"step": 2288
},
{
"epoch": 27.0,
"grad_norm": 1.3041456937789917,
"learning_rate": 5.668316831683168e-05,
"loss": 0.3684,
"step": 2376
},
{
"epoch": 27.0,
"eval_rundkast_loss": 0.4755971133708954,
"eval_rundkast_runtime": 33.7598,
"eval_rundkast_samples_per_second": 39.84,
"eval_rundkast_steps_per_second": 1.274,
"eval_rundkast_wer": 0.21197900095450206,
"step": 2376
},
{
"epoch": 27.0,
"eval_nb_samtale_loss": 0.4704474210739136,
"eval_nb_samtale_runtime": 37.5334,
"eval_nb_samtale_samples_per_second": 14.201,
"eval_nb_samtale_steps_per_second": 0.453,
"eval_nb_samtale_wer": 0.180419921875,
"step": 2376
},
{
"epoch": 27.0,
"eval_bigbrother_loss": 2.2346787452697754,
"eval_bigbrother_runtime": 41.523,
"eval_bigbrother_samples_per_second": 32.994,
"eval_bigbrother_steps_per_second": 1.036,
"eval_bigbrother_wer": 0.549101748167244,
"step": 2376
},
{
"epoch": 28.0,
"grad_norm": 1.4035800695419312,
"learning_rate": 5.232673267326733e-05,
"loss": 0.3536,
"step": 2464
},
{
"epoch": 28.0,
"eval_rundkast_loss": 0.4591149687767029,
"eval_rundkast_runtime": 33.8672,
"eval_rundkast_samples_per_second": 39.714,
"eval_rundkast_steps_per_second": 1.27,
"eval_rundkast_wer": 0.2085587018771874,
"step": 2464
},
{
"epoch": 28.0,
"eval_nb_samtale_loss": 0.4490753710269928,
"eval_nb_samtale_runtime": 37.5138,
"eval_nb_samtale_samples_per_second": 14.208,
"eval_nb_samtale_steps_per_second": 0.453,
"eval_nb_samtale_wer": 0.18074544270833334,
"step": 2464
},
{
"epoch": 28.0,
"eval_bigbrother_loss": 2.1479501724243164,
"eval_bigbrother_runtime": 41.5368,
"eval_bigbrother_samples_per_second": 32.983,
"eval_bigbrother_steps_per_second": 1.035,
"eval_bigbrother_wer": 0.5502295980020946,
"step": 2464
},
{
"epoch": 29.0,
"grad_norm": 2.3787569999694824,
"learning_rate": 4.797029702970297e-05,
"loss": 0.3422,
"step": 2552
},
{
"epoch": 29.0,
"eval_rundkast_loss": 0.45249199867248535,
"eval_rundkast_runtime": 33.8412,
"eval_rundkast_samples_per_second": 39.745,
"eval_rundkast_steps_per_second": 1.271,
"eval_rundkast_wer": 0.2116608335984728,
"step": 2552
},
{
"epoch": 29.0,
"eval_nb_samtale_loss": 0.42878830432891846,
"eval_nb_samtale_runtime": 37.8412,
"eval_nb_samtale_samples_per_second": 14.085,
"eval_nb_samtale_steps_per_second": 0.449,
"eval_nb_samtale_wer": 0.179931640625,
"step": 2552
},
{
"epoch": 29.0,
"eval_bigbrother_loss": 2.074361562728882,
"eval_bigbrother_runtime": 41.584,
"eval_bigbrother_samples_per_second": 32.945,
"eval_bigbrother_steps_per_second": 1.034,
"eval_bigbrother_wer": 0.5470877306050109,
"step": 2552
},
{
"epoch": 30.0,
"grad_norm": 1.0397918224334717,
"learning_rate": 4.3613861386138617e-05,
"loss": 0.3271,
"step": 2640
},
{
"epoch": 30.0,
"eval_rundkast_loss": 0.4873400926589966,
"eval_rundkast_runtime": 33.7561,
"eval_rundkast_samples_per_second": 39.845,
"eval_rundkast_steps_per_second": 1.274,
"eval_rundkast_wer": 0.21174037543748012,
"step": 2640
},
{
"epoch": 30.0,
"eval_nb_samtale_loss": 0.4706071615219116,
"eval_nb_samtale_runtime": 37.8498,
"eval_nb_samtale_samples_per_second": 14.082,
"eval_nb_samtale_steps_per_second": 0.449,
"eval_nb_samtale_wer": 0.17960611979166666,
"step": 2640
},
{
"epoch": 30.0,
"eval_bigbrother_loss": 2.284547805786133,
"eval_bigbrother_runtime": 43.2872,
"eval_bigbrother_samples_per_second": 31.649,
"eval_bigbrother_steps_per_second": 0.993,
"eval_bigbrother_wer": 0.5479738983323934,
"step": 2640
},
{
"epoch": 31.0,
"grad_norm": 1.832560420036316,
"learning_rate": 3.925742574257426e-05,
"loss": 0.3351,
"step": 2728
},
{
"epoch": 31.0,
"eval_rundkast_loss": 0.4675346612930298,
"eval_rundkast_runtime": 33.6595,
"eval_rundkast_samples_per_second": 39.959,
"eval_rundkast_steps_per_second": 1.277,
"eval_rundkast_wer": 0.21094495704740693,
"step": 2728
},
{
"epoch": 31.0,
"eval_nb_samtale_loss": 0.44606560468673706,
"eval_nb_samtale_runtime": 37.8399,
"eval_nb_samtale_samples_per_second": 14.086,
"eval_nb_samtale_steps_per_second": 0.449,
"eval_nb_samtale_wer": 0.1767578125,
"step": 2728
},
{
"epoch": 31.0,
"eval_bigbrother_loss": 2.2436790466308594,
"eval_bigbrother_runtime": 41.8909,
"eval_bigbrother_samples_per_second": 32.704,
"eval_bigbrother_steps_per_second": 1.026,
"eval_bigbrother_wer": 0.5497462337871586,
"step": 2728
},
{
"epoch": 32.0,
"grad_norm": 2.598604917526245,
"learning_rate": 3.49009900990099e-05,
"loss": 0.3266,
"step": 2816
},
{
"epoch": 32.0,
"eval_rundkast_loss": 0.47241419553756714,
"eval_rundkast_runtime": 33.6802,
"eval_rundkast_samples_per_second": 39.934,
"eval_rundkast_steps_per_second": 1.277,
"eval_rundkast_wer": 0.2099109131403118,
"step": 2816
},
{
"epoch": 32.0,
"eval_nb_samtale_loss": 0.46288925409317017,
"eval_nb_samtale_runtime": 37.3999,
"eval_nb_samtale_samples_per_second": 14.251,
"eval_nb_samtale_steps_per_second": 0.455,
"eval_nb_samtale_wer": 0.17952473958333334,
"step": 2816
},
{
"epoch": 32.0,
"eval_bigbrother_loss": 2.2838997840881348,
"eval_bigbrother_runtime": 41.6372,
"eval_bigbrother_samples_per_second": 32.903,
"eval_bigbrother_steps_per_second": 1.033,
"eval_bigbrother_wer": 0.5497462337871586,
"step": 2816
},
{
"epoch": 33.0,
"grad_norm": 2.8319473266601562,
"learning_rate": 3.054455445544554e-05,
"loss": 0.3164,
"step": 2904
},
{
"epoch": 33.0,
"eval_rundkast_loss": 0.49051862955093384,
"eval_rundkast_runtime": 33.5657,
"eval_rundkast_samples_per_second": 40.071,
"eval_rundkast_steps_per_second": 1.281,
"eval_rundkast_wer": 0.21102449888641425,
"step": 2904
},
{
"epoch": 33.0,
"eval_nb_samtale_loss": 0.47550272941589355,
"eval_nb_samtale_runtime": 37.719,
"eval_nb_samtale_samples_per_second": 14.131,
"eval_nb_samtale_steps_per_second": 0.451,
"eval_nb_samtale_wer": 0.17708333333333334,
"step": 2904
},
{
"epoch": 33.0,
"eval_bigbrother_loss": 2.360140085220337,
"eval_bigbrother_runtime": 41.7548,
"eval_bigbrother_samples_per_second": 32.811,
"eval_bigbrother_steps_per_second": 1.03,
"eval_bigbrother_wer": 0.549343430274712,
"step": 2904
},
{
"epoch": 34.0,
"grad_norm": 1.165239930152893,
"learning_rate": 2.6188118811881192e-05,
"loss": 0.325,
"step": 2992
},
{
"epoch": 34.0,
"eval_rundkast_loss": 0.4772399365901947,
"eval_rundkast_runtime": 34.1144,
"eval_rundkast_samples_per_second": 39.426,
"eval_rundkast_steps_per_second": 1.26,
"eval_rundkast_wer": 0.21142220808145085,
"step": 2992
},
{
"epoch": 34.0,
"eval_nb_samtale_loss": 0.45948928594589233,
"eval_nb_samtale_runtime": 37.8345,
"eval_nb_samtale_samples_per_second": 14.088,
"eval_nb_samtale_steps_per_second": 0.449,
"eval_nb_samtale_wer": 0.17692057291666666,
"step": 2992
},
{
"epoch": 34.0,
"eval_bigbrother_loss": 2.2873830795288086,
"eval_bigbrother_runtime": 41.8269,
"eval_bigbrother_samples_per_second": 32.754,
"eval_bigbrother_steps_per_second": 1.028,
"eval_bigbrother_wer": 0.5465238056875856,
"step": 2992
},
{
"epoch": 35.0,
"grad_norm": 1.3796650171279907,
"learning_rate": 2.1831683168316834e-05,
"loss": 0.3195,
"step": 3080
},
{
"epoch": 35.0,
"eval_rundkast_loss": 0.48370474576950073,
"eval_rundkast_runtime": 33.7199,
"eval_rundkast_samples_per_second": 39.887,
"eval_rundkast_steps_per_second": 1.275,
"eval_rundkast_wer": 0.21006999681832644,
"step": 3080
},
{
"epoch": 35.0,
"eval_nb_samtale_loss": 0.4662381708621979,
"eval_nb_samtale_runtime": 38.5158,
"eval_nb_samtale_samples_per_second": 13.838,
"eval_nb_samtale_steps_per_second": 0.441,
"eval_nb_samtale_wer": 0.17635091145833334,
"step": 3080
},
{
"epoch": 35.0,
"eval_bigbrother_loss": 2.249934434890747,
"eval_bigbrother_runtime": 41.5219,
"eval_bigbrother_samples_per_second": 32.995,
"eval_bigbrother_steps_per_second": 1.036,
"eval_bigbrother_wer": 0.5461210021751389,
"step": 3080
},
{
"epoch": 36.0,
"grad_norm": 2.232914686203003,
"learning_rate": 1.7475247524752476e-05,
"loss": 0.3169,
"step": 3168
},
{
"epoch": 36.0,
"eval_rundkast_loss": 0.4873496890068054,
"eval_rundkast_runtime": 33.9486,
"eval_rundkast_samples_per_second": 39.619,
"eval_rundkast_steps_per_second": 1.267,
"eval_rundkast_wer": 0.20935412026726058,
"step": 3168
},
{
"epoch": 36.0,
"eval_nb_samtale_loss": 0.4695265591144562,
"eval_nb_samtale_runtime": 37.5912,
"eval_nb_samtale_samples_per_second": 14.179,
"eval_nb_samtale_steps_per_second": 0.452,
"eval_nb_samtale_wer": 0.175048828125,
"step": 3168
},
{
"epoch": 36.0,
"eval_bigbrother_loss": 2.2812929153442383,
"eval_bigbrother_runtime": 42.1676,
"eval_bigbrother_samples_per_second": 32.489,
"eval_bigbrother_steps_per_second": 1.02,
"eval_bigbrother_wer": 0.545879320067671,
"step": 3168
},
{
"epoch": 37.0,
"grad_norm": 1.227518916130066,
"learning_rate": 1.311881188118812e-05,
"loss": 0.3205,
"step": 3256
},
{
"epoch": 37.0,
"eval_rundkast_loss": 0.4848962128162384,
"eval_rundkast_runtime": 34.1615,
"eval_rundkast_samples_per_second": 39.372,
"eval_rundkast_steps_per_second": 1.259,
"eval_rundkast_wer": 0.21046770601336304,
"step": 3256
},
{
"epoch": 37.0,
"eval_nb_samtale_loss": 0.45955517888069153,
"eval_nb_samtale_runtime": 37.7962,
"eval_nb_samtale_samples_per_second": 14.102,
"eval_nb_samtale_steps_per_second": 0.45,
"eval_nb_samtale_wer": 0.17521158854166666,
"step": 3256
},
{
"epoch": 37.0,
"eval_bigbrother_loss": 2.2612295150756836,
"eval_bigbrother_runtime": 41.8835,
"eval_bigbrother_samples_per_second": 32.71,
"eval_bigbrother_steps_per_second": 1.027,
"eval_bigbrother_wer": 0.5478127769274148,
"step": 3256
},
{
"epoch": 38.0,
"grad_norm": 1.3873769044876099,
"learning_rate": 8.762376237623762e-06,
"loss": 0.3164,
"step": 3344
},
{
"epoch": 38.0,
"eval_rundkast_loss": 0.4849892556667328,
"eval_rundkast_runtime": 33.7856,
"eval_rundkast_samples_per_second": 39.81,
"eval_rundkast_steps_per_second": 1.273,
"eval_rundkast_wer": 0.20999045497931912,
"step": 3344
},
{
"epoch": 38.0,
"eval_nb_samtale_loss": 0.45760098099708557,
"eval_nb_samtale_runtime": 37.6736,
"eval_nb_samtale_samples_per_second": 14.148,
"eval_nb_samtale_steps_per_second": 0.451,
"eval_nb_samtale_wer": 0.17350260416666666,
"step": 3344
},
{
"epoch": 38.0,
"eval_bigbrother_loss": 2.2668609619140625,
"eval_bigbrother_runtime": 42.1887,
"eval_bigbrother_samples_per_second": 32.473,
"eval_bigbrother_steps_per_second": 1.019,
"eval_bigbrother_wer": 0.5437041811004591,
"step": 3344
},
{
"epoch": 39.0,
"grad_norm": 1.6516066789627075,
"learning_rate": 4.405940594059406e-06,
"loss": 0.3145,
"step": 3432
},
{
"epoch": 39.0,
"eval_rundkast_loss": 0.48802104592323303,
"eval_rundkast_runtime": 34.1337,
"eval_rundkast_samples_per_second": 39.404,
"eval_rundkast_steps_per_second": 1.26,
"eval_rundkast_wer": 0.20911549475023863,
"step": 3432
},
{
"epoch": 39.0,
"eval_nb_samtale_loss": 0.4593607187271118,
"eval_nb_samtale_runtime": 37.7724,
"eval_nb_samtale_samples_per_second": 14.111,
"eval_nb_samtale_steps_per_second": 0.45,
"eval_nb_samtale_wer": 0.17390950520833334,
"step": 3432
},
{
"epoch": 39.0,
"eval_bigbrother_loss": 2.2844576835632324,
"eval_bigbrother_runtime": 41.9423,
"eval_bigbrother_samples_per_second": 32.664,
"eval_bigbrother_steps_per_second": 1.025,
"eval_bigbrother_wer": 0.5430596954805446,
"step": 3432
},
{
"epoch": 40.0,
"grad_norm": 1.1558164358139038,
"learning_rate": 4.950495049504951e-08,
"loss": 0.3122,
"step": 3520
},
{
"epoch": 40.0,
"eval_rundkast_loss": 0.4869055449962616,
"eval_rundkast_runtime": 33.9078,
"eval_rundkast_samples_per_second": 39.666,
"eval_rundkast_steps_per_second": 1.268,
"eval_rundkast_wer": 0.20895641107222399,
"step": 3520
},
{
"epoch": 40.0,
"eval_nb_samtale_loss": 0.4583870470523834,
"eval_nb_samtale_runtime": 37.9869,
"eval_nb_samtale_samples_per_second": 14.031,
"eval_nb_samtale_steps_per_second": 0.448,
"eval_nb_samtale_wer": 0.174072265625,
"step": 3520
},
{
"epoch": 40.0,
"eval_bigbrother_loss": 2.280332565307617,
"eval_bigbrother_runtime": 41.7851,
"eval_bigbrother_samples_per_second": 32.787,
"eval_bigbrother_steps_per_second": 1.029,
"eval_bigbrother_wer": 0.5434624989929913,
"step": 3520
}
],
"logging_steps": 500,
"max_steps": 3520,
"num_input_tokens_seen": 0,
"num_train_epochs": 40,
"save_steps": 500,
"total_flos": 4.807600562770979e+19,
"train_batch_size": 48,
"trial_name": null,
"trial_params": null
}