Whisper-small-NB / trainer_state.json
Tflatval's picture
Upload folder using huggingface_hub
1d3ef3c verified
raw
history blame contribute delete
No virus
26.6 kB
{
"best_metric": 11.954752604166668,
"best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/Whisper/NB-02.06/checkpoint-609",
"epoch": 6.920454545454545,
"eval_steps": 21,
"global_step": 609,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.24,
"eval_rundkast_loss": 1.514348030090332,
"eval_rundkast_runtime": 267.2294,
"eval_rundkast_samples_per_second": 5.011,
"eval_rundkast_steps_per_second": 0.105,
"eval_rundkast_wer": 17.877139657654777,
"step": 21
},
{
"epoch": 0.24,
"eval_nb_samtale_loss": 1.4326682090759277,
"eval_nb_samtale_runtime": 128.5326,
"eval_nb_samtale_samples_per_second": 4.147,
"eval_nb_samtale_steps_per_second": 0.093,
"eval_nb_samtale_wer": 16.89453125,
"step": 21
},
{
"epoch": 0.24,
"eval_bigbrother_loss": 2.1967878341674805,
"eval_bigbrother_runtime": 274.0177,
"eval_bigbrother_samples_per_second": 5.0,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 37.10625956658342,
"step": 21
},
{
"epoch": 0.48,
"eval_rundkast_loss": 1.4300581216812134,
"eval_rundkast_runtime": 263.2899,
"eval_rundkast_samples_per_second": 5.086,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 17.789153735402337,
"step": 42
},
{
"epoch": 0.48,
"eval_nb_samtale_loss": 1.3351885080337524,
"eval_nb_samtale_runtime": 127.9406,
"eval_nb_samtale_samples_per_second": 4.166,
"eval_nb_samtale_steps_per_second": 0.094,
"eval_nb_samtale_wer": 16.935221354166664,
"step": 42
},
{
"epoch": 0.48,
"eval_bigbrother_loss": 2.0810060501098633,
"eval_bigbrother_runtime": 273.3743,
"eval_bigbrother_samples_per_second": 5.011,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 36.81624103762185,
"step": 42
},
{
"epoch": 0.72,
"eval_rundkast_loss": 1.298883080482483,
"eval_rundkast_runtime": 264.443,
"eval_rundkast_samples_per_second": 5.063,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 17.757158854583267,
"step": 63
},
{
"epoch": 0.72,
"eval_nb_samtale_loss": 1.1716408729553223,
"eval_nb_samtale_runtime": 128.1882,
"eval_nb_samtale_samples_per_second": 4.158,
"eval_nb_samtale_steps_per_second": 0.094,
"eval_nb_samtale_wer": 17.024739583333336,
"step": 63
},
{
"epoch": 0.72,
"eval_bigbrother_loss": 1.9180413484573364,
"eval_bigbrother_runtime": 274.3045,
"eval_bigbrother_samples_per_second": 4.994,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 36.67928784338999,
"step": 63
},
{
"epoch": 0.95,
"eval_rundkast_loss": 1.1174129247665405,
"eval_rundkast_runtime": 266.1387,
"eval_rundkast_samples_per_second": 5.031,
"eval_rundkast_steps_per_second": 0.105,
"eval_rundkast_wer": 17.765157574788034,
"step": 84
},
{
"epoch": 0.95,
"eval_nb_samtale_loss": 0.95993971824646,
"eval_nb_samtale_runtime": 128.381,
"eval_nb_samtale_samples_per_second": 4.152,
"eval_nb_samtale_steps_per_second": 0.093,
"eval_nb_samtale_wer": 17.635091145833336,
"step": 84
},
{
"epoch": 0.95,
"eval_bigbrother_loss": 1.7143659591674805,
"eval_bigbrother_runtime": 275.348,
"eval_bigbrother_samples_per_second": 4.976,
"eval_bigbrother_steps_per_second": 0.105,
"eval_bigbrother_wer": 36.69539998388786,
"step": 84
},
{
"epoch": 1.14,
"grad_norm": 12.247305870056152,
"learning_rate": 1.0000000000000002e-06,
"loss": 1.2113,
"step": 100
},
{
"epoch": 1.19,
"eval_rundkast_loss": 0.920071542263031,
"eval_rundkast_runtime": 265.1068,
"eval_rundkast_samples_per_second": 5.051,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 17.653175491921292,
"step": 105
},
{
"epoch": 1.19,
"eval_nb_samtale_loss": 0.777379035949707,
"eval_nb_samtale_runtime": 128.2654,
"eval_nb_samtale_samples_per_second": 4.155,
"eval_nb_samtale_steps_per_second": 0.094,
"eval_nb_samtale_wer": 17.195638020833336,
"step": 105
},
{
"epoch": 1.19,
"eval_bigbrother_loss": 1.4940869808197021,
"eval_bigbrother_runtime": 273.3462,
"eval_bigbrother_samples_per_second": 5.012,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 36.85652138886651,
"step": 105
},
{
"epoch": 1.43,
"eval_rundkast_loss": 0.7526112794876099,
"eval_rundkast_runtime": 263.7468,
"eval_rundkast_samples_per_second": 5.077,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 17.325227963525837,
"step": 126
},
{
"epoch": 1.43,
"eval_nb_samtale_loss": 0.6493657231330872,
"eval_nb_samtale_runtime": 128.8699,
"eval_nb_samtale_samples_per_second": 4.136,
"eval_nb_samtale_steps_per_second": 0.093,
"eval_nb_samtale_wer": 16.162109375,
"step": 126
},
{
"epoch": 1.43,
"eval_bigbrother_loss": 1.2856446504592896,
"eval_bigbrother_runtime": 274.6648,
"eval_bigbrother_samples_per_second": 4.988,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 35.73672762426489,
"step": 126
},
{
"epoch": 1.67,
"eval_rundkast_loss": 0.6184744238853455,
"eval_rundkast_runtime": 264.7084,
"eval_rundkast_samples_per_second": 5.058,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 17.04527275635898,
"step": 147
},
{
"epoch": 1.67,
"eval_nb_samtale_loss": 0.55622398853302,
"eval_nb_samtale_runtime": 128.1926,
"eval_nb_samtale_samples_per_second": 4.158,
"eval_nb_samtale_steps_per_second": 0.094,
"eval_nb_samtale_wer": 15.388997395833334,
"step": 147
},
{
"epoch": 1.67,
"eval_bigbrother_loss": 1.117920994758606,
"eval_bigbrother_runtime": 275.1798,
"eval_bigbrother_samples_per_second": 4.979,
"eval_bigbrother_steps_per_second": 0.105,
"eval_bigbrother_wer": 35.688391202771285,
"step": 147
},
{
"epoch": 1.91,
"eval_rundkast_loss": 0.5196747779846191,
"eval_rundkast_runtime": 264.025,
"eval_rundkast_samples_per_second": 5.071,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 16.73332266837306,
"step": 168
},
{
"epoch": 1.91,
"eval_nb_samtale_loss": 0.48537084460258484,
"eval_nb_samtale_runtime": 130.6175,
"eval_nb_samtale_samples_per_second": 4.081,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 15.087890625,
"step": 168
},
{
"epoch": 1.91,
"eval_bigbrother_loss": 0.993186891078949,
"eval_bigbrother_runtime": 272.8105,
"eval_bigbrother_samples_per_second": 5.022,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 35.42254088455651,
"step": 168
},
{
"epoch": 2.15,
"eval_rundkast_loss": 0.46956706047058105,
"eval_rundkast_runtime": 265.2136,
"eval_rundkast_samples_per_second": 5.049,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 16.309390497520397,
"step": 189
},
{
"epoch": 2.15,
"eval_nb_samtale_loss": 0.43936076760292053,
"eval_nb_samtale_runtime": 130.644,
"eval_nb_samtale_samples_per_second": 4.08,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 14.925130208333334,
"step": 189
},
{
"epoch": 2.15,
"eval_bigbrother_loss": 0.9301990866661072,
"eval_bigbrother_runtime": 274.7257,
"eval_bigbrother_samples_per_second": 4.987,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 35.237251268831066,
"step": 189
},
{
"epoch": 2.27,
"grad_norm": 3.6259799003601074,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.5775,
"step": 200
},
{
"epoch": 2.39,
"eval_rundkast_loss": 0.4360753893852234,
"eval_rundkast_runtime": 264.6712,
"eval_rundkast_samples_per_second": 5.059,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 16.061430171172614,
"step": 210
},
{
"epoch": 2.39,
"eval_nb_samtale_loss": 0.40685713291168213,
"eval_nb_samtale_runtime": 131.2828,
"eval_nb_samtale_samples_per_second": 4.06,
"eval_nb_samtale_steps_per_second": 0.091,
"eval_nb_samtale_wer": 14.640299479166666,
"step": 210
},
{
"epoch": 2.39,
"eval_bigbrother_loss": 0.8864747881889343,
"eval_bigbrother_runtime": 276.0432,
"eval_bigbrother_samples_per_second": 4.963,
"eval_bigbrother_steps_per_second": 0.105,
"eval_bigbrother_wer": 36.30065254169016,
"step": 210
},
{
"epoch": 2.62,
"eval_rundkast_loss": 0.4100657105445862,
"eval_rundkast_runtime": 262.8044,
"eval_rundkast_samples_per_second": 5.095,
"eval_rundkast_steps_per_second": 0.107,
"eval_rundkast_wer": 15.877459606462965,
"step": 231
},
{
"epoch": 2.62,
"eval_nb_samtale_loss": 0.3821322023868561,
"eval_nb_samtale_runtime": 130.922,
"eval_nb_samtale_samples_per_second": 4.071,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 14.420572916666666,
"step": 231
},
{
"epoch": 2.62,
"eval_bigbrother_loss": 0.8451758027076721,
"eval_bigbrother_runtime": 280.5265,
"eval_bigbrother_samples_per_second": 4.884,
"eval_bigbrother_steps_per_second": 0.103,
"eval_bigbrother_wer": 41.01345363731571,
"step": 231
},
{
"epoch": 2.86,
"eval_rundkast_loss": 0.3871939480304718,
"eval_rundkast_runtime": 263.4938,
"eval_rundkast_samples_per_second": 5.082,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.66949288113902,
"step": 252
},
{
"epoch": 2.86,
"eval_nb_samtale_loss": 0.3619038164615631,
"eval_nb_samtale_runtime": 131.3433,
"eval_nb_samtale_samples_per_second": 4.058,
"eval_nb_samtale_steps_per_second": 0.091,
"eval_nb_samtale_wer": 13.7939453125,
"step": 252
},
{
"epoch": 2.86,
"eval_bigbrother_loss": 0.8229660987854004,
"eval_bigbrother_runtime": 274.5883,
"eval_bigbrother_samples_per_second": 4.989,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 35.42254088455651,
"step": 252
},
{
"epoch": 3.1,
"eval_rundkast_loss": 0.3819302022457123,
"eval_rundkast_runtime": 264.1232,
"eval_rundkast_samples_per_second": 5.07,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.62949928011518,
"step": 273
},
{
"epoch": 3.1,
"eval_nb_samtale_loss": 0.3480302095413208,
"eval_nb_samtale_runtime": 131.3337,
"eval_nb_samtale_samples_per_second": 4.058,
"eval_nb_samtale_steps_per_second": 0.091,
"eval_nb_samtale_wer": 13.6962890625,
"step": 273
},
{
"epoch": 3.1,
"eval_bigbrother_loss": 0.7991706728935242,
"eval_bigbrother_runtime": 275.8969,
"eval_bigbrother_samples_per_second": 4.966,
"eval_bigbrother_steps_per_second": 0.105,
"eval_bigbrother_wer": 36.510110368162415,
"step": 273
},
{
"epoch": 3.34,
"eval_rundkast_loss": 0.373095840215683,
"eval_rundkast_runtime": 263.7758,
"eval_rundkast_samples_per_second": 5.076,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.54951207806751,
"step": 294
},
{
"epoch": 3.34,
"eval_nb_samtale_loss": 0.33873096108436584,
"eval_nb_samtale_runtime": 130.9933,
"eval_nb_samtale_samples_per_second": 4.069,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 13.37890625,
"step": 294
},
{
"epoch": 3.34,
"eval_bigbrother_loss": 0.7896400690078735,
"eval_bigbrother_runtime": 278.8566,
"eval_bigbrother_samples_per_second": 4.913,
"eval_bigbrother_steps_per_second": 0.104,
"eval_bigbrother_wer": 37.299605252557804,
"step": 294
},
{
"epoch": 3.41,
"grad_norm": 2.6569244861602783,
"learning_rate": 3e-06,
"loss": 0.3439,
"step": 300
},
{
"epoch": 3.58,
"eval_rundkast_loss": 0.36107075214385986,
"eval_rundkast_runtime": 264.3342,
"eval_rundkast_samples_per_second": 5.066,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.469524876019836,
"step": 315
},
{
"epoch": 3.58,
"eval_nb_samtale_loss": 0.3277055621147156,
"eval_nb_samtale_runtime": 130.9603,
"eval_nb_samtale_samples_per_second": 4.07,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 13.191731770833334,
"step": 315
},
{
"epoch": 3.58,
"eval_bigbrother_loss": 0.7788997292518616,
"eval_bigbrother_runtime": 274.084,
"eval_bigbrother_samples_per_second": 4.998,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 34.92306452912269,
"step": 315
},
{
"epoch": 3.82,
"eval_rundkast_loss": 0.36361250281333923,
"eval_rundkast_runtime": 261.275,
"eval_rundkast_samples_per_second": 5.125,
"eval_rundkast_steps_per_second": 0.107,
"eval_rundkast_wer": 15.413533834586465,
"step": 336
},
{
"epoch": 3.82,
"eval_nb_samtale_loss": 0.32056552171707153,
"eval_nb_samtale_runtime": 129.8079,
"eval_nb_samtale_samples_per_second": 4.106,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 13.053385416666666,
"step": 336
},
{
"epoch": 3.82,
"eval_bigbrother_loss": 0.7767297029495239,
"eval_bigbrother_runtime": 272.9633,
"eval_bigbrother_samples_per_second": 5.019,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 35.22919519858213,
"step": 336
},
{
"epoch": 4.06,
"eval_rundkast_loss": 0.36683785915374756,
"eval_rundkast_runtime": 265.3797,
"eval_rundkast_samples_per_second": 5.046,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.173572228443449,
"step": 357
},
{
"epoch": 4.06,
"eval_nb_samtale_loss": 0.31466686725616455,
"eval_nb_samtale_runtime": 129.9464,
"eval_nb_samtale_samples_per_second": 4.102,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 12.996419270833334,
"step": 357
},
{
"epoch": 4.06,
"eval_bigbrother_loss": 0.7835009098052979,
"eval_bigbrother_runtime": 277.5736,
"eval_bigbrother_samples_per_second": 4.936,
"eval_bigbrother_steps_per_second": 0.104,
"eval_bigbrother_wer": 37.06597921533876,
"step": 357
},
{
"epoch": 4.3,
"eval_rundkast_loss": 0.3616587817668915,
"eval_rundkast_runtime": 263.8209,
"eval_rundkast_samples_per_second": 5.075,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.149576067829148,
"step": 378
},
{
"epoch": 4.3,
"eval_nb_samtale_loss": 0.31130969524383545,
"eval_nb_samtale_runtime": 132.0306,
"eval_nb_samtale_samples_per_second": 4.037,
"eval_nb_samtale_steps_per_second": 0.091,
"eval_nb_samtale_wer": 12.923177083333334,
"step": 378
},
{
"epoch": 4.3,
"eval_bigbrother_loss": 0.795174241065979,
"eval_bigbrother_runtime": 277.1352,
"eval_bigbrother_samples_per_second": 4.943,
"eval_bigbrother_steps_per_second": 0.105,
"eval_bigbrother_wer": 37.17070812857488,
"step": 378
},
{
"epoch": 4.53,
"eval_rundkast_loss": 0.36144548654556274,
"eval_rundkast_runtime": 263.0031,
"eval_rundkast_samples_per_second": 5.091,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.381538953767398,
"step": 399
},
{
"epoch": 4.53,
"eval_nb_samtale_loss": 0.30702516436576843,
"eval_nb_samtale_runtime": 129.1297,
"eval_nb_samtale_samples_per_second": 4.128,
"eval_nb_samtale_steps_per_second": 0.093,
"eval_nb_samtale_wer": 12.703450520833334,
"step": 399
},
{
"epoch": 4.53,
"eval_bigbrother_loss": 0.7950104475021362,
"eval_bigbrother_runtime": 274.4695,
"eval_bigbrother_samples_per_second": 4.991,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 34.74583098364617,
"step": 399
},
{
"epoch": 4.55,
"grad_norm": 3.0804500579833984,
"learning_rate": 4.000000000000001e-06,
"loss": 0.2472,
"step": 400
},
{
"epoch": 4.77,
"eval_rundkast_loss": 0.362693190574646,
"eval_rundkast_runtime": 262.0631,
"eval_rundkast_samples_per_second": 5.109,
"eval_rundkast_steps_per_second": 0.107,
"eval_rundkast_wer": 15.22956326987682,
"step": 420
},
{
"epoch": 4.77,
"eval_nb_samtale_loss": 0.30581969022750854,
"eval_nb_samtale_runtime": 129.8604,
"eval_nb_samtale_samples_per_second": 4.104,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 12.548828125,
"step": 420
},
{
"epoch": 4.77,
"eval_bigbrother_loss": 0.7997460961341858,
"eval_bigbrother_runtime": 272.793,
"eval_bigbrother_samples_per_second": 5.022,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 34.74583098364617,
"step": 420
},
{
"epoch": 5.01,
"eval_rundkast_loss": 0.3545509874820709,
"eval_rundkast_runtime": 263.7902,
"eval_rundkast_samples_per_second": 5.076,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.325547912334025,
"step": 441
},
{
"epoch": 5.01,
"eval_nb_samtale_loss": 0.3055456578731537,
"eval_nb_samtale_runtime": 130.0706,
"eval_nb_samtale_samples_per_second": 4.098,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 12.386067708333332,
"step": 441
},
{
"epoch": 5.01,
"eval_bigbrother_loss": 0.7725541591644287,
"eval_bigbrother_runtime": 279.7798,
"eval_bigbrother_samples_per_second": 4.897,
"eval_bigbrother_steps_per_second": 0.104,
"eval_bigbrother_wer": 37.6701844840087,
"step": 441
},
{
"epoch": 5.25,
"eval_rundkast_loss": 0.3629949688911438,
"eval_rundkast_runtime": 261.4464,
"eval_rundkast_samples_per_second": 5.122,
"eval_rundkast_steps_per_second": 0.107,
"eval_rundkast_wer": 15.30955047192449,
"step": 462
},
{
"epoch": 5.25,
"eval_nb_samtale_loss": 0.3084648847579956,
"eval_nb_samtale_runtime": 128.7883,
"eval_nb_samtale_samples_per_second": 4.139,
"eval_nb_samtale_steps_per_second": 0.093,
"eval_nb_samtale_wer": 12.3779296875,
"step": 462
},
{
"epoch": 5.25,
"eval_bigbrother_loss": 0.8035539388656616,
"eval_bigbrother_runtime": 271.0588,
"eval_bigbrother_samples_per_second": 5.054,
"eval_bigbrother_steps_per_second": 0.107,
"eval_bigbrother_wer": 34.43970031418674,
"step": 462
},
{
"epoch": 5.49,
"eval_rundkast_loss": 0.3648250699043274,
"eval_rundkast_runtime": 264.7567,
"eval_rundkast_samples_per_second": 5.057,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.189569668852984,
"step": 483
},
{
"epoch": 5.49,
"eval_nb_samtale_loss": 0.30580607056617737,
"eval_nb_samtale_runtime": 130.4573,
"eval_nb_samtale_samples_per_second": 4.086,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 12.288411458333332,
"step": 483
},
{
"epoch": 5.49,
"eval_bigbrother_loss": 0.8111706376075745,
"eval_bigbrother_runtime": 273.5914,
"eval_bigbrother_samples_per_second": 5.007,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 34.34302747119955,
"step": 483
},
{
"epoch": 5.68,
"grad_norm": 2.708979368209839,
"learning_rate": 5e-06,
"loss": 0.1864,
"step": 500
},
{
"epoch": 5.73,
"eval_rundkast_loss": 0.3714243173599243,
"eval_rundkast_runtime": 264.8889,
"eval_rundkast_samples_per_second": 5.055,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.213565829467285,
"step": 504
},
{
"epoch": 5.73,
"eval_nb_samtale_loss": 0.30661869049072266,
"eval_nb_samtale_runtime": 129.9332,
"eval_nb_samtale_samples_per_second": 4.102,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 12.3291015625,
"step": 504
},
{
"epoch": 5.73,
"eval_bigbrother_loss": 0.8136927485466003,
"eval_bigbrother_runtime": 272.3894,
"eval_bigbrother_samples_per_second": 5.03,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 34.5041488761782,
"step": 504
},
{
"epoch": 5.97,
"eval_rundkast_loss": 0.3704493045806885,
"eval_rundkast_runtime": 263.3704,
"eval_rundkast_samples_per_second": 5.084,
"eval_rundkast_steps_per_second": 0.106,
"eval_rundkast_wer": 15.261558150695889,
"step": 525
},
{
"epoch": 5.97,
"eval_nb_samtale_loss": 0.3032839298248291,
"eval_nb_samtale_runtime": 128.4216,
"eval_nb_samtale_samples_per_second": 4.15,
"eval_nb_samtale_steps_per_second": 0.093,
"eval_nb_samtale_wer": 12.3779296875,
"step": 525
},
{
"epoch": 5.97,
"eval_bigbrother_loss": 0.8149410486221313,
"eval_bigbrother_runtime": 272.1944,
"eval_bigbrother_samples_per_second": 5.033,
"eval_bigbrother_steps_per_second": 0.107,
"eval_bigbrother_wer": 34.81027954563764,
"step": 525
},
{
"epoch": 6.2,
"eval_rundkast_loss": 0.3849130868911743,
"eval_rundkast_runtime": 261.0506,
"eval_rundkast_samples_per_second": 5.129,
"eval_rundkast_steps_per_second": 0.107,
"eval_rundkast_wer": 15.061590145576709,
"step": 546
},
{
"epoch": 6.2,
"eval_nb_samtale_loss": 0.3138934373855591,
"eval_nb_samtale_runtime": 130.4524,
"eval_nb_samtale_samples_per_second": 4.086,
"eval_nb_samtale_steps_per_second": 0.092,
"eval_nb_samtale_wer": 12.052408854166668,
"step": 546
},
{
"epoch": 6.2,
"eval_bigbrother_loss": 0.8786391615867615,
"eval_bigbrother_runtime": 271.5141,
"eval_bigbrother_samples_per_second": 5.046,
"eval_bigbrother_steps_per_second": 0.107,
"eval_bigbrother_wer": 34.72166277289938,
"step": 546
},
{
"epoch": 6.44,
"eval_rundkast_loss": 0.38933807611465454,
"eval_rundkast_runtime": 257.6232,
"eval_rundkast_samples_per_second": 5.198,
"eval_rundkast_steps_per_second": 0.109,
"eval_rundkast_wer": 15.20556710926252,
"step": 567
},
{
"epoch": 6.44,
"eval_nb_samtale_loss": 0.3130148649215698,
"eval_nb_samtale_runtime": 126.9397,
"eval_nb_samtale_samples_per_second": 4.199,
"eval_nb_samtale_steps_per_second": 0.095,
"eval_nb_samtale_wer": 12.239583333333332,
"step": 567
},
{
"epoch": 6.44,
"eval_bigbrother_loss": 0.885236382484436,
"eval_bigbrother_runtime": 274.5244,
"eval_bigbrother_samples_per_second": 4.99,
"eval_bigbrother_steps_per_second": 0.106,
"eval_bigbrother_wer": 37.001530653347295,
"step": 567
},
{
"epoch": 6.68,
"eval_rundkast_loss": 0.38271185755729675,
"eval_rundkast_runtime": 256.838,
"eval_rundkast_samples_per_second": 5.213,
"eval_rundkast_steps_per_second": 0.109,
"eval_rundkast_wer": 15.16557350823868,
"step": 588
},
{
"epoch": 6.68,
"eval_nb_samtale_loss": 0.3086356222629547,
"eval_nb_samtale_runtime": 128.1513,
"eval_nb_samtale_samples_per_second": 4.159,
"eval_nb_samtale_steps_per_second": 0.094,
"eval_nb_samtale_wer": 12.190755208333332,
"step": 588
},
{
"epoch": 6.68,
"eval_bigbrother_loss": 0.8816072344779968,
"eval_bigbrother_runtime": 275.8579,
"eval_bigbrother_samples_per_second": 4.966,
"eval_bigbrother_steps_per_second": 0.105,
"eval_bigbrother_wer": 37.581567711270445,
"step": 588
},
{
"epoch": 6.82,
"grad_norm": 2.3564608097076416,
"learning_rate": 6e-06,
"loss": 0.135,
"step": 600
},
{
"epoch": 6.92,
"eval_rundkast_loss": 0.38250651955604553,
"eval_rundkast_runtime": 256.6014,
"eval_rundkast_samples_per_second": 5.218,
"eval_rundkast_steps_per_second": 0.109,
"eval_rundkast_wer": 14.901615741481363,
"step": 609
},
{
"epoch": 6.92,
"eval_nb_samtale_loss": 0.31294992566108704,
"eval_nb_samtale_runtime": 127.0511,
"eval_nb_samtale_samples_per_second": 4.195,
"eval_nb_samtale_steps_per_second": 0.094,
"eval_nb_samtale_wer": 11.954752604166668,
"step": 609
},
{
"epoch": 6.92,
"eval_bigbrother_loss": 0.8941463828086853,
"eval_bigbrother_runtime": 267.477,
"eval_bigbrother_samples_per_second": 5.122,
"eval_bigbrother_steps_per_second": 0.108,
"eval_bigbrother_wer": 34.520261016676066,
"step": 609
}
],
"logging_steps": 100,
"max_steps": 1056,
"num_input_tokens_seen": 0,
"num_train_epochs": 12,
"save_steps": 21,
"total_flos": 8.4324653973504e+18,
"train_batch_size": 48,
"trial_name": null,
"trial_params": null
}