Tflatval's picture
Upload folder using huggingface_hub
390fa32 verified
raw
history blame
No virus
52.7 kB
{
"best_metric": 0.289421480911704,
"best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/Combined/BB-NB-22.05/checkpoint-17670",
"epoch": 40.0,
"eval_steps": 500,
"global_step": 18600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 5.088616847991943,
"learning_rate": 3.086666666666667e-05,
"loss": 2.0999,
"step": 465
},
{
"epoch": 1.0,
"eval_rundkast_loss": 0.39486202597618103,
"eval_rundkast_runtime": 32.0081,
"eval_rundkast_samples_per_second": 42.021,
"eval_rundkast_steps_per_second": 1.343,
"eval_rundkast_wer": 0.22597836461979,
"step": 465
},
{
"epoch": 1.0,
"eval_NB_BB_loss": 1.3563096523284912,
"eval_NB_BB_runtime": 84.5302,
"eval_NB_BB_samples_per_second": 22.513,
"eval_NB_BB_steps_per_second": 0.71,
"eval_NB_BB_wer": 0.40965952795433386,
"step": 465
},
{
"epoch": 1.0,
"eval_nb_samtale_loss": 0.5479292273521423,
"eval_nb_samtale_runtime": 36.6651,
"eval_nb_samtale_samples_per_second": 14.537,
"eval_nb_samtale_steps_per_second": 0.464,
"eval_nb_samtale_wer": 0.2421875,
"step": 465
},
{
"epoch": 1.0,
"eval_bigbrother_loss": 1.670620083808899,
"eval_bigbrother_runtime": 39.7215,
"eval_bigbrother_samples_per_second": 34.49,
"eval_bigbrother_steps_per_second": 1.083,
"eval_bigbrother_wer": 0.5755256585837428,
"step": 465
},
{
"epoch": 2.0,
"grad_norm": 5.0017313957214355,
"learning_rate": 6.186666666666668e-05,
"loss": 1.7526,
"step": 930
},
{
"epoch": 2.0,
"eval_rundkast_loss": 0.3949491083621979,
"eval_rundkast_runtime": 32.7201,
"eval_rundkast_samples_per_second": 41.106,
"eval_rundkast_steps_per_second": 1.314,
"eval_rundkast_wer": 0.22398981864460707,
"step": 930
},
{
"epoch": 2.0,
"eval_NB_BB_loss": 1.2307980060577393,
"eval_NB_BB_runtime": 83.9537,
"eval_NB_BB_samples_per_second": 22.667,
"eval_NB_BB_steps_per_second": 0.715,
"eval_NB_BB_wer": 0.38634063398242985,
"step": 930
},
{
"epoch": 2.0,
"eval_nb_samtale_loss": 0.5440447330474854,
"eval_nb_samtale_runtime": 36.2064,
"eval_nb_samtale_samples_per_second": 14.721,
"eval_nb_samtale_steps_per_second": 0.47,
"eval_nb_samtale_wer": 0.23177083333333334,
"step": 930
},
{
"epoch": 2.0,
"eval_bigbrother_loss": 1.4979978799819946,
"eval_bigbrother_runtime": 39.598,
"eval_bigbrother_samples_per_second": 34.598,
"eval_bigbrother_steps_per_second": 1.086,
"eval_bigbrother_wer": 0.5396761459759929,
"step": 930
},
{
"epoch": 3.0,
"grad_norm": 7.238979816436768,
"learning_rate": 9.286666666666667e-05,
"loss": 1.6611,
"step": 1395
},
{
"epoch": 3.0,
"eval_rundkast_loss": 0.4249923825263977,
"eval_rundkast_runtime": 32.4044,
"eval_rundkast_samples_per_second": 41.507,
"eval_rundkast_steps_per_second": 1.327,
"eval_rundkast_wer": 0.22621699013681196,
"step": 1395
},
{
"epoch": 3.0,
"eval_NB_BB_loss": 1.2449074983596802,
"eval_NB_BB_runtime": 85.2007,
"eval_NB_BB_samples_per_second": 22.335,
"eval_NB_BB_steps_per_second": 0.704,
"eval_NB_BB_wer": 0.3861786972187361,
"step": 1395
},
{
"epoch": 3.0,
"eval_nb_samtale_loss": 0.5582835078239441,
"eval_nb_samtale_runtime": 36.2595,
"eval_nb_samtale_samples_per_second": 14.7,
"eval_nb_samtale_steps_per_second": 0.469,
"eval_nb_samtale_wer": 0.23274739583333334,
"step": 1395
},
{
"epoch": 3.0,
"eval_bigbrother_loss": 1.5122398138046265,
"eval_bigbrother_runtime": 39.5302,
"eval_bigbrother_samples_per_second": 34.657,
"eval_bigbrother_steps_per_second": 1.088,
"eval_bigbrother_wer": 0.5397567066784822,
"step": 1395
},
{
"epoch": 4.0,
"grad_norm": 9.255756378173828,
"learning_rate": 9.790643274853801e-05,
"loss": 1.5765,
"step": 1860
},
{
"epoch": 4.0,
"eval_rundkast_loss": 0.37671104073524475,
"eval_rundkast_runtime": 31.5626,
"eval_rundkast_samples_per_second": 42.614,
"eval_rundkast_steps_per_second": 1.362,
"eval_rundkast_wer": 0.220967228762329,
"step": 1860
},
{
"epoch": 4.0,
"eval_NB_BB_loss": 1.0437960624694824,
"eval_NB_BB_runtime": 84.5888,
"eval_NB_BB_samples_per_second": 22.497,
"eval_NB_BB_steps_per_second": 0.709,
"eval_NB_BB_wer": 0.3624954455285211,
"step": 1860
},
{
"epoch": 4.0,
"eval_nb_samtale_loss": 0.48440223932266235,
"eval_nb_samtale_runtime": 39.3769,
"eval_nb_samtale_samples_per_second": 13.536,
"eval_nb_samtale_steps_per_second": 0.432,
"eval_nb_samtale_wer": 0.22314453125,
"step": 1860
},
{
"epoch": 4.0,
"eval_bigbrother_loss": 1.2615869045257568,
"eval_bigbrother_runtime": 41.8866,
"eval_bigbrother_samples_per_second": 32.707,
"eval_bigbrother_steps_per_second": 1.027,
"eval_bigbrother_wer": 0.5008458873761379,
"step": 1860
},
{
"epoch": 5.0,
"grad_norm": 6.270685195922852,
"learning_rate": 9.519883040935674e-05,
"loss": 1.4853,
"step": 2325
},
{
"epoch": 5.0,
"eval_rundkast_loss": 0.3830512762069702,
"eval_rundkast_runtime": 31.7506,
"eval_rundkast_samples_per_second": 42.361,
"eval_rundkast_steps_per_second": 1.354,
"eval_rundkast_wer": 0.22351256761056315,
"step": 2325
},
{
"epoch": 5.0,
"eval_NB_BB_loss": 1.0370458364486694,
"eval_NB_BB_runtime": 83.374,
"eval_NB_BB_samples_per_second": 22.825,
"eval_NB_BB_steps_per_second": 0.72,
"eval_NB_BB_wer": 0.35549168049876523,
"step": 2325
},
{
"epoch": 5.0,
"eval_nb_samtale_loss": 0.47176724672317505,
"eval_nb_samtale_runtime": 35.9414,
"eval_nb_samtale_samples_per_second": 14.83,
"eval_nb_samtale_steps_per_second": 0.473,
"eval_nb_samtale_wer": 0.21818033854166666,
"step": 2325
},
{
"epoch": 5.0,
"eval_bigbrother_loss": 1.256990671157837,
"eval_bigbrother_runtime": 39.4041,
"eval_bigbrother_samples_per_second": 34.768,
"eval_bigbrother_steps_per_second": 1.091,
"eval_bigbrother_wer": 0.49093692096995084,
"step": 2325
},
{
"epoch": 6.0,
"grad_norm": 6.830248832702637,
"learning_rate": 9.24795321637427e-05,
"loss": 1.4316,
"step": 2790
},
{
"epoch": 6.0,
"eval_rundkast_loss": 0.41122955083847046,
"eval_rundkast_runtime": 31.5822,
"eval_rundkast_samples_per_second": 42.587,
"eval_rundkast_steps_per_second": 1.362,
"eval_rundkast_wer": 0.2255011135857461,
"step": 2790
},
{
"epoch": 6.0,
"eval_NB_BB_loss": 1.0182600021362305,
"eval_NB_BB_runtime": 83.3578,
"eval_NB_BB_samples_per_second": 22.829,
"eval_NB_BB_steps_per_second": 0.72,
"eval_NB_BB_wer": 0.3526577871341241,
"step": 2790
},
{
"epoch": 6.0,
"eval_nb_samtale_loss": 0.4850824475288391,
"eval_nb_samtale_runtime": 35.9277,
"eval_nb_samtale_samples_per_second": 14.835,
"eval_nb_samtale_steps_per_second": 0.473,
"eval_nb_samtale_wer": 0.22054036458333334,
"step": 2790
},
{
"epoch": 6.0,
"eval_bigbrother_loss": 1.2255350351333618,
"eval_bigbrother_runtime": 39.6894,
"eval_bigbrother_samples_per_second": 34.518,
"eval_bigbrother_steps_per_second": 1.083,
"eval_bigbrother_wer": 0.4833642149359542,
"step": 2790
},
{
"epoch": 7.0,
"grad_norm": 5.503568172454834,
"learning_rate": 8.976023391812865e-05,
"loss": 1.3699,
"step": 3255
},
{
"epoch": 7.0,
"eval_rundkast_loss": 0.409690260887146,
"eval_rundkast_runtime": 31.88,
"eval_rundkast_samples_per_second": 42.189,
"eval_rundkast_steps_per_second": 1.349,
"eval_rundkast_wer": 0.2182628062360802,
"step": 3255
},
{
"epoch": 7.0,
"eval_NB_BB_loss": 0.9981555342674255,
"eval_NB_BB_runtime": 83.1726,
"eval_NB_BB_samples_per_second": 22.88,
"eval_NB_BB_steps_per_second": 0.721,
"eval_NB_BB_wer": 0.33933848832031094,
"step": 3255
},
{
"epoch": 7.0,
"eval_nb_samtale_loss": 0.4907973110675812,
"eval_nb_samtale_runtime": 35.9575,
"eval_nb_samtale_samples_per_second": 14.823,
"eval_nb_samtale_steps_per_second": 0.473,
"eval_nb_samtale_wer": 0.21346028645833334,
"step": 3255
},
{
"epoch": 7.0,
"eval_bigbrother_loss": 1.1955358982086182,
"eval_bigbrother_runtime": 39.6796,
"eval_bigbrother_samples_per_second": 34.527,
"eval_bigbrother_steps_per_second": 1.084,
"eval_bigbrother_wer": 0.46435188914847336,
"step": 3255
},
{
"epoch": 8.0,
"grad_norm": 11.339502334594727,
"learning_rate": 8.704093567251463e-05,
"loss": 1.3346,
"step": 3720
},
{
"epoch": 8.0,
"eval_rundkast_loss": 0.3831312358379364,
"eval_rundkast_runtime": 32.9308,
"eval_rundkast_samples_per_second": 40.843,
"eval_rundkast_steps_per_second": 1.306,
"eval_rundkast_wer": 0.2166719694559338,
"step": 3720
},
{
"epoch": 8.0,
"eval_NB_BB_loss": 0.9318952560424805,
"eval_NB_BB_runtime": 98.1107,
"eval_NB_BB_samples_per_second": 19.396,
"eval_NB_BB_steps_per_second": 0.612,
"eval_NB_BB_wer": 0.3345613537913445,
"step": 3720
},
{
"epoch": 8.0,
"eval_nb_samtale_loss": 0.458311527967453,
"eval_nb_samtale_runtime": 36.9177,
"eval_nb_samtale_samples_per_second": 14.438,
"eval_nb_samtale_steps_per_second": 0.46,
"eval_nb_samtale_wer": 0.20939127604166666,
"step": 3720
},
{
"epoch": 8.0,
"eval_bigbrother_loss": 1.1163750886917114,
"eval_bigbrother_runtime": 40.3476,
"eval_bigbrother_samples_per_second": 33.955,
"eval_bigbrother_steps_per_second": 1.066,
"eval_bigbrother_wer": 0.4583903971642633,
"step": 3720
},
{
"epoch": 9.0,
"grad_norm": 2.8908886909484863,
"learning_rate": 8.432163742690059e-05,
"loss": 1.2933,
"step": 4185
},
{
"epoch": 9.0,
"eval_rundkast_loss": 0.3958103656768799,
"eval_rundkast_runtime": 32.4676,
"eval_rundkast_samples_per_second": 41.426,
"eval_rundkast_steps_per_second": 1.324,
"eval_rundkast_wer": 0.21563792554883868,
"step": 4185
},
{
"epoch": 9.0,
"eval_NB_BB_loss": 0.9900856614112854,
"eval_NB_BB_runtime": 85.2037,
"eval_NB_BB_samples_per_second": 22.335,
"eval_NB_BB_steps_per_second": 0.704,
"eval_NB_BB_wer": 0.33201084976316747,
"step": 4185
},
{
"epoch": 9.0,
"eval_nb_samtale_loss": 0.48341503739356995,
"eval_nb_samtale_runtime": 36.9893,
"eval_nb_samtale_samples_per_second": 14.41,
"eval_nb_samtale_steps_per_second": 0.46,
"eval_nb_samtale_wer": 0.206298828125,
"step": 4185
},
{
"epoch": 9.0,
"eval_bigbrother_loss": 1.1871527433395386,
"eval_bigbrother_runtime": 41.4962,
"eval_bigbrother_samples_per_second": 33.015,
"eval_bigbrother_steps_per_second": 1.036,
"eval_bigbrother_wer": 0.4568597438169661,
"step": 4185
},
{
"epoch": 10.0,
"grad_norm": 5.720297336578369,
"learning_rate": 8.160233918128655e-05,
"loss": 1.2483,
"step": 4650
},
{
"epoch": 10.0,
"eval_rundkast_loss": 0.4080227017402649,
"eval_rundkast_runtime": 32.4095,
"eval_rundkast_samples_per_second": 41.5,
"eval_rundkast_steps_per_second": 1.327,
"eval_rundkast_wer": 0.21181991727648744,
"step": 4650
},
{
"epoch": 10.0,
"eval_NB_BB_loss": 0.9500575065612793,
"eval_NB_BB_runtime": 84.6361,
"eval_NB_BB_samples_per_second": 22.485,
"eval_NB_BB_steps_per_second": 0.709,
"eval_NB_BB_wer": 0.3251285373061819,
"step": 4650
},
{
"epoch": 10.0,
"eval_nb_samtale_loss": 0.4818229675292969,
"eval_nb_samtale_runtime": 37.1509,
"eval_nb_samtale_samples_per_second": 14.347,
"eval_nb_samtale_steps_per_second": 0.458,
"eval_nb_samtale_wer": 0.201904296875,
"step": 4650
},
{
"epoch": 10.0,
"eval_bigbrother_loss": 1.1322485208511353,
"eval_bigbrother_runtime": 40.3892,
"eval_bigbrother_samples_per_second": 33.92,
"eval_bigbrother_steps_per_second": 1.065,
"eval_bigbrother_wer": 0.44638685249335375,
"step": 4650
},
{
"epoch": 11.0,
"grad_norm": 15.0436372756958,
"learning_rate": 7.888304093567252e-05,
"loss": 1.2131,
"step": 5115
},
{
"epoch": 11.0,
"eval_rundkast_loss": 0.43607091903686523,
"eval_rundkast_runtime": 32.6212,
"eval_rundkast_samples_per_second": 41.231,
"eval_rundkast_steps_per_second": 1.318,
"eval_rundkast_wer": 0.21492204899777284,
"step": 5115
},
{
"epoch": 11.0,
"eval_NB_BB_loss": 1.0018919706344604,
"eval_NB_BB_runtime": 85.111,
"eval_NB_BB_samples_per_second": 22.359,
"eval_NB_BB_steps_per_second": 0.705,
"eval_NB_BB_wer": 0.32488563216064126,
"step": 5115
},
{
"epoch": 11.0,
"eval_nb_samtale_loss": 0.4951498210430145,
"eval_nb_samtale_runtime": 36.7127,
"eval_nb_samtale_samples_per_second": 14.518,
"eval_nb_samtale_steps_per_second": 0.463,
"eval_nb_samtale_wer": 0.2001953125,
"step": 5115
},
{
"epoch": 11.0,
"eval_bigbrother_loss": 1.1989638805389404,
"eval_bigbrother_runtime": 40.7234,
"eval_bigbrother_samples_per_second": 33.642,
"eval_bigbrother_steps_per_second": 1.056,
"eval_bigbrother_wer": 0.4492064770804801,
"step": 5115
},
{
"epoch": 12.0,
"grad_norm": 6.106450080871582,
"learning_rate": 7.616374269005848e-05,
"loss": 1.1821,
"step": 5580
},
{
"epoch": 12.0,
"eval_rundkast_loss": 0.41126009821891785,
"eval_rundkast_runtime": 33.0331,
"eval_rundkast_samples_per_second": 40.717,
"eval_rundkast_steps_per_second": 1.302,
"eval_rundkast_wer": 0.2180241807190582,
"step": 5580
},
{
"epoch": 12.0,
"eval_NB_BB_loss": 0.9629638195037842,
"eval_NB_BB_runtime": 99.548,
"eval_NB_BB_samples_per_second": 19.116,
"eval_NB_BB_steps_per_second": 0.603,
"eval_NB_BB_wer": 0.3250880531152585,
"step": 5580
},
{
"epoch": 12.0,
"eval_nb_samtale_loss": 0.46501702070236206,
"eval_nb_samtale_runtime": 36.9075,
"eval_nb_samtale_samples_per_second": 14.442,
"eval_nb_samtale_steps_per_second": 0.461,
"eval_nb_samtale_wer": 0.202880859375,
"step": 5580
},
{
"epoch": 12.0,
"eval_bigbrother_loss": 1.1566274166107178,
"eval_bigbrother_runtime": 40.4961,
"eval_bigbrother_samples_per_second": 33.83,
"eval_bigbrother_steps_per_second": 1.062,
"eval_bigbrother_wer": 0.4453395633609925,
"step": 5580
},
{
"epoch": 13.0,
"grad_norm": 10.281853675842285,
"learning_rate": 7.344444444444445e-05,
"loss": 1.1652,
"step": 6045
},
{
"epoch": 13.0,
"eval_rundkast_loss": 0.38290590047836304,
"eval_rundkast_runtime": 32.4453,
"eval_rundkast_samples_per_second": 41.454,
"eval_rundkast_steps_per_second": 1.325,
"eval_rundkast_wer": 0.21563792554883868,
"step": 6045
},
{
"epoch": 13.0,
"eval_NB_BB_loss": 0.9116414785385132,
"eval_NB_BB_runtime": 84.9456,
"eval_NB_BB_samples_per_second": 22.403,
"eval_NB_BB_steps_per_second": 0.706,
"eval_NB_BB_wer": 0.31994656086798107,
"step": 6045
},
{
"epoch": 13.0,
"eval_nb_samtale_loss": 0.4675864279270172,
"eval_nb_samtale_runtime": 36.7336,
"eval_nb_samtale_samples_per_second": 14.51,
"eval_nb_samtale_steps_per_second": 0.463,
"eval_nb_samtale_wer": 0.198486328125,
"step": 6045
},
{
"epoch": 13.0,
"eval_bigbrother_loss": 1.0843714475631714,
"eval_bigbrother_runtime": 40.2808,
"eval_bigbrother_samples_per_second": 34.011,
"eval_bigbrother_steps_per_second": 1.068,
"eval_bigbrother_wer": 0.4403447998066543,
"step": 6045
},
{
"epoch": 14.0,
"grad_norm": 3.9103004932403564,
"learning_rate": 7.072514619883041e-05,
"loss": 1.1179,
"step": 6510
},
{
"epoch": 14.0,
"eval_rundkast_loss": 0.3869563937187195,
"eval_rundkast_runtime": 32.4154,
"eval_rundkast_samples_per_second": 41.493,
"eval_rundkast_steps_per_second": 1.327,
"eval_rundkast_wer": 0.2121380846325167,
"step": 6510
},
{
"epoch": 14.0,
"eval_NB_BB_loss": 0.9029076099395752,
"eval_NB_BB_runtime": 85.8744,
"eval_NB_BB_samples_per_second": 22.16,
"eval_NB_BB_steps_per_second": 0.699,
"eval_NB_BB_wer": 0.31063519695558883,
"step": 6510
},
{
"epoch": 14.0,
"eval_nb_samtale_loss": 0.4522353410720825,
"eval_nb_samtale_runtime": 36.6303,
"eval_nb_samtale_samples_per_second": 14.551,
"eval_nb_samtale_steps_per_second": 0.464,
"eval_nb_samtale_wer": 0.19287109375,
"step": 6510
},
{
"epoch": 14.0,
"eval_bigbrother_loss": 1.0779362916946411,
"eval_bigbrother_runtime": 40.3876,
"eval_bigbrother_samples_per_second": 33.921,
"eval_bigbrother_steps_per_second": 1.065,
"eval_bigbrother_wer": 0.42818013373076613,
"step": 6510
},
{
"epoch": 15.0,
"grad_norm": 6.248087406158447,
"learning_rate": 6.800584795321637e-05,
"loss": 1.1123,
"step": 6975
},
{
"epoch": 15.0,
"eval_rundkast_loss": 0.43526676297187805,
"eval_rundkast_runtime": 32.5572,
"eval_rundkast_samples_per_second": 41.312,
"eval_rundkast_steps_per_second": 1.321,
"eval_rundkast_wer": 0.21110404072542158,
"step": 6975
},
{
"epoch": 15.0,
"eval_NB_BB_loss": 1.0294309854507446,
"eval_NB_BB_runtime": 85.0774,
"eval_NB_BB_samples_per_second": 22.368,
"eval_NB_BB_steps_per_second": 0.705,
"eval_NB_BB_wer": 0.3128618274563783,
"step": 6975
},
{
"epoch": 15.0,
"eval_nb_samtale_loss": 0.5030134916305542,
"eval_nb_samtale_runtime": 36.6885,
"eval_nb_samtale_samples_per_second": 14.528,
"eval_nb_samtale_steps_per_second": 0.463,
"eval_nb_samtale_wer": 0.193603515625,
"step": 6975
},
{
"epoch": 15.0,
"eval_bigbrother_loss": 1.2345293760299683,
"eval_bigbrother_runtime": 40.3974,
"eval_bigbrother_samples_per_second": 33.913,
"eval_bigbrother_steps_per_second": 1.064,
"eval_bigbrother_wer": 0.4302747119954886,
"step": 6975
},
{
"epoch": 16.0,
"grad_norm": 6.180894374847412,
"learning_rate": 6.529239766081871e-05,
"loss": 1.075,
"step": 7440
},
{
"epoch": 16.0,
"eval_rundkast_loss": 0.4082247316837311,
"eval_rundkast_runtime": 32.5615,
"eval_rundkast_samples_per_second": 41.306,
"eval_rundkast_steps_per_second": 1.321,
"eval_rundkast_wer": 0.21006999681832644,
"step": 7440
},
{
"epoch": 16.0,
"eval_NB_BB_loss": 0.9210716485977173,
"eval_NB_BB_runtime": 84.9343,
"eval_NB_BB_samples_per_second": 22.406,
"eval_NB_BB_steps_per_second": 0.706,
"eval_NB_BB_wer": 0.3099064815189668,
"step": 7440
},
{
"epoch": 16.0,
"eval_nb_samtale_loss": 0.459839791059494,
"eval_nb_samtale_runtime": 37.1878,
"eval_nb_samtale_samples_per_second": 14.333,
"eval_nb_samtale_steps_per_second": 0.457,
"eval_nb_samtale_wer": 0.19303385416666666,
"step": 7440
},
{
"epoch": 16.0,
"eval_bigbrother_loss": 1.100581407546997,
"eval_bigbrother_runtime": 40.4416,
"eval_bigbrother_samples_per_second": 33.876,
"eval_bigbrother_steps_per_second": 1.063,
"eval_bigbrother_wer": 0.42487714492870376,
"step": 7440
},
{
"epoch": 17.0,
"grad_norm": 5.789996147155762,
"learning_rate": 6.257309941520468e-05,
"loss": 1.0718,
"step": 7905
},
{
"epoch": 17.0,
"eval_rundkast_loss": 0.4331410825252533,
"eval_rundkast_runtime": 32.5516,
"eval_rundkast_samples_per_second": 41.319,
"eval_rundkast_steps_per_second": 1.321,
"eval_rundkast_wer": 0.21014953865733377,
"step": 7905
},
{
"epoch": 17.0,
"eval_NB_BB_loss": 0.965010404586792,
"eval_NB_BB_runtime": 84.6139,
"eval_NB_BB_samples_per_second": 22.49,
"eval_NB_BB_steps_per_second": 0.709,
"eval_NB_BB_wer": 0.3072345249180195,
"step": 7905
},
{
"epoch": 17.0,
"eval_nb_samtale_loss": 0.49670931696891785,
"eval_nb_samtale_runtime": 36.4484,
"eval_nb_samtale_samples_per_second": 14.623,
"eval_nb_samtale_steps_per_second": 0.466,
"eval_nb_samtale_wer": 0.19140625,
"step": 7905
},
{
"epoch": 17.0,
"eval_bigbrother_loss": 1.1466903686523438,
"eval_bigbrother_runtime": 40.4761,
"eval_bigbrother_samples_per_second": 33.847,
"eval_bigbrother_steps_per_second": 1.062,
"eval_bigbrother_wer": 0.4217352775316201,
"step": 7905
},
{
"epoch": 18.0,
"grad_norm": 12.003623008728027,
"learning_rate": 5.985380116959065e-05,
"loss": 1.0422,
"step": 8370
},
{
"epoch": 18.0,
"eval_rundkast_loss": 0.4282049536705017,
"eval_rundkast_runtime": 32.7905,
"eval_rundkast_samples_per_second": 41.018,
"eval_rundkast_steps_per_second": 1.311,
"eval_rundkast_wer": 0.21134266624244352,
"step": 8370
},
{
"epoch": 18.0,
"eval_NB_BB_loss": 0.9594568610191345,
"eval_NB_BB_runtime": 84.0609,
"eval_NB_BB_samples_per_second": 22.638,
"eval_NB_BB_steps_per_second": 0.714,
"eval_NB_BB_wer": 0.30707258815432575,
"step": 8370
},
{
"epoch": 18.0,
"eval_nb_samtale_loss": 0.4719415307044983,
"eval_nb_samtale_runtime": 36.4276,
"eval_nb_samtale_samples_per_second": 14.632,
"eval_nb_samtale_steps_per_second": 0.467,
"eval_nb_samtale_wer": 0.192626953125,
"step": 8370
},
{
"epoch": 18.0,
"eval_bigbrother_loss": 1.148333191871643,
"eval_bigbrother_runtime": 40.3155,
"eval_bigbrother_samples_per_second": 33.982,
"eval_bigbrother_steps_per_second": 1.067,
"eval_bigbrother_wer": 0.42068798839925886,
"step": 8370
},
{
"epoch": 19.0,
"grad_norm": 7.242124080657959,
"learning_rate": 5.7134502923976606e-05,
"loss": 1.0303,
"step": 8835
},
{
"epoch": 19.0,
"eval_rundkast_loss": 0.41116222739219666,
"eval_rundkast_runtime": 31.7737,
"eval_rundkast_samples_per_second": 42.331,
"eval_rundkast_steps_per_second": 1.353,
"eval_rundkast_wer": 0.21293350302258987,
"step": 8835
},
{
"epoch": 19.0,
"eval_NB_BB_loss": 0.9378307461738586,
"eval_NB_BB_runtime": 94.3567,
"eval_NB_BB_samples_per_second": 20.168,
"eval_NB_BB_steps_per_second": 0.636,
"eval_NB_BB_wer": 0.3072345249180195,
"step": 8835
},
{
"epoch": 19.0,
"eval_nb_samtale_loss": 0.46919578313827515,
"eval_nb_samtale_runtime": 35.5991,
"eval_nb_samtale_samples_per_second": 14.972,
"eval_nb_samtale_steps_per_second": 0.478,
"eval_nb_samtale_wer": 0.19327799479166666,
"step": 8835
},
{
"epoch": 19.0,
"eval_bigbrother_loss": 1.1198594570159912,
"eval_bigbrother_runtime": 39.6114,
"eval_bigbrother_samples_per_second": 34.586,
"eval_bigbrother_steps_per_second": 1.086,
"eval_bigbrother_wer": 0.4197212599693869,
"step": 8835
},
{
"epoch": 20.0,
"grad_norm": 6.254478931427002,
"learning_rate": 5.4415204678362576e-05,
"loss": 1.0192,
"step": 9300
},
{
"epoch": 20.0,
"eval_rundkast_loss": 0.4086886942386627,
"eval_rundkast_runtime": 32.5071,
"eval_rundkast_samples_per_second": 41.376,
"eval_rundkast_steps_per_second": 1.323,
"eval_rundkast_wer": 0.20752465797009226,
"step": 9300
},
{
"epoch": 20.0,
"eval_NB_BB_loss": 0.9522827863693237,
"eval_NB_BB_runtime": 100.9277,
"eval_NB_BB_samples_per_second": 18.855,
"eval_NB_BB_steps_per_second": 0.594,
"eval_NB_BB_wer": 0.3014048014250435,
"step": 9300
},
{
"epoch": 20.0,
"eval_nb_samtale_loss": 0.4663674533367157,
"eval_nb_samtale_runtime": 35.8162,
"eval_nb_samtale_samples_per_second": 14.882,
"eval_nb_samtale_steps_per_second": 0.475,
"eval_nb_samtale_wer": 0.18782552083333334,
"step": 9300
},
{
"epoch": 20.0,
"eval_bigbrother_loss": 1.1411128044128418,
"eval_bigbrother_runtime": 39.8861,
"eval_bigbrother_samples_per_second": 34.348,
"eval_bigbrother_steps_per_second": 1.078,
"eval_bigbrother_wer": 0.4136792072826875,
"step": 9300
},
{
"epoch": 21.0,
"grad_norm": 11.991388320922852,
"learning_rate": 5.169590643274854e-05,
"loss": 1.0087,
"step": 9765
},
{
"epoch": 21.0,
"eval_rundkast_loss": 0.41283562779426575,
"eval_rundkast_runtime": 31.8401,
"eval_rundkast_samples_per_second": 42.242,
"eval_rundkast_steps_per_second": 1.351,
"eval_rundkast_wer": 0.20919503658924593,
"step": 9765
},
{
"epoch": 21.0,
"eval_NB_BB_loss": 0.9513369202613831,
"eval_NB_BB_runtime": 83.7994,
"eval_NB_BB_samples_per_second": 22.709,
"eval_NB_BB_steps_per_second": 0.716,
"eval_NB_BB_wer": 0.30274077972551716,
"step": 9765
},
{
"epoch": 21.0,
"eval_nb_samtale_loss": 0.47523027658462524,
"eval_nb_samtale_runtime": 35.727,
"eval_nb_samtale_samples_per_second": 14.919,
"eval_nb_samtale_steps_per_second": 0.476,
"eval_nb_samtale_wer": 0.18977864583333334,
"step": 9765
},
{
"epoch": 21.0,
"eval_bigbrother_loss": 1.1363465785980225,
"eval_bigbrother_runtime": 39.6372,
"eval_bigbrother_samples_per_second": 34.564,
"eval_bigbrother_steps_per_second": 1.085,
"eval_bigbrother_wer": 0.4141625714976235,
"step": 9765
},
{
"epoch": 22.0,
"grad_norm": 8.134933471679688,
"learning_rate": 4.8976608187134504e-05,
"loss": 0.982,
"step": 10230
},
{
"epoch": 22.0,
"eval_rundkast_loss": 0.4441734850406647,
"eval_rundkast_runtime": 31.8611,
"eval_rundkast_samples_per_second": 42.214,
"eval_rundkast_steps_per_second": 1.35,
"eval_rundkast_wer": 0.20696786509704104,
"step": 10230
},
{
"epoch": 22.0,
"eval_NB_BB_loss": 1.0050716400146484,
"eval_NB_BB_runtime": 83.4701,
"eval_NB_BB_samples_per_second": 22.799,
"eval_NB_BB_steps_per_second": 0.719,
"eval_NB_BB_wer": 0.30059511760657465,
"step": 10230
},
{
"epoch": 22.0,
"eval_nb_samtale_loss": 0.4712933897972107,
"eval_nb_samtale_runtime": 35.6009,
"eval_nb_samtale_samples_per_second": 14.972,
"eval_nb_samtale_steps_per_second": 0.478,
"eval_nb_samtale_wer": 0.18782552083333334,
"step": 10230
},
{
"epoch": 22.0,
"eval_bigbrother_loss": 1.213335394859314,
"eval_bigbrother_runtime": 39.7468,
"eval_bigbrother_samples_per_second": 34.468,
"eval_bigbrother_steps_per_second": 1.082,
"eval_bigbrother_wer": 0.41247079674534765,
"step": 10230
},
{
"epoch": 23.0,
"grad_norm": 33.663204193115234,
"learning_rate": 4.625730994152047e-05,
"loss": 0.9667,
"step": 10695
},
{
"epoch": 23.0,
"eval_rundkast_loss": 0.43352487683296204,
"eval_rundkast_runtime": 32.6485,
"eval_rundkast_samples_per_second": 41.196,
"eval_rundkast_steps_per_second": 1.317,
"eval_rundkast_wer": 0.2063315303849825,
"step": 10695
},
{
"epoch": 23.0,
"eval_NB_BB_loss": 0.9717670679092407,
"eval_NB_BB_runtime": 84.3242,
"eval_NB_BB_samples_per_second": 22.568,
"eval_NB_BB_steps_per_second": 0.712,
"eval_NB_BB_wer": 0.2978826768147039,
"step": 10695
},
{
"epoch": 23.0,
"eval_nb_samtale_loss": 0.451678067445755,
"eval_nb_samtale_runtime": 36.8422,
"eval_nb_samtale_samples_per_second": 14.467,
"eval_nb_samtale_steps_per_second": 0.461,
"eval_nb_samtale_wer": 0.18570963541666666,
"step": 10695
},
{
"epoch": 23.0,
"eval_bigbrother_loss": 1.173987865447998,
"eval_bigbrother_runtime": 40.426,
"eval_bigbrother_samples_per_second": 33.889,
"eval_bigbrother_steps_per_second": 1.064,
"eval_bigbrother_wer": 0.408362200918392,
"step": 10695
},
{
"epoch": 24.0,
"grad_norm": 3.15181827545166,
"learning_rate": 4.354385964912281e-05,
"loss": 0.9586,
"step": 11160
},
{
"epoch": 24.0,
"eval_rundkast_loss": 0.43574872612953186,
"eval_rundkast_runtime": 34.0532,
"eval_rundkast_samples_per_second": 39.497,
"eval_rundkast_steps_per_second": 1.263,
"eval_rundkast_wer": 0.20776328348711423,
"step": 11160
},
{
"epoch": 24.0,
"eval_NB_BB_loss": 0.9633657932281494,
"eval_NB_BB_runtime": 85.5761,
"eval_NB_BB_samples_per_second": 22.238,
"eval_NB_BB_steps_per_second": 0.701,
"eval_NB_BB_wer": 0.2978421926237804,
"step": 11160
},
{
"epoch": 24.0,
"eval_nb_samtale_loss": 0.45962560176849365,
"eval_nb_samtale_runtime": 36.3588,
"eval_nb_samtale_samples_per_second": 14.659,
"eval_nb_samtale_steps_per_second": 0.468,
"eval_nb_samtale_wer": 0.186767578125,
"step": 11160
},
{
"epoch": 24.0,
"eval_bigbrother_loss": 1.159108281135559,
"eval_bigbrother_runtime": 40.6416,
"eval_bigbrother_samples_per_second": 33.709,
"eval_bigbrother_steps_per_second": 1.058,
"eval_bigbrother_wer": 0.4082816402159027,
"step": 11160
},
{
"epoch": 25.0,
"grad_norm": 15.837915420532227,
"learning_rate": 4.082456140350878e-05,
"loss": 0.9366,
"step": 11625
},
{
"epoch": 25.0,
"eval_rundkast_loss": 0.43792787194252014,
"eval_rundkast_runtime": 32.8971,
"eval_rundkast_samples_per_second": 40.885,
"eval_rundkast_steps_per_second": 1.307,
"eval_rundkast_wer": 0.20664969774101177,
"step": 11625
},
{
"epoch": 25.0,
"eval_NB_BB_loss": 1.0051846504211426,
"eval_NB_BB_runtime": 85.0128,
"eval_NB_BB_samples_per_second": 22.385,
"eval_NB_BB_steps_per_second": 0.706,
"eval_NB_BB_wer": 0.2959394356503785,
"step": 11625
},
{
"epoch": 25.0,
"eval_nb_samtale_loss": 0.478113055229187,
"eval_nb_samtale_runtime": 36.2152,
"eval_nb_samtale_samples_per_second": 14.718,
"eval_nb_samtale_steps_per_second": 0.469,
"eval_nb_samtale_wer": 0.18636067708333334,
"step": 11625
},
{
"epoch": 25.0,
"eval_bigbrother_loss": 1.2104246616363525,
"eval_bigbrother_runtime": 40.5472,
"eval_bigbrother_samples_per_second": 33.788,
"eval_bigbrother_steps_per_second": 1.06,
"eval_bigbrother_wer": 0.404656408603883,
"step": 11625
},
{
"epoch": 26.0,
"grad_norm": 3.201197624206543,
"learning_rate": 3.8105263157894735e-05,
"loss": 0.9325,
"step": 12090
},
{
"epoch": 26.0,
"eval_rundkast_loss": 0.41804516315460205,
"eval_rundkast_runtime": 31.7914,
"eval_rundkast_samples_per_second": 42.307,
"eval_rundkast_steps_per_second": 1.353,
"eval_rundkast_wer": 0.2049793191218581,
"step": 12090
},
{
"epoch": 26.0,
"eval_NB_BB_loss": 0.9606844186782837,
"eval_NB_BB_runtime": 83.5304,
"eval_NB_BB_samples_per_second": 22.782,
"eval_NB_BB_steps_per_second": 0.718,
"eval_NB_BB_wer": 0.2959394356503785,
"step": 12090
},
{
"epoch": 26.0,
"eval_nb_samtale_loss": 0.44722747802734375,
"eval_nb_samtale_runtime": 35.6931,
"eval_nb_samtale_samples_per_second": 14.933,
"eval_nb_samtale_steps_per_second": 0.476,
"eval_nb_samtale_wer": 0.18611653645833334,
"step": 12090
},
{
"epoch": 26.0,
"eval_bigbrother_loss": 1.160502314567566,
"eval_bigbrother_runtime": 39.8504,
"eval_bigbrother_samples_per_second": 34.379,
"eval_bigbrother_steps_per_second": 1.079,
"eval_bigbrother_wer": 0.4047369693063724,
"step": 12090
},
{
"epoch": 27.0,
"grad_norm": 5.304738521575928,
"learning_rate": 3.5385964912280706e-05,
"loss": 0.9189,
"step": 12555
},
{
"epoch": 27.0,
"eval_rundkast_loss": 0.4250892698764801,
"eval_rundkast_runtime": 31.7351,
"eval_rundkast_samples_per_second": 42.382,
"eval_rundkast_steps_per_second": 1.355,
"eval_rundkast_wer": 0.20641107222398983,
"step": 12555
},
{
"epoch": 27.0,
"eval_NB_BB_loss": 0.9551168084144592,
"eval_NB_BB_runtime": 83.3377,
"eval_NB_BB_samples_per_second": 22.835,
"eval_NB_BB_steps_per_second": 0.72,
"eval_NB_BB_wer": 0.29614185660499576,
"step": 12555
},
{
"epoch": 27.0,
"eval_nb_samtale_loss": 0.4538469910621643,
"eval_nb_samtale_runtime": 35.5954,
"eval_nb_samtale_samples_per_second": 14.974,
"eval_nb_samtale_steps_per_second": 0.478,
"eval_nb_samtale_wer": 0.18416341145833334,
"step": 12555
},
{
"epoch": 27.0,
"eval_bigbrother_loss": 1.149815559387207,
"eval_bigbrother_runtime": 39.7731,
"eval_bigbrother_samples_per_second": 34.445,
"eval_bigbrother_steps_per_second": 1.081,
"eval_bigbrother_wer": 0.40634818335615885,
"step": 12555
},
{
"epoch": 28.0,
"grad_norm": 20.373756408691406,
"learning_rate": 3.266666666666667e-05,
"loss": 0.9033,
"step": 13020
},
{
"epoch": 28.0,
"eval_rundkast_loss": 0.42664840817451477,
"eval_rundkast_runtime": 31.8414,
"eval_rundkast_samples_per_second": 42.241,
"eval_rundkast_steps_per_second": 1.35,
"eval_rundkast_wer": 0.2053770283168947,
"step": 13020
},
{
"epoch": 28.0,
"eval_NB_BB_loss": 0.9819029569625854,
"eval_NB_BB_runtime": 83.3501,
"eval_NB_BB_samples_per_second": 22.831,
"eval_NB_BB_steps_per_second": 0.72,
"eval_NB_BB_wer": 0.2954536253592972,
"step": 13020
},
{
"epoch": 28.0,
"eval_nb_samtale_loss": 0.4682862460613251,
"eval_nb_samtale_runtime": 35.6354,
"eval_nb_samtale_samples_per_second": 14.957,
"eval_nb_samtale_steps_per_second": 0.477,
"eval_nb_samtale_wer": 0.185791015625,
"step": 13020
},
{
"epoch": 28.0,
"eval_bigbrother_loss": 1.1819084882736206,
"eval_bigbrother_runtime": 39.7653,
"eval_bigbrother_samples_per_second": 34.452,
"eval_bigbrother_steps_per_second": 1.081,
"eval_bigbrother_wer": 0.4032868766615645,
"step": 13020
},
{
"epoch": 29.0,
"grad_norm": 2.7378759384155273,
"learning_rate": 2.9947368421052634e-05,
"loss": 0.9018,
"step": 13485
},
{
"epoch": 29.0,
"eval_rundkast_loss": 0.4359777867794037,
"eval_rundkast_runtime": 31.7585,
"eval_rundkast_samples_per_second": 42.351,
"eval_rundkast_steps_per_second": 1.354,
"eval_rundkast_wer": 0.20553611199490932,
"step": 13485
},
{
"epoch": 29.0,
"eval_NB_BB_loss": 0.9609730243682861,
"eval_NB_BB_runtime": 83.7711,
"eval_NB_BB_samples_per_second": 22.717,
"eval_NB_BB_steps_per_second": 0.716,
"eval_NB_BB_wer": 0.2929840897129671,
"step": 13485
},
{
"epoch": 29.0,
"eval_nb_samtale_loss": 0.4618481695652008,
"eval_nb_samtale_runtime": 36.0874,
"eval_nb_samtale_samples_per_second": 14.77,
"eval_nb_samtale_steps_per_second": 0.471,
"eval_nb_samtale_wer": 0.18489583333333334,
"step": 13485
},
{
"epoch": 29.0,
"eval_bigbrother_loss": 1.1553022861480713,
"eval_bigbrother_runtime": 39.8384,
"eval_bigbrother_samples_per_second": 34.389,
"eval_bigbrother_steps_per_second": 1.079,
"eval_bigbrother_wer": 0.3999838878595021,
"step": 13485
},
{
"epoch": 30.0,
"grad_norm": 27.257183074951172,
"learning_rate": 2.7228070175438598e-05,
"loss": 0.8937,
"step": 13950
},
{
"epoch": 30.0,
"eval_rundkast_loss": 0.45607230067253113,
"eval_rundkast_runtime": 32.367,
"eval_rundkast_samples_per_second": 41.555,
"eval_rundkast_steps_per_second": 1.329,
"eval_rundkast_wer": 0.20688832325803372,
"step": 13950
},
{
"epoch": 30.0,
"eval_NB_BB_loss": 1.0051723718643188,
"eval_NB_BB_runtime": 103.4936,
"eval_NB_BB_samples_per_second": 18.388,
"eval_NB_BB_steps_per_second": 0.58,
"eval_NB_BB_wer": 0.294522488968058,
"step": 13950
},
{
"epoch": 30.0,
"eval_nb_samtale_loss": 0.470134973526001,
"eval_nb_samtale_runtime": 36.186,
"eval_nb_samtale_samples_per_second": 14.729,
"eval_nb_samtale_steps_per_second": 0.47,
"eval_nb_samtale_wer": 0.18440755208333334,
"step": 13950
},
{
"epoch": 30.0,
"eval_bigbrother_loss": 1.2132840156555176,
"eval_bigbrother_runtime": 40.683,
"eval_bigbrother_samples_per_second": 33.675,
"eval_bigbrother_steps_per_second": 1.057,
"eval_bigbrother_wer": 0.4032063159590752,
"step": 13950
},
{
"epoch": 31.0,
"grad_norm": 5.251443862915039,
"learning_rate": 2.4508771929824562e-05,
"loss": 0.8814,
"step": 14415
},
{
"epoch": 31.0,
"eval_rundkast_loss": 0.4411740005016327,
"eval_rundkast_runtime": 32.5448,
"eval_rundkast_samples_per_second": 41.328,
"eval_rundkast_steps_per_second": 1.321,
"eval_rundkast_wer": 0.20617244670696785,
"step": 14415
},
{
"epoch": 31.0,
"eval_NB_BB_loss": 0.9743751287460327,
"eval_NB_BB_runtime": 84.3758,
"eval_NB_BB_samples_per_second": 22.554,
"eval_NB_BB_steps_per_second": 0.711,
"eval_NB_BB_wer": 0.2928626371401968,
"step": 14415
},
{
"epoch": 31.0,
"eval_nb_samtale_loss": 0.47333696484565735,
"eval_nb_samtale_runtime": 36.2272,
"eval_nb_samtale_samples_per_second": 14.713,
"eval_nb_samtale_steps_per_second": 0.469,
"eval_nb_samtale_wer": 0.18359375,
"step": 14415
},
{
"epoch": 31.0,
"eval_bigbrother_loss": 1.1694875955581665,
"eval_bigbrother_runtime": 40.7287,
"eval_bigbrother_samples_per_second": 33.637,
"eval_bigbrother_steps_per_second": 1.056,
"eval_bigbrother_wer": 0.4003061306694594,
"step": 14415
},
{
"epoch": 32.0,
"grad_norm": 5.162887096405029,
"learning_rate": 2.1789473684210526e-05,
"loss": 0.8784,
"step": 14880
},
{
"epoch": 32.0,
"eval_rundkast_loss": 0.45319777727127075,
"eval_rundkast_runtime": 33.2279,
"eval_rundkast_samples_per_second": 40.478,
"eval_rundkast_steps_per_second": 1.294,
"eval_rundkast_wer": 0.2041043588927776,
"step": 14880
},
{
"epoch": 32.0,
"eval_NB_BB_loss": 1.0061391592025757,
"eval_NB_BB_runtime": 85.8491,
"eval_NB_BB_samples_per_second": 22.167,
"eval_NB_BB_steps_per_second": 0.699,
"eval_NB_BB_wer": 0.2929031213311202,
"step": 14880
},
{
"epoch": 32.0,
"eval_nb_samtale_loss": 0.486108660697937,
"eval_nb_samtale_runtime": 35.9271,
"eval_nb_samtale_samples_per_second": 14.836,
"eval_nb_samtale_steps_per_second": 0.473,
"eval_nb_samtale_wer": 0.18400065104166666,
"step": 14880
},
{
"epoch": 32.0,
"eval_bigbrother_loss": 1.208513855934143,
"eval_bigbrother_runtime": 40.5432,
"eval_bigbrother_samples_per_second": 33.791,
"eval_bigbrother_steps_per_second": 1.061,
"eval_bigbrother_wer": 0.4007894948843954,
"step": 14880
},
{
"epoch": 33.0,
"grad_norm": 5.579722881317139,
"learning_rate": 1.907017543859649e-05,
"loss": 0.8831,
"step": 15345
},
{
"epoch": 33.0,
"eval_rundkast_loss": 0.44335484504699707,
"eval_rundkast_runtime": 32.683,
"eval_rundkast_samples_per_second": 41.153,
"eval_rundkast_steps_per_second": 1.316,
"eval_rundkast_wer": 0.2053770283168947,
"step": 15345
},
{
"epoch": 33.0,
"eval_NB_BB_loss": 1.0044219493865967,
"eval_NB_BB_runtime": 85.3142,
"eval_NB_BB_samples_per_second": 22.306,
"eval_NB_BB_steps_per_second": 0.703,
"eval_NB_BB_wer": 0.2922958584672685,
"step": 15345
},
{
"epoch": 33.0,
"eval_nb_samtale_loss": 0.4627678096294403,
"eval_nb_samtale_runtime": 36.1313,
"eval_nb_samtale_samples_per_second": 14.752,
"eval_nb_samtale_steps_per_second": 0.471,
"eval_nb_samtale_wer": 0.18367513020833334,
"step": 15345
},
{
"epoch": 33.0,
"eval_bigbrother_loss": 1.2153956890106201,
"eval_bigbrother_runtime": 40.81,
"eval_bigbrother_samples_per_second": 33.57,
"eval_bigbrother_steps_per_second": 1.054,
"eval_bigbrother_wer": 0.40070893418190606,
"step": 15345
},
{
"epoch": 34.0,
"grad_norm": 5.071865081787109,
"learning_rate": 1.6356725146198832e-05,
"loss": 0.8722,
"step": 15810
},
{
"epoch": 34.0,
"eval_rundkast_loss": 0.4348403215408325,
"eval_rundkast_runtime": 32.9227,
"eval_rundkast_samples_per_second": 40.853,
"eval_rundkast_steps_per_second": 1.306,
"eval_rundkast_wer": 0.20521794463888005,
"step": 15810
},
{
"epoch": 34.0,
"eval_NB_BB_loss": 0.9682305455207825,
"eval_NB_BB_runtime": 85.5917,
"eval_NB_BB_samples_per_second": 22.233,
"eval_NB_BB_steps_per_second": 0.701,
"eval_NB_BB_wer": 0.2904335856847901,
"step": 15810
},
{
"epoch": 34.0,
"eval_nb_samtale_loss": 0.44841158390045166,
"eval_nb_samtale_runtime": 36.1939,
"eval_nb_samtale_samples_per_second": 14.726,
"eval_nb_samtale_steps_per_second": 0.47,
"eval_nb_samtale_wer": 0.18212890625,
"step": 15810
},
{
"epoch": 34.0,
"eval_bigbrother_loss": 1.170255422592163,
"eval_bigbrother_runtime": 40.7341,
"eval_bigbrother_samples_per_second": 33.633,
"eval_bigbrother_steps_per_second": 1.056,
"eval_bigbrother_wer": 0.39813099170224764,
"step": 15810
},
{
"epoch": 35.0,
"grad_norm": 8.128209114074707,
"learning_rate": 1.3637426900584796e-05,
"loss": 0.859,
"step": 16275
},
{
"epoch": 35.0,
"eval_rundkast_loss": 0.446013867855072,
"eval_rundkast_runtime": 32.6724,
"eval_rundkast_samples_per_second": 41.166,
"eval_rundkast_steps_per_second": 1.316,
"eval_rundkast_wer": 0.20243398027362391,
"step": 16275
},
{
"epoch": 35.0,
"eval_NB_BB_loss": 1.003732442855835,
"eval_NB_BB_runtime": 84.4708,
"eval_NB_BB_samples_per_second": 22.528,
"eval_NB_BB_steps_per_second": 0.71,
"eval_NB_BB_wer": 0.29023116473017285,
"step": 16275
},
{
"epoch": 35.0,
"eval_nb_samtale_loss": 0.4694906175136566,
"eval_nb_samtale_runtime": 35.8944,
"eval_nb_samtale_samples_per_second": 14.849,
"eval_nb_samtale_steps_per_second": 0.474,
"eval_nb_samtale_wer": 0.18359375,
"step": 16275
},
{
"epoch": 35.0,
"eval_bigbrother_loss": 1.2112008333206177,
"eval_bigbrother_runtime": 40.7858,
"eval_bigbrother_samples_per_second": 33.59,
"eval_bigbrother_steps_per_second": 1.054,
"eval_bigbrother_wer": 0.39635865624748245,
"step": 16275
},
{
"epoch": 36.0,
"grad_norm": 7.049020767211914,
"learning_rate": 1.091812865497076e-05,
"loss": 0.8508,
"step": 16740
},
{
"epoch": 36.0,
"eval_rundkast_loss": 0.4368053376674652,
"eval_rundkast_runtime": 32.6393,
"eval_rundkast_samples_per_second": 41.208,
"eval_rundkast_steps_per_second": 1.317,
"eval_rundkast_wer": 0.20330894050270443,
"step": 16740
},
{
"epoch": 36.0,
"eval_NB_BB_loss": 0.9765028357505798,
"eval_NB_BB_runtime": 86.1031,
"eval_NB_BB_samples_per_second": 22.101,
"eval_NB_BB_steps_per_second": 0.697,
"eval_NB_BB_wer": 0.29031213311201975,
"step": 16740
},
{
"epoch": 36.0,
"eval_nb_samtale_loss": 0.45226001739501953,
"eval_nb_samtale_runtime": 36.3397,
"eval_nb_samtale_samples_per_second": 14.667,
"eval_nb_samtale_steps_per_second": 0.468,
"eval_nb_samtale_wer": 0.182373046875,
"step": 16740
},
{
"epoch": 36.0,
"eval_bigbrother_loss": 1.180801272392273,
"eval_bigbrother_runtime": 41.007,
"eval_bigbrother_samples_per_second": 33.409,
"eval_bigbrother_steps_per_second": 1.049,
"eval_bigbrother_wer": 0.3970031418673971,
"step": 16740
},
{
"epoch": 37.0,
"grad_norm": 8.417683601379395,
"learning_rate": 8.198830409356726e-06,
"loss": 0.8547,
"step": 17205
},
{
"epoch": 37.0,
"eval_rundkast_loss": 0.44972118735313416,
"eval_rundkast_runtime": 32.9953,
"eval_rundkast_samples_per_second": 40.763,
"eval_rundkast_steps_per_second": 1.303,
"eval_rundkast_wer": 0.20291123130766783,
"step": 17205
},
{
"epoch": 37.0,
"eval_NB_BB_loss": 1.0050333738327026,
"eval_NB_BB_runtime": 85.63,
"eval_NB_BB_samples_per_second": 22.224,
"eval_NB_BB_steps_per_second": 0.701,
"eval_NB_BB_wer": 0.29002874377555565,
"step": 17205
},
{
"epoch": 37.0,
"eval_nb_samtale_loss": 0.4681548774242401,
"eval_nb_samtale_runtime": 35.9123,
"eval_nb_samtale_samples_per_second": 14.842,
"eval_nb_samtale_steps_per_second": 0.473,
"eval_nb_samtale_wer": 0.18212890625,
"step": 17205
},
{
"epoch": 37.0,
"eval_bigbrother_loss": 1.2139179706573486,
"eval_bigbrother_runtime": 40.7816,
"eval_bigbrother_samples_per_second": 33.594,
"eval_bigbrother_steps_per_second": 1.054,
"eval_bigbrother_wer": 0.3976476274873117,
"step": 17205
},
{
"epoch": 38.0,
"grad_norm": 6.699246883392334,
"learning_rate": 5.479532163742691e-06,
"loss": 0.8443,
"step": 17670
},
{
"epoch": 38.0,
"eval_rundkast_loss": 0.4439980089664459,
"eval_rundkast_runtime": 32.4126,
"eval_rundkast_samples_per_second": 41.496,
"eval_rundkast_steps_per_second": 1.327,
"eval_rundkast_wer": 0.20370664969774102,
"step": 17670
},
{
"epoch": 38.0,
"eval_NB_BB_loss": 0.9929541349411011,
"eval_NB_BB_runtime": 85.6285,
"eval_NB_BB_samples_per_second": 22.224,
"eval_NB_BB_steps_per_second": 0.701,
"eval_NB_BB_wer": 0.289421480911704,
"step": 17670
},
{
"epoch": 38.0,
"eval_nb_samtale_loss": 0.46245497465133667,
"eval_nb_samtale_runtime": 36.3757,
"eval_nb_samtale_samples_per_second": 14.653,
"eval_nb_samtale_steps_per_second": 0.467,
"eval_nb_samtale_wer": 0.18229166666666666,
"step": 17670
},
{
"epoch": 38.0,
"eval_bigbrother_loss": 1.1993677616119385,
"eval_bigbrother_runtime": 40.9524,
"eval_bigbrother_samples_per_second": 33.453,
"eval_bigbrother_steps_per_second": 1.05,
"eval_bigbrother_wer": 0.3961975348425038,
"step": 17670
},
{
"epoch": 39.0,
"grad_norm": 5.469863414764404,
"learning_rate": 2.760233918128655e-06,
"loss": 0.835,
"step": 18135
},
{
"epoch": 39.0,
"eval_rundkast_loss": 0.44508007168769836,
"eval_rundkast_runtime": 32.7027,
"eval_rundkast_samples_per_second": 41.128,
"eval_rundkast_steps_per_second": 1.315,
"eval_rundkast_wer": 0.2041043588927776,
"step": 18135
},
{
"epoch": 39.0,
"eval_NB_BB_loss": 0.9969344139099121,
"eval_NB_BB_runtime": 84.86,
"eval_NB_BB_samples_per_second": 22.425,
"eval_NB_BB_steps_per_second": 0.707,
"eval_NB_BB_wer": 0.29023116473017285,
"step": 18135
},
{
"epoch": 39.0,
"eval_nb_samtale_loss": 0.4631071090698242,
"eval_nb_samtale_runtime": 35.8723,
"eval_nb_samtale_samples_per_second": 14.858,
"eval_nb_samtale_steps_per_second": 0.474,
"eval_nb_samtale_wer": 0.18180338541666666,
"step": 18135
},
{
"epoch": 39.0,
"eval_bigbrother_loss": 1.2046737670898438,
"eval_bigbrother_runtime": 40.6261,
"eval_bigbrother_samples_per_second": 33.722,
"eval_bigbrother_steps_per_second": 1.058,
"eval_bigbrother_wer": 0.3973253846773544,
"step": 18135
},
{
"epoch": 40.0,
"grad_norm": 2.851428508758545,
"learning_rate": 4.678362573099416e-08,
"loss": 0.8346,
"step": 18600
},
{
"epoch": 40.0,
"eval_rundkast_loss": 0.44796615839004517,
"eval_rundkast_runtime": 32.5088,
"eval_rundkast_samples_per_second": 41.373,
"eval_rundkast_steps_per_second": 1.323,
"eval_rundkast_wer": 0.2036271078587337,
"step": 18600
},
{
"epoch": 40.0,
"eval_NB_BB_loss": 1.0030395984649658,
"eval_NB_BB_runtime": 94.7646,
"eval_NB_BB_samples_per_second": 20.081,
"eval_NB_BB_steps_per_second": 0.633,
"eval_NB_BB_wer": 0.28958341767539775,
"step": 18600
},
{
"epoch": 40.0,
"eval_nb_samtale_loss": 0.4656994044780731,
"eval_nb_samtale_runtime": 36.739,
"eval_nb_samtale_samples_per_second": 14.508,
"eval_nb_samtale_steps_per_second": 0.463,
"eval_nb_samtale_wer": 0.18123372395833334,
"step": 18600
},
{
"epoch": 40.0,
"eval_bigbrother_loss": 1.2117459774017334,
"eval_bigbrother_runtime": 40.801,
"eval_bigbrother_samples_per_second": 33.578,
"eval_bigbrother_steps_per_second": 1.054,
"eval_bigbrother_wer": 0.3970031418673971,
"step": 18600
}
],
"logging_steps": 500,
"max_steps": 18600,
"num_input_tokens_seen": 0,
"num_train_epochs": 40,
"save_steps": 500,
"total_flos": 1.281422114476163e+20,
"train_batch_size": 48,
"trial_name": null,
"trial_params": null
}