Tflatval committed
Commit
ef3dc17
1 Parent(s): 5ed99e9

Upload folder using huggingface_hub

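The commit message says the folder was pushed with huggingface_hub. A minimal sketch of the kind of call that produces a commit like this one; the repo id and local folder path below are placeholders, not values taken from this page:

# Hedged sketch of an upload_folder call (huggingface_hub API).
# repo_id and folder_path are assumptions for illustration only.
from huggingface_hub import HfApi

api = HfApi()
api.upload_folder(
    folder_path="./saved_model",               # local training output directory (hypothetical)
    repo_id="Tflatval/<repo-name>",            # hypothetical target repo
    repo_type="model",
    commit_message="Upload folder using huggingface_hub",
)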
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
+ language_model/unigrams.txt filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,4 @@
+ {
+ "</s>": 33,
+ "<s>": 32
+ }
alphabet.json ADDED
@@ -0,0 +1 @@
+ {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e5", "\u00e6", "\u00f8", "\u2047", "", "<s>", "</s>"], "is_bpe": false}
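An alphabet.json like this is typically consumed by a CTC beam-search decoder. A hedged sketch with pyctcdecode, using the language_model/unigrams.txt file tracked in .gitattributes above; the KenLM binary name is an assumption, since only the unigrams file is visible in this commit:

# Hedged sketch: build a CTC decoder from the 34-symbol alphabet above.
import json
from pyctcdecode import build_ctcdecoder

with open("alphabet.json") as f:
    labels = json.load(f)["labels"]            # 34 labels, matching "vocab_size": 34 in config.json

with open("language_model/unigrams.txt") as f:
    unigrams = [w.strip() for w in f if w.strip()]

decoder = build_ctcdecoder(
    labels,
    kenlm_model_path="language_model/lm.binary",   # hypothetical file name
    unigrams=unigrams,
)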
checkpoint-40425/config.json ADDED
@@ -0,0 +1,116 @@
+ {
+ "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
+ "activation_dropout": 0.055,
+ "adapter_attn_dim": null,
+ "adapter_kernel_size": 3,
+ "adapter_stride": 2,
+ "add_adapter": false,
+ "apply_spec_augment": true,
+ "architectures": [
+ "Wav2Vec2ForCTC"
+ ],
+ "attention_dropout": 0.094,
+ "bos_token_id": 1,
+ "classifier_proj_size": 256,
+ "codevector_dim": 768,
+ "contrastive_logits_temperature": 0.1,
+ "conv_bias": true,
+ "conv_dim": [
+ 512,
+ 512,
+ 512,
+ 512,
+ 512,
+ 512,
+ 512
+ ],
+ "conv_kernel": [
+ 10,
+ 3,
+ 3,
+ 3,
+ 3,
+ 2,
+ 2
+ ],
+ "conv_stride": [
+ 5,
+ 2,
+ 2,
+ 2,
+ 2,
+ 2,
+ 2
+ ],
+ "ctc_loss_reduction": "mean",
+ "ctc_zero_infinity": true,
+ "diversity_loss_weight": 0.1,
+ "do_stable_layer_norm": true,
+ "eos_token_id": 2,
+ "feat_extract_activation": "gelu",
+ "feat_extract_dropout": 0.0,
+ "feat_extract_norm": "layer",
+ "feat_proj_dropout": 0.04,
+ "feat_quantizer_dropout": 0.0,
+ "final_dropout": 0.0,
+ "hidden_act": "gelu",
+ "hidden_dropout": 0.047,
+ "hidden_size": 1024,
+ "initializer_range": 0.02,
+ "intermediate_size": 4096,
+ "layer_norm_eps": 1e-05,
+ "layerdrop": 0.041,
+ "mask_channel_length": 10,
+ "mask_channel_min_space": 1,
+ "mask_channel_other": 0.0,
+ "mask_channel_prob": 0.0,
+ "mask_channel_selection": "static",
+ "mask_feature_length": 64,
+ "mask_feature_min_masks": 0,
+ "mask_feature_prob": 0.25,
+ "mask_time_length": 10,
+ "mask_time_min_masks": 2,
+ "mask_time_min_space": 1,
+ "mask_time_other": 0.0,
+ "mask_time_prob": 0.082,
+ "mask_time_selection": "static",
+ "model_type": "wav2vec2",
+ "num_adapter_layers": 3,
+ "num_attention_heads": 16,
+ "num_codevector_groups": 2,
+ "num_codevectors_per_group": 320,
+ "num_conv_pos_embedding_groups": 16,
+ "num_conv_pos_embeddings": 128,
+ "num_feat_extract_layers": 7,
+ "num_hidden_layers": 24,
+ "num_negatives": 100,
+ "output_hidden_size": 1024,
+ "pad_token_id": 31,
+ "proj_codevector_dim": 768,
+ "tdnn_dilation": [
+ 1,
+ 2,
+ 3,
+ 1,
+ 1
+ ],
+ "tdnn_dim": [
+ 512,
+ 512,
+ 512,
+ 512,
+ 1500
+ ],
+ "tdnn_kernel": [
+ 5,
+ 3,
+ 3,
+ 1,
+ 1
+ ],
+ "torch_dtype": "float32",
+ "transformers_version": "4.38.1",
+ "use_weighted_layer_sum": false,
+ "vocab_size": 34,
+ "xvector_output_dim": 512
+ }
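This config describes a Wav2Vec2ForCTC model (24 hidden layers, hidden_size 1024, 34-symbol CTC vocabulary). A hedged sketch of loading the checkpoint directory from this commit for inference; the local path is an assumption taken from the directory name above:

# Hedged sketch: load the checkpoint and run a dummy forward pass.
import torch
from transformers import Wav2Vec2ForCTC

model = Wav2Vec2ForCTC.from_pretrained("checkpoint-40425")  # vocab_size=34, pad_token_id=31 per config.json
model.eval()

# One second of silent 16 kHz audio -> per-frame logits over the 34 symbols
with torch.no_grad():
    logits = model(torch.zeros(1, 16000)).logits
print(logits.shape)  # (1, num_frames, 34)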
checkpoint-40425/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:e7b5c2997f82b0ae7618c7c41aa32b4e6d27cdbfb713bd96b3970a416d72bd39
+ size 1261946880
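The entry above (and the binary files that follow) are Git LFS pointer files, recording only the object id and size, not the weights themselves. A hedged sketch of fetching the actual safetensors file from the Hub; the repo id is a placeholder, not taken from this page:

# Hedged sketch: download the ~1.26 GB model.safetensors referenced by the pointer above.
from huggingface_hub import hf_hub_download

path = hf_hub_download(
    repo_id="Tflatval/<repo-name>",                  # hypothetical repo id
    filename="checkpoint-40425/model.safetensors",
)
print(path)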
checkpoint-40425/optimizer.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c186523a15948881fa36d0ba5857c9acd64276812daeffa855e760193a9adfbf
+ size 2490438582
checkpoint-40425/preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
+ {
+ "do_normalize": true,
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+ "feature_size": 1,
+ "padding_side": "right",
+ "padding_value": 0,
+ "processor_class": "Wav2Vec2ProcessorWithLM",
+ "return_attention_mask": true,
+ "sampling_rate": 16000
+ }
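A hedged sketch of preparing audio with the feature-extractor settings above (16 kHz input, zero padding, attention mask returned). The audio file name is an assumption; the checkpoint directory name comes from this commit:

# Hedged sketch: featurize a waveform the way this preprocessor_config.json specifies.
import librosa
from transformers import Wav2Vec2FeatureExtractor

feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained("checkpoint-40425")
speech, _ = librosa.load("example.wav", sr=16000)   # resample to the expected 16 kHz
inputs = feature_extractor(speech, sampling_rate=16000, return_tensors="pt", padding=True)
print(inputs.input_values.shape, inputs.attention_mask.shape)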
checkpoint-40425/rng_state.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:7a3d525701ad3999010ad8f8d22a8531ee80f7a55d8fb5daf55f00674c8a058d
+ size 14308
checkpoint-40425/scheduler.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b2aba5f0fa582878bcdab6ba7fd60fa7e6e949919623c84d14ea53f4607bf4b3
+ size 1064
checkpoint-40425/trainer_state.json ADDED
@@ -0,0 +1,1143 @@
1
+ {
2
+ "best_metric": 0.12615335666560612,
3
+ "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/single/RUND/30.05/checkpoint-40425",
4
+ "epoch": 33.0,
5
+ "eval_steps": 500,
6
+ "global_step": 40425,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 3.7080862522125244,
14
+ "learning_rate": 8.16e-05,
15
+ "loss": 0.5467,
16
+ "step": 1225
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_rundkast_loss": 0.30231863260269165,
21
+ "eval_rundkast_runtime": 32.5305,
22
+ "eval_rundkast_samples_per_second": 41.346,
23
+ "eval_rundkast_steps_per_second": 1.322,
24
+ "eval_rundkast_wer": 0.19145720649061407,
25
+ "step": 1225
26
+ },
27
+ {
28
+ "epoch": 1.0,
29
+ "eval_nb_samtale_loss": 0.5260343551635742,
30
+ "eval_nb_samtale_runtime": 37.7602,
31
+ "eval_nb_samtale_samples_per_second": 14.115,
32
+ "eval_nb_samtale_steps_per_second": 0.45,
33
+ "eval_nb_samtale_wer": 0.2622884114583333,
34
+ "step": 1225
35
+ },
36
+ {
37
+ "epoch": 1.0,
38
+ "eval_bigbrother_loss": 1.871883511543274,
39
+ "eval_bigbrother_runtime": 40.2594,
40
+ "eval_bigbrother_samples_per_second": 34.029,
41
+ "eval_bigbrother_steps_per_second": 1.068,
42
+ "eval_bigbrother_wer": 0.6054136792072827,
43
+ "step": 1225
44
+ },
45
+ {
46
+ "epoch": 2.0,
47
+ "grad_norm": 2.773157835006714,
48
+ "learning_rate": 9.800210526315789e-05,
49
+ "loss": 0.4578,
50
+ "step": 2450
51
+ },
52
+ {
53
+ "epoch": 2.0,
54
+ "eval_rundkast_loss": 0.31110912561416626,
55
+ "eval_rundkast_runtime": 31.8038,
56
+ "eval_rundkast_samples_per_second": 42.291,
57
+ "eval_rundkast_steps_per_second": 1.352,
58
+ "eval_rundkast_wer": 0.17236716512885777,
59
+ "step": 2450
60
+ },
61
+ {
62
+ "epoch": 2.0,
63
+ "eval_nb_samtale_loss": 0.5243741273880005,
64
+ "eval_nb_samtale_runtime": 37.3513,
65
+ "eval_nb_samtale_samples_per_second": 14.27,
66
+ "eval_nb_samtale_steps_per_second": 0.455,
67
+ "eval_nb_samtale_wer": 0.24796549479166666,
68
+ "step": 2450
69
+ },
70
+ {
71
+ "epoch": 2.0,
72
+ "eval_bigbrother_loss": 1.9609774351119995,
73
+ "eval_bigbrother_runtime": 40.3603,
74
+ "eval_bigbrother_samples_per_second": 33.944,
75
+ "eval_bigbrother_steps_per_second": 1.065,
76
+ "eval_bigbrother_wer": 0.5801981793281238,
77
+ "step": 2450
78
+ },
79
+ {
80
+ "epoch": 3.0,
81
+ "grad_norm": 2.448107957839966,
82
+ "learning_rate": 9.542315789473685e-05,
83
+ "loss": 0.4141,
84
+ "step": 3675
85
+ },
86
+ {
87
+ "epoch": 3.0,
88
+ "eval_rundkast_loss": 0.28843000531196594,
89
+ "eval_rundkast_runtime": 31.4496,
90
+ "eval_rundkast_samples_per_second": 42.767,
91
+ "eval_rundkast_steps_per_second": 1.367,
92
+ "eval_rundkast_wer": 0.1697422844416163,
93
+ "step": 3675
94
+ },
95
+ {
96
+ "epoch": 3.0,
97
+ "eval_nb_samtale_loss": 0.5364730954170227,
98
+ "eval_nb_samtale_runtime": 36.197,
99
+ "eval_nb_samtale_samples_per_second": 14.725,
100
+ "eval_nb_samtale_steps_per_second": 0.47,
101
+ "eval_nb_samtale_wer": 0.24007161458333334,
102
+ "step": 3675
103
+ },
104
+ {
105
+ "epoch": 3.0,
106
+ "eval_bigbrother_loss": 1.9849306344985962,
107
+ "eval_bigbrother_runtime": 39.5166,
108
+ "eval_bigbrother_samples_per_second": 34.669,
109
+ "eval_bigbrother_steps_per_second": 1.088,
110
+ "eval_bigbrother_wer": 0.5797953758156771,
111
+ "step": 3675
112
+ },
113
+ {
114
+ "epoch": 4.0,
115
+ "grad_norm": 5.366342544555664,
116
+ "learning_rate": 9.28463157894737e-05,
117
+ "loss": 0.3852,
118
+ "step": 4900
119
+ },
120
+ {
121
+ "epoch": 4.0,
122
+ "eval_rundkast_loss": 0.2692658603191376,
123
+ "eval_rundkast_runtime": 31.6518,
124
+ "eval_rundkast_samples_per_second": 42.494,
125
+ "eval_rundkast_steps_per_second": 1.359,
126
+ "eval_rundkast_wer": 0.16321985364301622,
127
+ "step": 4900
128
+ },
129
+ {
130
+ "epoch": 4.0,
131
+ "eval_nb_samtale_loss": 0.5346274971961975,
132
+ "eval_nb_samtale_runtime": 36.5542,
133
+ "eval_nb_samtale_samples_per_second": 14.581,
134
+ "eval_nb_samtale_steps_per_second": 0.465,
135
+ "eval_nb_samtale_wer": 0.23860677083333334,
136
+ "step": 4900
137
+ },
138
+ {
139
+ "epoch": 4.0,
140
+ "eval_bigbrother_loss": 1.9121719598770142,
141
+ "eval_bigbrother_runtime": 40.1737,
142
+ "eval_bigbrother_samples_per_second": 34.102,
143
+ "eval_bigbrother_steps_per_second": 1.07,
144
+ "eval_bigbrother_wer": 0.5557077257713687,
145
+ "step": 4900
146
+ },
147
+ {
148
+ "epoch": 5.0,
149
+ "grad_norm": 4.274389266967773,
150
+ "learning_rate": 9.026736842105264e-05,
151
+ "loss": 0.3654,
152
+ "step": 6125
153
+ },
154
+ {
155
+ "epoch": 5.0,
156
+ "eval_rundkast_loss": 0.29252347350120544,
157
+ "eval_rundkast_runtime": 31.5872,
158
+ "eval_rundkast_samples_per_second": 42.581,
159
+ "eval_rundkast_steps_per_second": 1.361,
160
+ "eval_rundkast_wer": 0.15701559020044542,
161
+ "step": 6125
162
+ },
163
+ {
164
+ "epoch": 5.0,
165
+ "eval_nb_samtale_loss": 0.5537768006324768,
166
+ "eval_nb_samtale_runtime": 36.3537,
167
+ "eval_nb_samtale_samples_per_second": 14.662,
168
+ "eval_nb_samtale_steps_per_second": 0.468,
169
+ "eval_nb_samtale_wer": 0.23079427083333334,
170
+ "step": 6125
171
+ },
172
+ {
173
+ "epoch": 5.0,
174
+ "eval_bigbrother_loss": 2.0775458812713623,
175
+ "eval_bigbrother_runtime": 39.681,
176
+ "eval_bigbrother_samples_per_second": 34.525,
177
+ "eval_bigbrother_steps_per_second": 1.084,
178
+ "eval_bigbrother_wer": 0.5554660436639007,
179
+ "step": 6125
180
+ },
181
+ {
182
+ "epoch": 6.0,
183
+ "grad_norm": 5.030076026916504,
184
+ "learning_rate": 8.769052631578948e-05,
185
+ "loss": 0.3452,
186
+ "step": 7350
187
+ },
188
+ {
189
+ "epoch": 6.0,
190
+ "eval_rundkast_loss": 0.29516521096229553,
191
+ "eval_rundkast_runtime": 31.5112,
192
+ "eval_rundkast_samples_per_second": 42.683,
193
+ "eval_rundkast_steps_per_second": 1.365,
194
+ "eval_rundkast_wer": 0.15089086859688197,
195
+ "step": 7350
196
+ },
197
+ {
198
+ "epoch": 6.0,
199
+ "eval_nb_samtale_loss": 0.5526564717292786,
200
+ "eval_nb_samtale_runtime": 36.1333,
201
+ "eval_nb_samtale_samples_per_second": 14.751,
202
+ "eval_nb_samtale_steps_per_second": 0.47,
203
+ "eval_nb_samtale_wer": 0.22517903645833334,
204
+ "step": 7350
205
+ },
206
+ {
207
+ "epoch": 6.0,
208
+ "eval_bigbrother_loss": 2.038280725479126,
209
+ "eval_bigbrother_runtime": 39.4829,
210
+ "eval_bigbrother_samples_per_second": 34.699,
211
+ "eval_bigbrother_steps_per_second": 1.089,
212
+ "eval_bigbrother_wer": 0.5402400708934182,
213
+ "step": 7350
214
+ },
215
+ {
216
+ "epoch": 7.0,
217
+ "grad_norm": 5.610586166381836,
218
+ "learning_rate": 8.511157894736842e-05,
219
+ "loss": 0.3301,
220
+ "step": 8575
221
+ },
222
+ {
223
+ "epoch": 7.0,
224
+ "eval_rundkast_loss": 0.27553433179855347,
225
+ "eval_rundkast_runtime": 31.4793,
226
+ "eval_rundkast_samples_per_second": 42.727,
227
+ "eval_rundkast_steps_per_second": 1.366,
228
+ "eval_rundkast_wer": 0.14460706331530385,
229
+ "step": 8575
230
+ },
231
+ {
232
+ "epoch": 7.0,
233
+ "eval_nb_samtale_loss": 0.5609863996505737,
234
+ "eval_nb_samtale_runtime": 36.0218,
235
+ "eval_nb_samtale_samples_per_second": 14.797,
236
+ "eval_nb_samtale_steps_per_second": 0.472,
237
+ "eval_nb_samtale_wer": 0.22281901041666666,
238
+ "step": 8575
239
+ },
240
+ {
241
+ "epoch": 7.0,
242
+ "eval_bigbrother_loss": 2.06436824798584,
243
+ "eval_bigbrother_runtime": 39.4099,
244
+ "eval_bigbrother_samples_per_second": 34.763,
245
+ "eval_bigbrother_steps_per_second": 1.091,
246
+ "eval_bigbrother_wer": 0.5374204463062918,
247
+ "step": 8575
248
+ },
249
+ {
250
+ "epoch": 8.0,
251
+ "grad_norm": 3.3816378116607666,
252
+ "learning_rate": 8.253263157894737e-05,
253
+ "loss": 0.3152,
254
+ "step": 9800
255
+ },
256
+ {
257
+ "epoch": 8.0,
258
+ "eval_rundkast_loss": 0.27358707785606384,
259
+ "eval_rundkast_runtime": 31.4538,
260
+ "eval_rundkast_samples_per_second": 42.761,
261
+ "eval_rundkast_steps_per_second": 1.367,
262
+ "eval_rundkast_wer": 0.14675469296850144,
263
+ "step": 9800
264
+ },
265
+ {
266
+ "epoch": 8.0,
267
+ "eval_nb_samtale_loss": 0.5373356938362122,
268
+ "eval_nb_samtale_runtime": 36.0235,
269
+ "eval_nb_samtale_samples_per_second": 14.796,
270
+ "eval_nb_samtale_steps_per_second": 0.472,
271
+ "eval_nb_samtale_wer": 0.2265625,
272
+ "step": 9800
273
+ },
274
+ {
275
+ "epoch": 8.0,
276
+ "eval_bigbrother_loss": 2.0022764205932617,
277
+ "eval_bigbrother_runtime": 39.5126,
278
+ "eval_bigbrother_samples_per_second": 34.673,
279
+ "eval_bigbrother_steps_per_second": 1.088,
280
+ "eval_bigbrother_wer": 0.5332312897768469,
281
+ "step": 9800
282
+ },
283
+ {
284
+ "epoch": 9.0,
285
+ "grad_norm": 2.7853925228118896,
286
+ "learning_rate": 7.995578947368422e-05,
287
+ "loss": 0.301,
288
+ "step": 11025
289
+ },
290
+ {
291
+ "epoch": 9.0,
292
+ "eval_rundkast_loss": 0.257459819316864,
293
+ "eval_rundkast_runtime": 31.4423,
294
+ "eval_rundkast_samples_per_second": 42.777,
295
+ "eval_rundkast_steps_per_second": 1.368,
296
+ "eval_rundkast_wer": 0.14293668469615017,
297
+ "step": 11025
298
+ },
299
+ {
300
+ "epoch": 9.0,
301
+ "eval_nb_samtale_loss": 0.5285869240760803,
302
+ "eval_nb_samtale_runtime": 36.2554,
303
+ "eval_nb_samtale_samples_per_second": 14.701,
304
+ "eval_nb_samtale_steps_per_second": 0.469,
305
+ "eval_nb_samtale_wer": 0.22509765625,
306
+ "step": 11025
307
+ },
308
+ {
309
+ "epoch": 9.0,
310
+ "eval_bigbrother_loss": 2.0163955688476562,
311
+ "eval_bigbrother_runtime": 39.6281,
312
+ "eval_bigbrother_samples_per_second": 34.571,
313
+ "eval_bigbrother_steps_per_second": 1.085,
314
+ "eval_bigbrother_wer": 0.5354869894465479,
315
+ "step": 11025
316
+ },
317
+ {
318
+ "epoch": 10.0,
319
+ "grad_norm": 2.2737765312194824,
320
+ "learning_rate": 7.737684210526317e-05,
321
+ "loss": 0.2912,
322
+ "step": 12250
323
+ },
324
+ {
325
+ "epoch": 10.0,
326
+ "eval_rundkast_loss": 0.2834290564060211,
327
+ "eval_rundkast_runtime": 31.605,
328
+ "eval_rundkast_samples_per_second": 42.557,
329
+ "eval_rundkast_steps_per_second": 1.361,
330
+ "eval_rundkast_wer": 0.14230034998409163,
331
+ "step": 12250
332
+ },
333
+ {
334
+ "epoch": 10.0,
335
+ "eval_nb_samtale_loss": 0.524945080280304,
336
+ "eval_nb_samtale_runtime": 36.2711,
337
+ "eval_nb_samtale_samples_per_second": 14.695,
338
+ "eval_nb_samtale_steps_per_second": 0.469,
339
+ "eval_nb_samtale_wer": 0.21956380208333334,
340
+ "step": 12250
341
+ },
342
+ {
343
+ "epoch": 10.0,
344
+ "eval_bigbrother_loss": 2.0072944164276123,
345
+ "eval_bigbrother_runtime": 39.7952,
346
+ "eval_bigbrother_samples_per_second": 34.426,
347
+ "eval_bigbrother_steps_per_second": 1.081,
348
+ "eval_bigbrother_wer": 0.5287198904374446,
349
+ "step": 12250
350
+ },
351
+ {
352
+ "epoch": 11.0,
353
+ "grad_norm": 4.1641364097595215,
354
+ "learning_rate": 7.479789473684211e-05,
355
+ "loss": 0.2818,
356
+ "step": 13475
357
+ },
358
+ {
359
+ "epoch": 11.0,
360
+ "eval_rundkast_loss": 0.291464626789093,
361
+ "eval_rundkast_runtime": 31.4279,
362
+ "eval_rundkast_samples_per_second": 42.796,
363
+ "eval_rundkast_steps_per_second": 1.368,
364
+ "eval_rundkast_wer": 0.1403118040089087,
365
+ "step": 13475
366
+ },
367
+ {
368
+ "epoch": 11.0,
369
+ "eval_nb_samtale_loss": 0.5573220252990723,
370
+ "eval_nb_samtale_runtime": 35.8245,
371
+ "eval_nb_samtale_samples_per_second": 14.878,
372
+ "eval_nb_samtale_steps_per_second": 0.475,
373
+ "eval_nb_samtale_wer": 0.21744791666666666,
374
+ "step": 13475
375
+ },
376
+ {
377
+ "epoch": 11.0,
378
+ "eval_bigbrother_loss": 2.2074215412139893,
379
+ "eval_bigbrother_runtime": 39.3859,
380
+ "eval_bigbrother_samples_per_second": 34.784,
381
+ "eval_bigbrother_steps_per_second": 1.092,
382
+ "eval_bigbrother_wer": 0.5279142834125513,
383
+ "step": 13475
384
+ },
385
+ {
386
+ "epoch": 12.0,
387
+ "grad_norm": 2.796776533126831,
388
+ "learning_rate": 7.222105263157896e-05,
389
+ "loss": 0.2718,
390
+ "step": 14700
391
+ },
392
+ {
393
+ "epoch": 12.0,
394
+ "eval_rundkast_loss": 0.2955363988876343,
395
+ "eval_rundkast_runtime": 31.4317,
396
+ "eval_rundkast_samples_per_second": 42.791,
397
+ "eval_rundkast_steps_per_second": 1.368,
398
+ "eval_rundkast_wer": 0.1376869233216672,
399
+ "step": 14700
400
+ },
401
+ {
402
+ "epoch": 12.0,
403
+ "eval_nb_samtale_loss": 0.5371569991111755,
404
+ "eval_nb_samtale_runtime": 36.1485,
405
+ "eval_nb_samtale_samples_per_second": 14.745,
406
+ "eval_nb_samtale_steps_per_second": 0.47,
407
+ "eval_nb_samtale_wer": 0.21891276041666666,
408
+ "step": 14700
409
+ },
410
+ {
411
+ "epoch": 12.0,
412
+ "eval_bigbrother_loss": 2.0551300048828125,
413
+ "eval_bigbrother_runtime": 39.5331,
414
+ "eval_bigbrother_samples_per_second": 34.655,
415
+ "eval_bigbrother_steps_per_second": 1.088,
416
+ "eval_bigbrother_wer": 0.524611294610489,
417
+ "step": 14700
418
+ },
419
+ {
420
+ "epoch": 13.0,
421
+ "grad_norm": 2.6839964389801025,
422
+ "learning_rate": 6.96442105263158e-05,
423
+ "loss": 0.2614,
424
+ "step": 15925
425
+ },
426
+ {
427
+ "epoch": 13.0,
428
+ "eval_rundkast_loss": 0.28540924191474915,
429
+ "eval_rundkast_runtime": 32.0138,
430
+ "eval_rundkast_samples_per_second": 42.013,
431
+ "eval_rundkast_steps_per_second": 1.343,
432
+ "eval_rundkast_wer": 0.13959592745784283,
433
+ "step": 15925
434
+ },
435
+ {
436
+ "epoch": 13.0,
437
+ "eval_nb_samtale_loss": 0.5376082062721252,
438
+ "eval_nb_samtale_runtime": 36.0007,
439
+ "eval_nb_samtale_samples_per_second": 14.805,
440
+ "eval_nb_samtale_steps_per_second": 0.472,
441
+ "eval_nb_samtale_wer": 0.215087890625,
442
+ "step": 15925
443
+ },
444
+ {
445
+ "epoch": 13.0,
446
+ "eval_bigbrother_loss": 2.0468454360961914,
447
+ "eval_bigbrother_runtime": 39.695,
448
+ "eval_bigbrother_samples_per_second": 34.513,
449
+ "eval_bigbrother_steps_per_second": 1.083,
450
+ "eval_bigbrother_wer": 0.5228389591557239,
451
+ "step": 15925
452
+ },
453
+ {
454
+ "epoch": 14.0,
455
+ "grad_norm": 2.8357603549957275,
456
+ "learning_rate": 6.706526315789474e-05,
457
+ "loss": 0.2556,
458
+ "step": 17150
459
+ },
460
+ {
461
+ "epoch": 14.0,
462
+ "eval_rundkast_loss": 0.34074199199676514,
463
+ "eval_rundkast_runtime": 31.6633,
464
+ "eval_rundkast_samples_per_second": 42.478,
465
+ "eval_rundkast_steps_per_second": 1.358,
466
+ "eval_rundkast_wer": 0.13728921412663062,
467
+ "step": 17150
468
+ },
469
+ {
470
+ "epoch": 14.0,
471
+ "eval_nb_samtale_loss": 0.5684360861778259,
472
+ "eval_nb_samtale_runtime": 35.7903,
473
+ "eval_nb_samtale_samples_per_second": 14.892,
474
+ "eval_nb_samtale_steps_per_second": 0.475,
475
+ "eval_nb_samtale_wer": 0.214111328125,
476
+ "step": 17150
477
+ },
478
+ {
479
+ "epoch": 14.0,
480
+ "eval_bigbrother_loss": 2.249138593673706,
481
+ "eval_bigbrother_runtime": 39.6983,
482
+ "eval_bigbrother_samples_per_second": 34.51,
483
+ "eval_bigbrother_steps_per_second": 1.083,
484
+ "eval_bigbrother_wer": 0.5262225086602755,
485
+ "step": 17150
486
+ },
487
+ {
488
+ "epoch": 15.0,
489
+ "grad_norm": 4.659173965454102,
490
+ "learning_rate": 6.448842105263159e-05,
491
+ "loss": 0.2473,
492
+ "step": 18375
493
+ },
494
+ {
495
+ "epoch": 15.0,
496
+ "eval_rundkast_loss": 0.3245847225189209,
497
+ "eval_rundkast_runtime": 31.5529,
498
+ "eval_rundkast_samples_per_second": 42.627,
499
+ "eval_rundkast_steps_per_second": 1.363,
500
+ "eval_rundkast_wer": 0.13665287941457208,
501
+ "step": 18375
502
+ },
503
+ {
504
+ "epoch": 15.0,
505
+ "eval_nb_samtale_loss": 0.5528948307037354,
506
+ "eval_nb_samtale_runtime": 36.5998,
507
+ "eval_nb_samtale_samples_per_second": 14.563,
508
+ "eval_nb_samtale_steps_per_second": 0.464,
509
+ "eval_nb_samtale_wer": 0.21427408854166666,
510
+ "step": 18375
511
+ },
512
+ {
513
+ "epoch": 15.0,
514
+ "eval_bigbrother_loss": 2.2172372341156006,
515
+ "eval_bigbrother_runtime": 39.8062,
516
+ "eval_bigbrother_samples_per_second": 34.417,
517
+ "eval_bigbrother_steps_per_second": 1.08,
518
+ "eval_bigbrother_wer": 0.524611294610489,
519
+ "step": 18375
520
+ },
521
+ {
522
+ "epoch": 16.0,
523
+ "grad_norm": 4.046926975250244,
524
+ "learning_rate": 6.191157894736842e-05,
525
+ "loss": 0.2414,
526
+ "step": 19600
527
+ },
528
+ {
529
+ "epoch": 16.0,
530
+ "eval_rundkast_loss": 0.28036314249038696,
531
+ "eval_rundkast_runtime": 31.8175,
532
+ "eval_rundkast_samples_per_second": 42.272,
533
+ "eval_rundkast_steps_per_second": 1.351,
534
+ "eval_rundkast_wer": 0.1349825007954184,
535
+ "step": 19600
536
+ },
537
+ {
538
+ "epoch": 16.0,
539
+ "eval_nb_samtale_loss": 0.5292507410049438,
540
+ "eval_nb_samtale_runtime": 35.9006,
541
+ "eval_nb_samtale_samples_per_second": 14.847,
542
+ "eval_nb_samtale_steps_per_second": 0.474,
543
+ "eval_nb_samtale_wer": 0.21533203125,
544
+ "step": 19600
545
+ },
546
+ {
547
+ "epoch": 16.0,
548
+ "eval_bigbrother_loss": 2.0556137561798096,
549
+ "eval_bigbrother_runtime": 39.6218,
550
+ "eval_bigbrother_samples_per_second": 34.577,
551
+ "eval_bigbrother_steps_per_second": 1.085,
552
+ "eval_bigbrother_wer": 0.5206638201885121,
553
+ "step": 19600
554
+ },
555
+ {
556
+ "epoch": 17.0,
557
+ "grad_norm": 2.713061809539795,
558
+ "learning_rate": 5.933263157894737e-05,
559
+ "loss": 0.2328,
560
+ "step": 20825
561
+ },
562
+ {
563
+ "epoch": 17.0,
564
+ "eval_rundkast_loss": 0.3071937561035156,
565
+ "eval_rundkast_runtime": 31.6947,
566
+ "eval_rundkast_samples_per_second": 42.436,
567
+ "eval_rundkast_steps_per_second": 1.357,
568
+ "eval_rundkast_wer": 0.13490295895641108,
569
+ "step": 20825
570
+ },
571
+ {
572
+ "epoch": 17.0,
573
+ "eval_nb_samtale_loss": 0.5693681240081787,
574
+ "eval_nb_samtale_runtime": 35.8134,
575
+ "eval_nb_samtale_samples_per_second": 14.883,
576
+ "eval_nb_samtale_steps_per_second": 0.475,
577
+ "eval_nb_samtale_wer": 0.21476236979166666,
578
+ "step": 20825
579
+ },
580
+ {
581
+ "epoch": 17.0,
582
+ "eval_bigbrother_loss": 2.2417101860046387,
583
+ "eval_bigbrother_runtime": 39.6674,
584
+ "eval_bigbrother_samples_per_second": 34.537,
585
+ "eval_bigbrother_steps_per_second": 1.084,
586
+ "eval_bigbrother_wer": 0.5163135422540884,
587
+ "step": 20825
588
+ },
589
+ {
590
+ "epoch": 18.0,
591
+ "grad_norm": 3.662180185317993,
592
+ "learning_rate": 5.6753684210526313e-05,
593
+ "loss": 0.228,
594
+ "step": 22050
595
+ },
596
+ {
597
+ "epoch": 18.0,
598
+ "eval_rundkast_loss": 0.3300894796848297,
599
+ "eval_rundkast_runtime": 31.6144,
600
+ "eval_rundkast_samples_per_second": 42.544,
601
+ "eval_rundkast_steps_per_second": 1.36,
602
+ "eval_rundkast_wer": 0.13140311804008908,
603
+ "step": 22050
604
+ },
605
+ {
606
+ "epoch": 18.0,
607
+ "eval_nb_samtale_loss": 0.6102511286735535,
608
+ "eval_nb_samtale_runtime": 36.3906,
609
+ "eval_nb_samtale_samples_per_second": 14.647,
610
+ "eval_nb_samtale_steps_per_second": 0.467,
611
+ "eval_nb_samtale_wer": 0.21280924479166666,
612
+ "step": 22050
613
+ },
614
+ {
615
+ "epoch": 18.0,
616
+ "eval_bigbrother_loss": 2.433946371078491,
617
+ "eval_bigbrother_runtime": 39.8718,
618
+ "eval_bigbrother_samples_per_second": 34.36,
619
+ "eval_bigbrother_steps_per_second": 1.078,
620
+ "eval_bigbrother_wer": 0.5265447514702328,
621
+ "step": 22050
622
+ },
623
+ {
624
+ "epoch": 19.0,
625
+ "grad_norm": 3.2172813415527344,
626
+ "learning_rate": 5.417473684210527e-05,
627
+ "loss": 0.2227,
628
+ "step": 23275
629
+ },
630
+ {
631
+ "epoch": 19.0,
632
+ "eval_rundkast_loss": 0.2971687316894531,
633
+ "eval_rundkast_runtime": 31.7336,
634
+ "eval_rundkast_samples_per_second": 42.384,
635
+ "eval_rundkast_steps_per_second": 1.355,
636
+ "eval_rundkast_wer": 0.12949411390391347,
637
+ "step": 23275
638
+ },
639
+ {
640
+ "epoch": 19.0,
641
+ "eval_nb_samtale_loss": 0.5440128445625305,
642
+ "eval_nb_samtale_runtime": 35.6562,
643
+ "eval_nb_samtale_samples_per_second": 14.948,
644
+ "eval_nb_samtale_steps_per_second": 0.477,
645
+ "eval_nb_samtale_wer": 0.21337890625,
646
+ "step": 23275
647
+ },
648
+ {
649
+ "epoch": 19.0,
650
+ "eval_bigbrother_loss": 2.229306936264038,
651
+ "eval_bigbrother_runtime": 39.499,
652
+ "eval_bigbrother_samples_per_second": 34.684,
653
+ "eval_bigbrother_steps_per_second": 1.089,
654
+ "eval_bigbrother_wer": 0.5155884959316845,
655
+ "step": 23275
656
+ },
657
+ {
658
+ "epoch": 20.0,
659
+ "grad_norm": 3.76371431350708,
660
+ "learning_rate": 5.159789473684211e-05,
661
+ "loss": 0.2201,
662
+ "step": 24500
663
+ },
664
+ {
665
+ "epoch": 20.0,
666
+ "eval_rundkast_loss": 0.33149319887161255,
667
+ "eval_rundkast_runtime": 31.7066,
668
+ "eval_rundkast_samples_per_second": 42.42,
669
+ "eval_rundkast_steps_per_second": 1.356,
670
+ "eval_rundkast_wer": 0.13211899459115495,
671
+ "step": 24500
672
+ },
673
+ {
674
+ "epoch": 20.0,
675
+ "eval_nb_samtale_loss": 0.5641424655914307,
676
+ "eval_nb_samtale_runtime": 35.6835,
677
+ "eval_nb_samtale_samples_per_second": 14.937,
678
+ "eval_nb_samtale_steps_per_second": 0.476,
679
+ "eval_nb_samtale_wer": 0.214599609375,
680
+ "step": 24500
681
+ },
682
+ {
683
+ "epoch": 20.0,
684
+ "eval_bigbrother_loss": 2.2568540573120117,
685
+ "eval_bigbrother_runtime": 39.6597,
686
+ "eval_bigbrother_samples_per_second": 34.544,
687
+ "eval_bigbrother_steps_per_second": 1.084,
688
+ "eval_bigbrother_wer": 0.5247724160154676,
689
+ "step": 24500
690
+ },
691
+ {
692
+ "epoch": 21.0,
693
+ "grad_norm": 2.644437789916992,
694
+ "learning_rate": 4.9018947368421054e-05,
695
+ "loss": 0.2104,
696
+ "step": 25725
697
+ },
698
+ {
699
+ "epoch": 21.0,
700
+ "eval_rundkast_loss": 0.32245177030563354,
701
+ "eval_rundkast_runtime": 31.7772,
702
+ "eval_rundkast_samples_per_second": 42.326,
703
+ "eval_rundkast_steps_per_second": 1.353,
704
+ "eval_rundkast_wer": 0.1305281578110086,
705
+ "step": 25725
706
+ },
707
+ {
708
+ "epoch": 21.0,
709
+ "eval_nb_samtale_loss": 0.5810007452964783,
710
+ "eval_nb_samtale_runtime": 36.1863,
711
+ "eval_nb_samtale_samples_per_second": 14.729,
712
+ "eval_nb_samtale_steps_per_second": 0.47,
713
+ "eval_nb_samtale_wer": 0.2138671875,
714
+ "step": 25725
715
+ },
716
+ {
717
+ "epoch": 21.0,
718
+ "eval_bigbrother_loss": 2.2536792755126953,
719
+ "eval_bigbrother_runtime": 40.2452,
720
+ "eval_bigbrother_samples_per_second": 34.041,
721
+ "eval_bigbrother_steps_per_second": 1.068,
722
+ "eval_bigbrother_wer": 0.514218963989366,
723
+ "step": 25725
724
+ },
725
+ {
726
+ "epoch": 22.0,
727
+ "grad_norm": 4.817940711975098,
728
+ "learning_rate": 4.64421052631579e-05,
729
+ "loss": 0.2078,
730
+ "step": 26950
731
+ },
732
+ {
733
+ "epoch": 22.0,
734
+ "eval_rundkast_loss": 0.30675747990608215,
735
+ "eval_rundkast_runtime": 31.923,
736
+ "eval_rundkast_samples_per_second": 42.133,
737
+ "eval_rundkast_steps_per_second": 1.347,
738
+ "eval_rundkast_wer": 0.13068724148902322,
739
+ "step": 26950
740
+ },
741
+ {
742
+ "epoch": 22.0,
743
+ "eval_nb_samtale_loss": 0.5920718312263489,
744
+ "eval_nb_samtale_runtime": 35.946,
745
+ "eval_nb_samtale_samples_per_second": 14.828,
746
+ "eval_nb_samtale_steps_per_second": 0.473,
747
+ "eval_nb_samtale_wer": 0.21085611979166666,
748
+ "step": 26950
749
+ },
750
+ {
751
+ "epoch": 22.0,
752
+ "eval_bigbrother_loss": 2.283834457397461,
753
+ "eval_bigbrother_runtime": 39.6029,
754
+ "eval_bigbrother_samples_per_second": 34.593,
755
+ "eval_bigbrother_steps_per_second": 1.086,
756
+ "eval_bigbrother_wer": 0.5115604608072183,
757
+ "step": 26950
758
+ },
759
+ {
760
+ "epoch": 23.0,
761
+ "grad_norm": 2.2001821994781494,
762
+ "learning_rate": 4.3863157894736846e-05,
763
+ "loss": 0.2039,
764
+ "step": 28175
765
+ },
766
+ {
767
+ "epoch": 23.0,
768
+ "eval_rundkast_loss": 0.31590384244918823,
769
+ "eval_rundkast_runtime": 31.6509,
770
+ "eval_rundkast_samples_per_second": 42.495,
771
+ "eval_rundkast_steps_per_second": 1.359,
772
+ "eval_rundkast_wer": 0.13005090677696468,
773
+ "step": 28175
774
+ },
775
+ {
776
+ "epoch": 23.0,
777
+ "eval_nb_samtale_loss": 0.5807461142539978,
778
+ "eval_nb_samtale_runtime": 35.4812,
779
+ "eval_nb_samtale_samples_per_second": 15.022,
780
+ "eval_nb_samtale_steps_per_second": 0.479,
781
+ "eval_nb_samtale_wer": 0.21044921875,
782
+ "step": 28175
783
+ },
784
+ {
785
+ "epoch": 23.0,
786
+ "eval_bigbrother_loss": 2.346367835998535,
787
+ "eval_bigbrother_runtime": 39.6789,
788
+ "eval_bigbrother_samples_per_second": 34.527,
789
+ "eval_bigbrother_steps_per_second": 1.084,
790
+ "eval_bigbrother_wer": 0.5138161604769194,
791
+ "step": 28175
792
+ },
793
+ {
794
+ "epoch": 24.0,
795
+ "grad_norm": 3.352459669113159,
796
+ "learning_rate": 4.128631578947368e-05,
797
+ "loss": 0.1973,
798
+ "step": 29400
799
+ },
800
+ {
801
+ "epoch": 24.0,
802
+ "eval_rundkast_loss": 0.3300403654575348,
803
+ "eval_rundkast_runtime": 31.6022,
804
+ "eval_rundkast_samples_per_second": 42.56,
805
+ "eval_rundkast_steps_per_second": 1.361,
806
+ "eval_rundkast_wer": 0.1322780782691696,
807
+ "step": 29400
808
+ },
809
+ {
810
+ "epoch": 24.0,
811
+ "eval_nb_samtale_loss": 0.5806035995483398,
812
+ "eval_nb_samtale_runtime": 35.9632,
813
+ "eval_nb_samtale_samples_per_second": 14.821,
814
+ "eval_nb_samtale_steps_per_second": 0.473,
815
+ "eval_nb_samtale_wer": 0.21126302083333334,
816
+ "step": 29400
817
+ },
818
+ {
819
+ "epoch": 24.0,
820
+ "eval_bigbrother_loss": 2.317692518234253,
821
+ "eval_bigbrother_runtime": 40.1241,
822
+ "eval_bigbrother_samples_per_second": 34.144,
823
+ "eval_bigbrother_steps_per_second": 1.072,
824
+ "eval_bigbrother_wer": 0.5184081205188109,
825
+ "step": 29400
826
+ },
827
+ {
828
+ "epoch": 25.0,
829
+ "grad_norm": 2.7289795875549316,
830
+ "learning_rate": 3.870736842105263e-05,
831
+ "loss": 0.1962,
832
+ "step": 30625
833
+ },
834
+ {
835
+ "epoch": 25.0,
836
+ "eval_rundkast_loss": 0.34277400374412537,
837
+ "eval_rundkast_runtime": 32.0615,
838
+ "eval_rundkast_samples_per_second": 41.951,
839
+ "eval_rundkast_steps_per_second": 1.341,
840
+ "eval_rundkast_wer": 0.1319599109131403,
841
+ "step": 30625
842
+ },
843
+ {
844
+ "epoch": 25.0,
845
+ "eval_nb_samtale_loss": 0.6326170563697815,
846
+ "eval_nb_samtale_runtime": 35.8107,
847
+ "eval_nb_samtale_samples_per_second": 14.884,
848
+ "eval_nb_samtale_steps_per_second": 0.475,
849
+ "eval_nb_samtale_wer": 0.21183268229166666,
850
+ "step": 30625
851
+ },
852
+ {
853
+ "epoch": 25.0,
854
+ "eval_bigbrother_loss": 2.443657875061035,
855
+ "eval_bigbrother_runtime": 39.6514,
856
+ "eval_bigbrother_samples_per_second": 34.551,
857
+ "eval_bigbrother_steps_per_second": 1.084,
858
+ "eval_bigbrother_wer": 0.5142995246918554,
859
+ "step": 30625
860
+ },
861
+ {
862
+ "epoch": 26.0,
863
+ "grad_norm": 3.723717212677002,
864
+ "learning_rate": 3.612842105263158e-05,
865
+ "loss": 0.1887,
866
+ "step": 31850
867
+ },
868
+ {
869
+ "epoch": 26.0,
870
+ "eval_rundkast_loss": 0.32608622312545776,
871
+ "eval_rundkast_runtime": 31.9056,
872
+ "eval_rundkast_samples_per_second": 42.156,
873
+ "eval_rundkast_steps_per_second": 1.348,
874
+ "eval_rundkast_wer": 0.13267578746420616,
875
+ "step": 31850
876
+ },
877
+ {
878
+ "epoch": 26.0,
879
+ "eval_nb_samtale_loss": 0.6086393594741821,
880
+ "eval_nb_samtale_runtime": 35.8839,
881
+ "eval_nb_samtale_samples_per_second": 14.853,
882
+ "eval_nb_samtale_steps_per_second": 0.474,
883
+ "eval_nb_samtale_wer": 0.21004231770833334,
884
+ "step": 31850
885
+ },
886
+ {
887
+ "epoch": 26.0,
888
+ "eval_bigbrother_loss": 2.344693422317505,
889
+ "eval_bigbrother_runtime": 39.7842,
890
+ "eval_bigbrother_samples_per_second": 34.436,
891
+ "eval_bigbrother_steps_per_second": 1.081,
892
+ "eval_bigbrother_wer": 0.5134939176669621,
893
+ "step": 31850
894
+ },
895
+ {
896
+ "epoch": 27.0,
897
+ "grad_norm": 3.741575241088867,
898
+ "learning_rate": 3.3551578947368424e-05,
899
+ "loss": 0.1886,
900
+ "step": 33075
901
+ },
902
+ {
903
+ "epoch": 27.0,
904
+ "eval_rundkast_loss": 0.32595619559288025,
905
+ "eval_rundkast_runtime": 31.7292,
906
+ "eval_rundkast_samples_per_second": 42.39,
907
+ "eval_rundkast_steps_per_second": 1.355,
908
+ "eval_rundkast_wer": 0.13164174355711103,
909
+ "step": 33075
910
+ },
911
+ {
912
+ "epoch": 27.0,
913
+ "eval_nb_samtale_loss": 0.6121112704277039,
914
+ "eval_nb_samtale_runtime": 35.7885,
915
+ "eval_nb_samtale_samples_per_second": 14.893,
916
+ "eval_nb_samtale_steps_per_second": 0.475,
917
+ "eval_nb_samtale_wer": 0.20890299479166666,
918
+ "step": 33075
919
+ },
920
+ {
921
+ "epoch": 27.0,
922
+ "eval_bigbrother_loss": 2.368227005004883,
923
+ "eval_bigbrother_runtime": 39.9121,
924
+ "eval_bigbrother_samples_per_second": 34.325,
925
+ "eval_bigbrother_steps_per_second": 1.077,
926
+ "eval_bigbrother_wer": 0.511238217997261,
927
+ "step": 33075
928
+ },
929
+ {
930
+ "epoch": 28.0,
931
+ "grad_norm": 5.783115863800049,
932
+ "learning_rate": 3.097263157894737e-05,
933
+ "loss": 0.1836,
934
+ "step": 34300
935
+ },
936
+ {
937
+ "epoch": 28.0,
938
+ "eval_rundkast_loss": 0.33696532249450684,
939
+ "eval_rundkast_runtime": 31.5417,
940
+ "eval_rundkast_samples_per_second": 42.642,
941
+ "eval_rundkast_steps_per_second": 1.363,
942
+ "eval_rundkast_wer": 0.12949411390391347,
943
+ "step": 34300
944
+ },
945
+ {
946
+ "epoch": 28.0,
947
+ "eval_nb_samtale_loss": 0.6101709008216858,
948
+ "eval_nb_samtale_runtime": 35.522,
949
+ "eval_nb_samtale_samples_per_second": 15.005,
950
+ "eval_nb_samtale_steps_per_second": 0.479,
951
+ "eval_nb_samtale_wer": 0.21012369791666666,
952
+ "step": 34300
953
+ },
954
+ {
955
+ "epoch": 28.0,
956
+ "eval_bigbrother_loss": 2.353733777999878,
957
+ "eval_bigbrother_runtime": 39.5513,
958
+ "eval_bigbrother_samples_per_second": 34.639,
959
+ "eval_bigbrother_steps_per_second": 1.087,
960
+ "eval_bigbrother_wer": 0.5056795295254974,
961
+ "step": 34300
962
+ },
963
+ {
964
+ "epoch": 29.0,
965
+ "grad_norm": 8.664693832397461,
966
+ "learning_rate": 2.8395789473684216e-05,
967
+ "loss": 0.1804,
968
+ "step": 35525
969
+ },
970
+ {
971
+ "epoch": 29.0,
972
+ "eval_rundkast_loss": 0.3452693819999695,
973
+ "eval_rundkast_runtime": 31.2833,
974
+ "eval_rundkast_samples_per_second": 42.994,
975
+ "eval_rundkast_steps_per_second": 1.375,
976
+ "eval_rundkast_wer": 0.1309258670060452,
977
+ "step": 35525
978
+ },
979
+ {
980
+ "epoch": 29.0,
981
+ "eval_nb_samtale_loss": 0.6237297654151917,
982
+ "eval_nb_samtale_runtime": 35.8619,
983
+ "eval_nb_samtale_samples_per_second": 14.863,
984
+ "eval_nb_samtale_steps_per_second": 0.474,
985
+ "eval_nb_samtale_wer": 0.21134440104166666,
986
+ "step": 35525
987
+ },
988
+ {
989
+ "epoch": 29.0,
990
+ "eval_bigbrother_loss": 2.3944995403289795,
991
+ "eval_bigbrother_runtime": 39.4367,
992
+ "eval_bigbrother_samples_per_second": 34.739,
993
+ "eval_bigbrother_steps_per_second": 1.09,
994
+ "eval_bigbrother_wer": 0.5084185934101345,
995
+ "step": 35525
996
+ },
997
+ {
998
+ "epoch": 30.0,
999
+ "grad_norm": 4.139631748199463,
1000
+ "learning_rate": 2.5818947368421053e-05,
1001
+ "loss": 0.1766,
1002
+ "step": 36750
1003
+ },
1004
+ {
1005
+ "epoch": 30.0,
1006
+ "eval_rundkast_loss": 0.3432329297065735,
1007
+ "eval_rundkast_runtime": 31.3849,
1008
+ "eval_rundkast_samples_per_second": 42.855,
1009
+ "eval_rundkast_steps_per_second": 1.37,
1010
+ "eval_rundkast_wer": 0.13020999045497933,
1011
+ "step": 36750
1012
+ },
1013
+ {
1014
+ "epoch": 30.0,
1015
+ "eval_nb_samtale_loss": 0.6131173968315125,
1016
+ "eval_nb_samtale_runtime": 35.6634,
1017
+ "eval_nb_samtale_samples_per_second": 14.945,
1018
+ "eval_nb_samtale_steps_per_second": 0.477,
1019
+ "eval_nb_samtale_wer": 0.21199544270833334,
1020
+ "step": 36750
1021
+ },
1022
+ {
1023
+ "epoch": 30.0,
1024
+ "eval_bigbrother_loss": 2.3949081897735596,
1025
+ "eval_bigbrother_runtime": 39.8587,
1026
+ "eval_bigbrother_samples_per_second": 34.371,
1027
+ "eval_bigbrother_steps_per_second": 1.079,
1028
+ "eval_bigbrother_wer": 0.510271489567389,
1029
+ "step": 36750
1030
+ },
1031
+ {
1032
+ "epoch": 31.0,
1033
+ "grad_norm": 3.3099727630615234,
1034
+ "learning_rate": 2.324e-05,
1035
+ "loss": 0.1767,
1036
+ "step": 37975
1037
+ },
1038
+ {
1039
+ "epoch": 31.0,
1040
+ "eval_rundkast_loss": 0.3425343930721283,
1041
+ "eval_rundkast_runtime": 31.3869,
1042
+ "eval_rundkast_samples_per_second": 42.852,
1043
+ "eval_rundkast_steps_per_second": 1.37,
1044
+ "eval_rundkast_wer": 0.1291759465478842,
1045
+ "step": 37975
1046
+ },
1047
+ {
1048
+ "epoch": 31.0,
1049
+ "eval_nb_samtale_loss": 0.6133290529251099,
1050
+ "eval_nb_samtale_runtime": 35.2473,
1051
+ "eval_nb_samtale_samples_per_second": 15.122,
1052
+ "eval_nb_samtale_steps_per_second": 0.482,
1053
+ "eval_nb_samtale_wer": 0.21044921875,
1054
+ "step": 37975
1055
+ },
1056
+ {
1057
+ "epoch": 31.0,
1058
+ "eval_bigbrother_loss": 2.503601312637329,
1059
+ "eval_bigbrother_runtime": 39.2061,
1060
+ "eval_bigbrother_samples_per_second": 34.944,
1061
+ "eval_bigbrother_steps_per_second": 1.097,
1062
+ "eval_bigbrother_wer": 0.5097881253524531,
1063
+ "step": 37975
1064
+ },
1065
+ {
1066
+ "epoch": 32.0,
1067
+ "grad_norm": 3.798198938369751,
1068
+ "learning_rate": 2.0661052631578946e-05,
1069
+ "loss": 0.1712,
1070
+ "step": 39200
1071
+ },
1072
+ {
1073
+ "epoch": 32.0,
1074
+ "eval_rundkast_loss": 0.3596391975879669,
1075
+ "eval_rundkast_runtime": 31.2765,
1076
+ "eval_rundkast_samples_per_second": 43.004,
1077
+ "eval_rundkast_steps_per_second": 1.375,
1078
+ "eval_rundkast_wer": 0.128380528157811,
1079
+ "step": 39200
1080
+ },
1081
+ {
1082
+ "epoch": 32.0,
1083
+ "eval_nb_samtale_loss": 0.6345717906951904,
1084
+ "eval_nb_samtale_runtime": 36.1693,
1085
+ "eval_nb_samtale_samples_per_second": 14.736,
1086
+ "eval_nb_samtale_steps_per_second": 0.47,
1087
+ "eval_nb_samtale_wer": 0.21036783854166666,
1088
+ "step": 39200
1089
+ },
1090
+ {
1091
+ "epoch": 32.0,
1092
+ "eval_bigbrother_loss": 2.506143569946289,
1093
+ "eval_bigbrother_runtime": 39.8743,
1094
+ "eval_bigbrother_samples_per_second": 34.358,
1095
+ "eval_bigbrother_steps_per_second": 1.078,
1096
+ "eval_bigbrother_wer": 0.5095464432449851,
1097
+ "step": 39200
1098
+ },
1099
+ {
1100
+ "epoch": 33.0,
1101
+ "grad_norm": 3.5819003582000732,
1102
+ "learning_rate": 1.8082105263157895e-05,
1103
+ "loss": 0.1712,
1104
+ "step": 40425
1105
+ },
1106
+ {
1107
+ "epoch": 33.0,
1108
+ "eval_rundkast_loss": 0.3613539934158325,
1109
+ "eval_rundkast_runtime": 31.3392,
1110
+ "eval_rundkast_samples_per_second": 42.918,
1111
+ "eval_rundkast_steps_per_second": 1.372,
1112
+ "eval_rundkast_wer": 0.12615335666560612,
1113
+ "step": 40425
1114
+ },
1115
+ {
1116
+ "epoch": 33.0,
1117
+ "eval_nb_samtale_loss": 0.644898533821106,
1118
+ "eval_nb_samtale_runtime": 35.4393,
1119
+ "eval_nb_samtale_samples_per_second": 15.04,
1120
+ "eval_nb_samtale_steps_per_second": 0.48,
1121
+ "eval_nb_samtale_wer": 0.20914713541666666,
1122
+ "step": 40425
1123
+ },
1124
+ {
1125
+ "epoch": 33.0,
1126
+ "eval_bigbrother_loss": 2.489149570465088,
1127
+ "eval_bigbrother_runtime": 39.804,
1128
+ "eval_bigbrother_samples_per_second": 34.419,
1129
+ "eval_bigbrother_steps_per_second": 1.08,
1130
+ "eval_bigbrother_wer": 0.5090630790300491,
1131
+ "step": 40425
1132
+ }
1133
+ ],
1134
+ "logging_steps": 500,
1135
+ "max_steps": 49000,
1136
+ "num_input_tokens_seen": 0,
1137
+ "num_train_epochs": 40,
1138
+ "save_steps": 500,
1139
+ "total_flos": 1.974178763172653e+20,
1140
+ "train_batch_size": 48,
1141
+ "trial_name": null,
1142
+ "trial_params": null
1143
+ }
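The trainer state above tracks word error rate (eval_*_wer) per evaluation set, with the best checkpoint selected on Rundkast WER (best_metric ≈ 0.126 at step 40425). A hedged sketch of how such a WER figure is computed, shown here with the jiwer library on hypothetical transcripts rather than the author's exact metric code:

# Hedged sketch: word error rate = (substitutions + deletions + insertions) / reference words.
import jiwer

references = ["det var en fin dag", "hun kom hjem i g\u00e5r"]
hypotheses = ["det var en fin dag", "hun kom hjemme i g\u00e5r"]

print(jiwer.wer(references, hypotheses))  # 1 substitution over 10 reference words -> 0.1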
checkpoint-40425/training_args.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:76b1726f88a10b6122b423394ba676a6e1dc0ef8bf3b3a06cb5dae0ad5561656
+ size 4984
checkpoint-49000/config.json ADDED
@@ -0,0 +1,116 @@
+ {
+ "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
+ "activation_dropout": 0.055,
+ "adapter_attn_dim": null,
+ "adapter_kernel_size": 3,
+ "adapter_stride": 2,
+ "add_adapter": false,
+ "apply_spec_augment": true,
+ "architectures": [
+ "Wav2Vec2ForCTC"
+ ],
+ "attention_dropout": 0.094,
+ "bos_token_id": 1,
+ "classifier_proj_size": 256,
+ "codevector_dim": 768,
+ "contrastive_logits_temperature": 0.1,
+ "conv_bias": true,
+ "conv_dim": [
+ 512,
+ 512,
+ 512,
+ 512,
+ 512,
+ 512,
+ 512
+ ],
+ "conv_kernel": [
+ 10,
+ 3,
+ 3,
+ 3,
+ 3,
+ 2,
+ 2
+ ],
+ "conv_stride": [
+ 5,
+ 2,
+ 2,
+ 2,
+ 2,
+ 2,
+ 2
+ ],
+ "ctc_loss_reduction": "mean",
+ "ctc_zero_infinity": true,
+ "diversity_loss_weight": 0.1,
+ "do_stable_layer_norm": true,
+ "eos_token_id": 2,
+ "feat_extract_activation": "gelu",
+ "feat_extract_dropout": 0.0,
+ "feat_extract_norm": "layer",
+ "feat_proj_dropout": 0.04,
+ "feat_quantizer_dropout": 0.0,
+ "final_dropout": 0.0,
+ "hidden_act": "gelu",
+ "hidden_dropout": 0.047,
+ "hidden_size": 1024,
+ "initializer_range": 0.02,
+ "intermediate_size": 4096,
+ "layer_norm_eps": 1e-05,
+ "layerdrop": 0.041,
+ "mask_channel_length": 10,
+ "mask_channel_min_space": 1,
+ "mask_channel_other": 0.0,
+ "mask_channel_prob": 0.0,
+ "mask_channel_selection": "static",
+ "mask_feature_length": 64,
+ "mask_feature_min_masks": 0,
+ "mask_feature_prob": 0.25,
+ "mask_time_length": 10,
+ "mask_time_min_masks": 2,
+ "mask_time_min_space": 1,
+ "mask_time_other": 0.0,
+ "mask_time_prob": 0.082,
+ "mask_time_selection": "static",
+ "model_type": "wav2vec2",
+ "num_adapter_layers": 3,
+ "num_attention_heads": 16,
+ "num_codevector_groups": 2,
+ "num_codevectors_per_group": 320,
+ "num_conv_pos_embedding_groups": 16,
+ "num_conv_pos_embeddings": 128,
+ "num_feat_extract_layers": 7,
+ "num_hidden_layers": 24,
+ "num_negatives": 100,
+ "output_hidden_size": 1024,
+ "pad_token_id": 31,
+ "proj_codevector_dim": 768,
+ "tdnn_dilation": [
+ 1,
+ 2,
+ 3,
+ 1,
+ 1
+ ],
+ "tdnn_dim": [
+ 512,
+ 512,
+ 512,
+ 512,
+ 1500
+ ],
+ "tdnn_kernel": [
+ 5,
+ 3,
+ 3,
+ 1,
+ 1
+ ],
+ "torch_dtype": "float32",
+ "transformers_version": "4.38.1",
+ "use_weighted_layer_sum": false,
+ "vocab_size": 34,
+ "xvector_output_dim": 512
+ }
checkpoint-49000/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:ba6c792b39ddb54d9fa2e70e7949b477cd7ffd7f5159cc8dd45eafb363ab94ca
+ size 1261946880
checkpoint-49000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:68be997161d0ae0df3b3126259f79c514a2618607ed6eef3316ce629fb0e74d2
+ size 2490438582
checkpoint-49000/preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
+ {
+ "do_normalize": true,
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+ "feature_size": 1,
+ "padding_side": "right",
+ "padding_value": 0,
+ "processor_class": "Wav2Vec2ProcessorWithLM",
+ "return_attention_mask": true,
+ "sampling_rate": 16000
+ }
checkpoint-49000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:04a33a03ff70cdcef08a945cd5fadd32e4d37e76465d8fdb3c47b1535b24ec7e
+ size 14308
checkpoint-49000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0aa1196d52948121882416750adc484a35b1744e8e9422cd1bceec8a5dfa8e04
+ size 1064
checkpoint-49000/trainer_state.json ADDED
@@ -0,0 +1,1381 @@
1
+ {
2
+ "best_metric": 0.12615335666560612,
3
+ "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/single/RUND/30.05/checkpoint-40425",
4
+ "epoch": 40.0,
5
+ "eval_steps": 500,
6
+ "global_step": 49000,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 3.7080862522125244,
14
+ "learning_rate": 8.16e-05,
15
+ "loss": 0.5467,
16
+ "step": 1225
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_rundkast_loss": 0.30231863260269165,
21
+ "eval_rundkast_runtime": 32.5305,
22
+ "eval_rundkast_samples_per_second": 41.346,
23
+ "eval_rundkast_steps_per_second": 1.322,
24
+ "eval_rundkast_wer": 0.19145720649061407,
25
+ "step": 1225
26
+ },
27
+ {
28
+ "epoch": 1.0,
29
+ "eval_nb_samtale_loss": 0.5260343551635742,
30
+ "eval_nb_samtale_runtime": 37.7602,
31
+ "eval_nb_samtale_samples_per_second": 14.115,
32
+ "eval_nb_samtale_steps_per_second": 0.45,
33
+ "eval_nb_samtale_wer": 0.2622884114583333,
34
+ "step": 1225
35
+ },
36
+ {
37
+ "epoch": 1.0,
38
+ "eval_bigbrother_loss": 1.871883511543274,
39
+ "eval_bigbrother_runtime": 40.2594,
40
+ "eval_bigbrother_samples_per_second": 34.029,
41
+ "eval_bigbrother_steps_per_second": 1.068,
42
+ "eval_bigbrother_wer": 0.6054136792072827,
43
+ "step": 1225
44
+ },
45
+ {
46
+ "epoch": 2.0,
47
+ "grad_norm": 2.773157835006714,
48
+ "learning_rate": 9.800210526315789e-05,
49
+ "loss": 0.4578,
50
+ "step": 2450
51
+ },
52
+ {
53
+ "epoch": 2.0,
54
+ "eval_rundkast_loss": 0.31110912561416626,
55
+ "eval_rundkast_runtime": 31.8038,
56
+ "eval_rundkast_samples_per_second": 42.291,
57
+ "eval_rundkast_steps_per_second": 1.352,
58
+ "eval_rundkast_wer": 0.17236716512885777,
59
+ "step": 2450
60
+ },
61
+ {
62
+ "epoch": 2.0,
63
+ "eval_nb_samtale_loss": 0.5243741273880005,
64
+ "eval_nb_samtale_runtime": 37.3513,
65
+ "eval_nb_samtale_samples_per_second": 14.27,
66
+ "eval_nb_samtale_steps_per_second": 0.455,
67
+ "eval_nb_samtale_wer": 0.24796549479166666,
68
+ "step": 2450
69
+ },
70
+ {
71
+ "epoch": 2.0,
72
+ "eval_bigbrother_loss": 1.9609774351119995,
73
+ "eval_bigbrother_runtime": 40.3603,
74
+ "eval_bigbrother_samples_per_second": 33.944,
75
+ "eval_bigbrother_steps_per_second": 1.065,
76
+ "eval_bigbrother_wer": 0.5801981793281238,
77
+ "step": 2450
78
+ },
79
+ {
80
+ "epoch": 3.0,
81
+ "grad_norm": 2.448107957839966,
82
+ "learning_rate": 9.542315789473685e-05,
83
+ "loss": 0.4141,
84
+ "step": 3675
85
+ },
86
+ {
87
+ "epoch": 3.0,
88
+ "eval_rundkast_loss": 0.28843000531196594,
89
+ "eval_rundkast_runtime": 31.4496,
90
+ "eval_rundkast_samples_per_second": 42.767,
91
+ "eval_rundkast_steps_per_second": 1.367,
92
+ "eval_rundkast_wer": 0.1697422844416163,
93
+ "step": 3675
94
+ },
95
+ {
96
+ "epoch": 3.0,
97
+ "eval_nb_samtale_loss": 0.5364730954170227,
98
+ "eval_nb_samtale_runtime": 36.197,
99
+ "eval_nb_samtale_samples_per_second": 14.725,
100
+ "eval_nb_samtale_steps_per_second": 0.47,
101
+ "eval_nb_samtale_wer": 0.24007161458333334,
102
+ "step": 3675
103
+ },
104
+ {
105
+ "epoch": 3.0,
106
+ "eval_bigbrother_loss": 1.9849306344985962,
107
+ "eval_bigbrother_runtime": 39.5166,
108
+ "eval_bigbrother_samples_per_second": 34.669,
109
+ "eval_bigbrother_steps_per_second": 1.088,
110
+ "eval_bigbrother_wer": 0.5797953758156771,
111
+ "step": 3675
112
+ },
113
+ {
114
+ "epoch": 4.0,
115
+ "grad_norm": 5.366342544555664,
116
+ "learning_rate": 9.28463157894737e-05,
117
+ "loss": 0.3852,
118
+ "step": 4900
119
+ },
120
+ {
121
+ "epoch": 4.0,
122
+ "eval_rundkast_loss": 0.2692658603191376,
123
+ "eval_rundkast_runtime": 31.6518,
124
+ "eval_rundkast_samples_per_second": 42.494,
125
+ "eval_rundkast_steps_per_second": 1.359,
126
+ "eval_rundkast_wer": 0.16321985364301622,
127
+ "step": 4900
128
+ },
129
+ {
130
+ "epoch": 4.0,
131
+ "eval_nb_samtale_loss": 0.5346274971961975,
132
+ "eval_nb_samtale_runtime": 36.5542,
133
+ "eval_nb_samtale_samples_per_second": 14.581,
134
+ "eval_nb_samtale_steps_per_second": 0.465,
135
+ "eval_nb_samtale_wer": 0.23860677083333334,
136
+ "step": 4900
137
+ },
138
+ {
139
+ "epoch": 4.0,
140
+ "eval_bigbrother_loss": 1.9121719598770142,
141
+ "eval_bigbrother_runtime": 40.1737,
142
+ "eval_bigbrother_samples_per_second": 34.102,
143
+ "eval_bigbrother_steps_per_second": 1.07,
144
+ "eval_bigbrother_wer": 0.5557077257713687,
145
+ "step": 4900
146
+ },
147
+ {
148
+ "epoch": 5.0,
149
+ "grad_norm": 4.274389266967773,
150
+ "learning_rate": 9.026736842105264e-05,
151
+ "loss": 0.3654,
152
+ "step": 6125
153
+ },
154
+ {
155
+ "epoch": 5.0,
156
+ "eval_rundkast_loss": 0.29252347350120544,
157
+ "eval_rundkast_runtime": 31.5872,
158
+ "eval_rundkast_samples_per_second": 42.581,
159
+ "eval_rundkast_steps_per_second": 1.361,
160
+ "eval_rundkast_wer": 0.15701559020044542,
161
+ "step": 6125
162
+ },
163
+ {
164
+ "epoch": 5.0,
165
+ "eval_nb_samtale_loss": 0.5537768006324768,
166
+ "eval_nb_samtale_runtime": 36.3537,
167
+ "eval_nb_samtale_samples_per_second": 14.662,
168
+ "eval_nb_samtale_steps_per_second": 0.468,
169
+ "eval_nb_samtale_wer": 0.23079427083333334,
170
+ "step": 6125
171
+ },
172
+ {
173
+ "epoch": 5.0,
174
+ "eval_bigbrother_loss": 2.0775458812713623,
175
+ "eval_bigbrother_runtime": 39.681,
176
+ "eval_bigbrother_samples_per_second": 34.525,
177
+ "eval_bigbrother_steps_per_second": 1.084,
178
+ "eval_bigbrother_wer": 0.5554660436639007,
179
+ "step": 6125
180
+ },
181
+ {
182
+ "epoch": 6.0,
183
+ "grad_norm": 5.030076026916504,
184
+ "learning_rate": 8.769052631578948e-05,
185
+ "loss": 0.3452,
186
+ "step": 7350
187
+ },
188
+ {
189
+ "epoch": 6.0,
190
+ "eval_rundkast_loss": 0.29516521096229553,
191
+ "eval_rundkast_runtime": 31.5112,
192
+ "eval_rundkast_samples_per_second": 42.683,
193
+ "eval_rundkast_steps_per_second": 1.365,
194
+ "eval_rundkast_wer": 0.15089086859688197,
195
+ "step": 7350
196
+ },
197
+ {
198
+ "epoch": 6.0,
199
+ "eval_nb_samtale_loss": 0.5526564717292786,
200
+ "eval_nb_samtale_runtime": 36.1333,
201
+ "eval_nb_samtale_samples_per_second": 14.751,
202
+ "eval_nb_samtale_steps_per_second": 0.47,
203
+ "eval_nb_samtale_wer": 0.22517903645833334,
204
+ "step": 7350
205
+ },
206
+ {
207
+ "epoch": 6.0,
208
+ "eval_bigbrother_loss": 2.038280725479126,
209
+ "eval_bigbrother_runtime": 39.4829,
210
+ "eval_bigbrother_samples_per_second": 34.699,
211
+ "eval_bigbrother_steps_per_second": 1.089,
212
+ "eval_bigbrother_wer": 0.5402400708934182,
213
+ "step": 7350
214
+ },
215
+ {
216
+ "epoch": 7.0,
217
+ "grad_norm": 5.610586166381836,
218
+ "learning_rate": 8.511157894736842e-05,
219
+ "loss": 0.3301,
220
+ "step": 8575
221
+ },
222
+ {
223
+ "epoch": 7.0,
224
+ "eval_rundkast_loss": 0.27553433179855347,
225
+ "eval_rundkast_runtime": 31.4793,
226
+ "eval_rundkast_samples_per_second": 42.727,
227
+ "eval_rundkast_steps_per_second": 1.366,
228
+ "eval_rundkast_wer": 0.14460706331530385,
229
+ "step": 8575
230
+ },
231
+ {
232
+ "epoch": 7.0,
233
+ "eval_nb_samtale_loss": 0.5609863996505737,
234
+ "eval_nb_samtale_runtime": 36.0218,
235
+ "eval_nb_samtale_samples_per_second": 14.797,
236
+ "eval_nb_samtale_steps_per_second": 0.472,
237
+ "eval_nb_samtale_wer": 0.22281901041666666,
238
+ "step": 8575
239
+ },
240
+ {
241
+ "epoch": 7.0,
242
+ "eval_bigbrother_loss": 2.06436824798584,
243
+ "eval_bigbrother_runtime": 39.4099,
244
+ "eval_bigbrother_samples_per_second": 34.763,
245
+ "eval_bigbrother_steps_per_second": 1.091,
246
+ "eval_bigbrother_wer": 0.5374204463062918,
247
+ "step": 8575
248
+ },
249
+ {
250
+ "epoch": 8.0,
251
+ "grad_norm": 3.3816378116607666,
252
+ "learning_rate": 8.253263157894737e-05,
253
+ "loss": 0.3152,
254
+ "step": 9800
255
+ },
256
+ {
257
+ "epoch": 8.0,
258
+ "eval_rundkast_loss": 0.27358707785606384,
259
+ "eval_rundkast_runtime": 31.4538,
260
+ "eval_rundkast_samples_per_second": 42.761,
261
+ "eval_rundkast_steps_per_second": 1.367,
262
+ "eval_rundkast_wer": 0.14675469296850144,
263
+ "step": 9800
264
+ },
265
+ {
266
+ "epoch": 8.0,
267
+ "eval_nb_samtale_loss": 0.5373356938362122,
268
+ "eval_nb_samtale_runtime": 36.0235,
269
+ "eval_nb_samtale_samples_per_second": 14.796,
270
+ "eval_nb_samtale_steps_per_second": 0.472,
271
+ "eval_nb_samtale_wer": 0.2265625,
272
+ "step": 9800
273
+ },
274
+ {
275
+ "epoch": 8.0,
276
+ "eval_bigbrother_loss": 2.0022764205932617,
277
+ "eval_bigbrother_runtime": 39.5126,
278
+ "eval_bigbrother_samples_per_second": 34.673,
279
+ "eval_bigbrother_steps_per_second": 1.088,
280
+ "eval_bigbrother_wer": 0.5332312897768469,
281
+ "step": 9800
282
+ },
283
+ {
284
+ "epoch": 9.0,
285
+ "grad_norm": 2.7853925228118896,
286
+ "learning_rate": 7.995578947368422e-05,
287
+ "loss": 0.301,
288
+ "step": 11025
289
+ },
290
+ {
291
+ "epoch": 9.0,
292
+ "eval_rundkast_loss": 0.257459819316864,
293
+ "eval_rundkast_runtime": 31.4423,
294
+ "eval_rundkast_samples_per_second": 42.777,
295
+ "eval_rundkast_steps_per_second": 1.368,
296
+ "eval_rundkast_wer": 0.14293668469615017,
297
+ "step": 11025
298
+ },
299
+ {
300
+ "epoch": 9.0,
301
+ "eval_nb_samtale_loss": 0.5285869240760803,
302
+ "eval_nb_samtale_runtime": 36.2554,
303
+ "eval_nb_samtale_samples_per_second": 14.701,
304
+ "eval_nb_samtale_steps_per_second": 0.469,
305
+ "eval_nb_samtale_wer": 0.22509765625,
306
+ "step": 11025
307
+ },
308
+ {
309
+ "epoch": 9.0,
310
+ "eval_bigbrother_loss": 2.0163955688476562,
311
+ "eval_bigbrother_runtime": 39.6281,
312
+ "eval_bigbrother_samples_per_second": 34.571,
313
+ "eval_bigbrother_steps_per_second": 1.085,
314
+ "eval_bigbrother_wer": 0.5354869894465479,
315
+ "step": 11025
316
+ },
317
+ {
318
+ "epoch": 10.0,
319
+ "grad_norm": 2.2737765312194824,
320
+ "learning_rate": 7.737684210526317e-05,
321
+ "loss": 0.2912,
322
+ "step": 12250
323
+ },
324
+ {
325
+ "epoch": 10.0,
326
+ "eval_rundkast_loss": 0.2834290564060211,
327
+ "eval_rundkast_runtime": 31.605,
328
+ "eval_rundkast_samples_per_second": 42.557,
329
+ "eval_rundkast_steps_per_second": 1.361,
330
+ "eval_rundkast_wer": 0.14230034998409163,
331
+ "step": 12250
332
+ },
333
+ {
334
+ "epoch": 10.0,
335
+ "eval_nb_samtale_loss": 0.524945080280304,
336
+ "eval_nb_samtale_runtime": 36.2711,
337
+ "eval_nb_samtale_samples_per_second": 14.695,
338
+ "eval_nb_samtale_steps_per_second": 0.469,
339
+ "eval_nb_samtale_wer": 0.21956380208333334,
340
+ "step": 12250
341
+ },
342
+ {
343
+ "epoch": 10.0,
344
+ "eval_bigbrother_loss": 2.0072944164276123,
345
+ "eval_bigbrother_runtime": 39.7952,
346
+ "eval_bigbrother_samples_per_second": 34.426,
347
+ "eval_bigbrother_steps_per_second": 1.081,
348
+ "eval_bigbrother_wer": 0.5287198904374446,
349
+ "step": 12250
350
+ },
351
+ {
352
+ "epoch": 11.0,
353
+ "grad_norm": 4.1641364097595215,
354
+ "learning_rate": 7.479789473684211e-05,
355
+ "loss": 0.2818,
356
+ "step": 13475
357
+ },
358
+ {
359
+ "epoch": 11.0,
360
+ "eval_rundkast_loss": 0.291464626789093,
361
+ "eval_rundkast_runtime": 31.4279,
362
+ "eval_rundkast_samples_per_second": 42.796,
363
+ "eval_rundkast_steps_per_second": 1.368,
364
+ "eval_rundkast_wer": 0.1403118040089087,
365
+ "step": 13475
366
+ },
367
+ {
368
+ "epoch": 11.0,
369
+ "eval_nb_samtale_loss": 0.5573220252990723,
370
+ "eval_nb_samtale_runtime": 35.8245,
371
+ "eval_nb_samtale_samples_per_second": 14.878,
372
+ "eval_nb_samtale_steps_per_second": 0.475,
373
+ "eval_nb_samtale_wer": 0.21744791666666666,
374
+ "step": 13475
375
+ },
376
+ {
377
+ "epoch": 11.0,
378
+ "eval_bigbrother_loss": 2.2074215412139893,
379
+ "eval_bigbrother_runtime": 39.3859,
380
+ "eval_bigbrother_samples_per_second": 34.784,
381
+ "eval_bigbrother_steps_per_second": 1.092,
382
+ "eval_bigbrother_wer": 0.5279142834125513,
383
+ "step": 13475
384
+ },
385
+ {
386
+ "epoch": 12.0,
387
+ "grad_norm": 2.796776533126831,
388
+ "learning_rate": 7.222105263157896e-05,
389
+ "loss": 0.2718,
390
+ "step": 14700
391
+ },
392
+ {
393
+ "epoch": 12.0,
394
+ "eval_rundkast_loss": 0.2955363988876343,
395
+ "eval_rundkast_runtime": 31.4317,
396
+ "eval_rundkast_samples_per_second": 42.791,
397
+ "eval_rundkast_steps_per_second": 1.368,
398
+ "eval_rundkast_wer": 0.1376869233216672,
399
+ "step": 14700
400
+ },
401
+ {
402
+ "epoch": 12.0,
403
+ "eval_nb_samtale_loss": 0.5371569991111755,
404
+ "eval_nb_samtale_runtime": 36.1485,
405
+ "eval_nb_samtale_samples_per_second": 14.745,
406
+ "eval_nb_samtale_steps_per_second": 0.47,
407
+ "eval_nb_samtale_wer": 0.21891276041666666,
408
+ "step": 14700
409
+ },
410
+ {
411
+ "epoch": 12.0,
412
+ "eval_bigbrother_loss": 2.0551300048828125,
413
+ "eval_bigbrother_runtime": 39.5331,
414
+ "eval_bigbrother_samples_per_second": 34.655,
415
+ "eval_bigbrother_steps_per_second": 1.088,
416
+ "eval_bigbrother_wer": 0.524611294610489,
417
+ "step": 14700
418
+ },
419
+ {
420
+ "epoch": 13.0,
421
+ "grad_norm": 2.6839964389801025,
422
+ "learning_rate": 6.96442105263158e-05,
423
+ "loss": 0.2614,
424
+ "step": 15925
425
+ },
426
+ {
427
+ "epoch": 13.0,
428
+ "eval_rundkast_loss": 0.28540924191474915,
429
+ "eval_rundkast_runtime": 32.0138,
430
+ "eval_rundkast_samples_per_second": 42.013,
431
+ "eval_rundkast_steps_per_second": 1.343,
432
+ "eval_rundkast_wer": 0.13959592745784283,
433
+ "step": 15925
434
+ },
435
+ {
436
+ "epoch": 13.0,
437
+ "eval_nb_samtale_loss": 0.5376082062721252,
438
+ "eval_nb_samtale_runtime": 36.0007,
439
+ "eval_nb_samtale_samples_per_second": 14.805,
440
+ "eval_nb_samtale_steps_per_second": 0.472,
441
+ "eval_nb_samtale_wer": 0.215087890625,
442
+ "step": 15925
443
+ },
444
+ {
445
+ "epoch": 13.0,
446
+ "eval_bigbrother_loss": 2.0468454360961914,
447
+ "eval_bigbrother_runtime": 39.695,
448
+ "eval_bigbrother_samples_per_second": 34.513,
449
+ "eval_bigbrother_steps_per_second": 1.083,
450
+ "eval_bigbrother_wer": 0.5228389591557239,
451
+ "step": 15925
452
+ },
453
+ {
454
+ "epoch": 14.0,
455
+ "grad_norm": 2.8357603549957275,
456
+ "learning_rate": 6.706526315789474e-05,
457
+ "loss": 0.2556,
458
+ "step": 17150
459
+ },
460
+ {
461
+ "epoch": 14.0,
462
+ "eval_rundkast_loss": 0.34074199199676514,
463
+ "eval_rundkast_runtime": 31.6633,
464
+ "eval_rundkast_samples_per_second": 42.478,
465
+ "eval_rundkast_steps_per_second": 1.358,
466
+ "eval_rundkast_wer": 0.13728921412663062,
467
+ "step": 17150
468
+ },
469
+ {
470
+ "epoch": 14.0,
471
+ "eval_nb_samtale_loss": 0.5684360861778259,
472
+ "eval_nb_samtale_runtime": 35.7903,
473
+ "eval_nb_samtale_samples_per_second": 14.892,
474
+ "eval_nb_samtale_steps_per_second": 0.475,
475
+ "eval_nb_samtale_wer": 0.214111328125,
476
+ "step": 17150
477
+ },
478
+ {
479
+ "epoch": 14.0,
480
+ "eval_bigbrother_loss": 2.249138593673706,
481
+ "eval_bigbrother_runtime": 39.6983,
482
+ "eval_bigbrother_samples_per_second": 34.51,
483
+ "eval_bigbrother_steps_per_second": 1.083,
484
+ "eval_bigbrother_wer": 0.5262225086602755,
485
+ "step": 17150
486
+ },
487
+ {
488
+ "epoch": 15.0,
489
+ "grad_norm": 4.659173965454102,
490
+ "learning_rate": 6.448842105263159e-05,
491
+ "loss": 0.2473,
492
+ "step": 18375
493
+ },
494
+ {
495
+ "epoch": 15.0,
496
+ "eval_rundkast_loss": 0.3245847225189209,
497
+ "eval_rundkast_runtime": 31.5529,
498
+ "eval_rundkast_samples_per_second": 42.627,
499
+ "eval_rundkast_steps_per_second": 1.363,
500
+ "eval_rundkast_wer": 0.13665287941457208,
501
+ "step": 18375
502
+ },
503
+ {
504
+ "epoch": 15.0,
505
+ "eval_nb_samtale_loss": 0.5528948307037354,
506
+ "eval_nb_samtale_runtime": 36.5998,
507
+ "eval_nb_samtale_samples_per_second": 14.563,
508
+ "eval_nb_samtale_steps_per_second": 0.464,
509
+ "eval_nb_samtale_wer": 0.21427408854166666,
510
+ "step": 18375
511
+ },
512
+ {
513
+ "epoch": 15.0,
514
+ "eval_bigbrother_loss": 2.2172372341156006,
515
+ "eval_bigbrother_runtime": 39.8062,
516
+ "eval_bigbrother_samples_per_second": 34.417,
517
+ "eval_bigbrother_steps_per_second": 1.08,
518
+ "eval_bigbrother_wer": 0.524611294610489,
519
+ "step": 18375
520
+ },
521
+ {
522
+ "epoch": 16.0,
523
+ "grad_norm": 4.046926975250244,
524
+ "learning_rate": 6.191157894736842e-05,
525
+ "loss": 0.2414,
526
+ "step": 19600
527
+ },
528
+ {
529
+ "epoch": 16.0,
530
+ "eval_rundkast_loss": 0.28036314249038696,
531
+ "eval_rundkast_runtime": 31.8175,
532
+ "eval_rundkast_samples_per_second": 42.272,
533
+ "eval_rundkast_steps_per_second": 1.351,
534
+ "eval_rundkast_wer": 0.1349825007954184,
535
+ "step": 19600
536
+ },
537
+ {
538
+ "epoch": 16.0,
539
+ "eval_nb_samtale_loss": 0.5292507410049438,
540
+ "eval_nb_samtale_runtime": 35.9006,
541
+ "eval_nb_samtale_samples_per_second": 14.847,
542
+ "eval_nb_samtale_steps_per_second": 0.474,
543
+ "eval_nb_samtale_wer": 0.21533203125,
544
+ "step": 19600
545
+ },
546
+ {
547
+ "epoch": 16.0,
548
+ "eval_bigbrother_loss": 2.0556137561798096,
549
+ "eval_bigbrother_runtime": 39.6218,
550
+ "eval_bigbrother_samples_per_second": 34.577,
551
+ "eval_bigbrother_steps_per_second": 1.085,
552
+ "eval_bigbrother_wer": 0.5206638201885121,
553
+ "step": 19600
554
+ },
555
+ {
556
+ "epoch": 17.0,
557
+ "grad_norm": 2.713061809539795,
558
+ "learning_rate": 5.933263157894737e-05,
559
+ "loss": 0.2328,
560
+ "step": 20825
561
+ },
562
+ {
563
+ "epoch": 17.0,
564
+ "eval_rundkast_loss": 0.3071937561035156,
565
+ "eval_rundkast_runtime": 31.6947,
566
+ "eval_rundkast_samples_per_second": 42.436,
567
+ "eval_rundkast_steps_per_second": 1.357,
568
+ "eval_rundkast_wer": 0.13490295895641108,
569
+ "step": 20825
570
+ },
571
+ {
572
+ "epoch": 17.0,
573
+ "eval_nb_samtale_loss": 0.5693681240081787,
574
+ "eval_nb_samtale_runtime": 35.8134,
575
+ "eval_nb_samtale_samples_per_second": 14.883,
576
+ "eval_nb_samtale_steps_per_second": 0.475,
577
+ "eval_nb_samtale_wer": 0.21476236979166666,
578
+ "step": 20825
579
+ },
580
+ {
581
+ "epoch": 17.0,
582
+ "eval_bigbrother_loss": 2.2417101860046387,
583
+ "eval_bigbrother_runtime": 39.6674,
584
+ "eval_bigbrother_samples_per_second": 34.537,
585
+ "eval_bigbrother_steps_per_second": 1.084,
586
+ "eval_bigbrother_wer": 0.5163135422540884,
587
+ "step": 20825
588
+ },
589
+ {
590
+ "epoch": 18.0,
591
+ "grad_norm": 3.662180185317993,
592
+ "learning_rate": 5.6753684210526313e-05,
593
+ "loss": 0.228,
594
+ "step": 22050
595
+ },
596
+ {
597
+ "epoch": 18.0,
598
+ "eval_rundkast_loss": 0.3300894796848297,
599
+ "eval_rundkast_runtime": 31.6144,
600
+ "eval_rundkast_samples_per_second": 42.544,
601
+ "eval_rundkast_steps_per_second": 1.36,
602
+ "eval_rundkast_wer": 0.13140311804008908,
603
+ "step": 22050
604
+ },
605
+ {
606
+ "epoch": 18.0,
607
+ "eval_nb_samtale_loss": 0.6102511286735535,
608
+ "eval_nb_samtale_runtime": 36.3906,
609
+ "eval_nb_samtale_samples_per_second": 14.647,
610
+ "eval_nb_samtale_steps_per_second": 0.467,
611
+ "eval_nb_samtale_wer": 0.21280924479166666,
612
+ "step": 22050
613
+ },
614
+ {
615
+ "epoch": 18.0,
616
+ "eval_bigbrother_loss": 2.433946371078491,
617
+ "eval_bigbrother_runtime": 39.8718,
618
+ "eval_bigbrother_samples_per_second": 34.36,
619
+ "eval_bigbrother_steps_per_second": 1.078,
620
+ "eval_bigbrother_wer": 0.5265447514702328,
621
+ "step": 22050
622
+ },
623
+ {
624
+ "epoch": 19.0,
625
+ "grad_norm": 3.2172813415527344,
626
+ "learning_rate": 5.417473684210527e-05,
627
+ "loss": 0.2227,
628
+ "step": 23275
629
+ },
630
+ {
631
+ "epoch": 19.0,
632
+ "eval_rundkast_loss": 0.2971687316894531,
633
+ "eval_rundkast_runtime": 31.7336,
634
+ "eval_rundkast_samples_per_second": 42.384,
635
+ "eval_rundkast_steps_per_second": 1.355,
636
+ "eval_rundkast_wer": 0.12949411390391347,
637
+ "step": 23275
638
+ },
639
+ {
640
+ "epoch": 19.0,
641
+ "eval_nb_samtale_loss": 0.5440128445625305,
642
+ "eval_nb_samtale_runtime": 35.6562,
643
+ "eval_nb_samtale_samples_per_second": 14.948,
644
+ "eval_nb_samtale_steps_per_second": 0.477,
645
+ "eval_nb_samtale_wer": 0.21337890625,
646
+ "step": 23275
647
+ },
648
+ {
649
+ "epoch": 19.0,
650
+ "eval_bigbrother_loss": 2.229306936264038,
651
+ "eval_bigbrother_runtime": 39.499,
652
+ "eval_bigbrother_samples_per_second": 34.684,
653
+ "eval_bigbrother_steps_per_second": 1.089,
654
+ "eval_bigbrother_wer": 0.5155884959316845,
655
+ "step": 23275
656
+ },
657
+ {
658
+ "epoch": 20.0,
659
+ "grad_norm": 3.76371431350708,
660
+ "learning_rate": 5.159789473684211e-05,
661
+ "loss": 0.2201,
662
+ "step": 24500
663
+ },
664
+ {
665
+ "epoch": 20.0,
666
+ "eval_rundkast_loss": 0.33149319887161255,
667
+ "eval_rundkast_runtime": 31.7066,
668
+ "eval_rundkast_samples_per_second": 42.42,
669
+ "eval_rundkast_steps_per_second": 1.356,
670
+ "eval_rundkast_wer": 0.13211899459115495,
671
+ "step": 24500
672
+ },
673
+ {
674
+ "epoch": 20.0,
675
+ "eval_nb_samtale_loss": 0.5641424655914307,
676
+ "eval_nb_samtale_runtime": 35.6835,
677
+ "eval_nb_samtale_samples_per_second": 14.937,
678
+ "eval_nb_samtale_steps_per_second": 0.476,
679
+ "eval_nb_samtale_wer": 0.214599609375,
680
+ "step": 24500
681
+ },
682
+ {
683
+ "epoch": 20.0,
684
+ "eval_bigbrother_loss": 2.2568540573120117,
685
+ "eval_bigbrother_runtime": 39.6597,
686
+ "eval_bigbrother_samples_per_second": 34.544,
687
+ "eval_bigbrother_steps_per_second": 1.084,
688
+ "eval_bigbrother_wer": 0.5247724160154676,
689
+ "step": 24500
690
+ },
691
+ {
692
+ "epoch": 21.0,
693
+ "grad_norm": 2.644437789916992,
694
+ "learning_rate": 4.9018947368421054e-05,
695
+ "loss": 0.2104,
696
+ "step": 25725
697
+ },
698
+ {
699
+ "epoch": 21.0,
700
+ "eval_rundkast_loss": 0.32245177030563354,
701
+ "eval_rundkast_runtime": 31.7772,
702
+ "eval_rundkast_samples_per_second": 42.326,
703
+ "eval_rundkast_steps_per_second": 1.353,
704
+ "eval_rundkast_wer": 0.1305281578110086,
705
+ "step": 25725
706
+ },
707
+ {
708
+ "epoch": 21.0,
709
+ "eval_nb_samtale_loss": 0.5810007452964783,
710
+ "eval_nb_samtale_runtime": 36.1863,
711
+ "eval_nb_samtale_samples_per_second": 14.729,
712
+ "eval_nb_samtale_steps_per_second": 0.47,
713
+ "eval_nb_samtale_wer": 0.2138671875,
714
+ "step": 25725
715
+ },
716
+ {
717
+ "epoch": 21.0,
718
+ "eval_bigbrother_loss": 2.2536792755126953,
719
+ "eval_bigbrother_runtime": 40.2452,
720
+ "eval_bigbrother_samples_per_second": 34.041,
721
+ "eval_bigbrother_steps_per_second": 1.068,
722
+ "eval_bigbrother_wer": 0.514218963989366,
723
+ "step": 25725
724
+ },
725
+ {
726
+ "epoch": 22.0,
727
+ "grad_norm": 4.817940711975098,
728
+ "learning_rate": 4.64421052631579e-05,
729
+ "loss": 0.2078,
730
+ "step": 26950
731
+ },
732
+ {
733
+ "epoch": 22.0,
734
+ "eval_rundkast_loss": 0.30675747990608215,
735
+ "eval_rundkast_runtime": 31.923,
736
+ "eval_rundkast_samples_per_second": 42.133,
737
+ "eval_rundkast_steps_per_second": 1.347,
738
+ "eval_rundkast_wer": 0.13068724148902322,
739
+ "step": 26950
740
+ },
741
+ {
742
+ "epoch": 22.0,
743
+ "eval_nb_samtale_loss": 0.5920718312263489,
744
+ "eval_nb_samtale_runtime": 35.946,
745
+ "eval_nb_samtale_samples_per_second": 14.828,
746
+ "eval_nb_samtale_steps_per_second": 0.473,
747
+ "eval_nb_samtale_wer": 0.21085611979166666,
748
+ "step": 26950
749
+ },
750
+ {
751
+ "epoch": 22.0,
752
+ "eval_bigbrother_loss": 2.283834457397461,
753
+ "eval_bigbrother_runtime": 39.6029,
754
+ "eval_bigbrother_samples_per_second": 34.593,
755
+ "eval_bigbrother_steps_per_second": 1.086,
756
+ "eval_bigbrother_wer": 0.5115604608072183,
757
+ "step": 26950
758
+ },
759
+ {
760
+ "epoch": 23.0,
761
+ "grad_norm": 2.2001821994781494,
762
+ "learning_rate": 4.3863157894736846e-05,
763
+ "loss": 0.2039,
764
+ "step": 28175
765
+ },
766
+ {
767
+ "epoch": 23.0,
768
+ "eval_rundkast_loss": 0.31590384244918823,
769
+ "eval_rundkast_runtime": 31.6509,
770
+ "eval_rundkast_samples_per_second": 42.495,
771
+ "eval_rundkast_steps_per_second": 1.359,
772
+ "eval_rundkast_wer": 0.13005090677696468,
773
+ "step": 28175
774
+ },
775
+ {
776
+ "epoch": 23.0,
777
+ "eval_nb_samtale_loss": 0.5807461142539978,
778
+ "eval_nb_samtale_runtime": 35.4812,
779
+ "eval_nb_samtale_samples_per_second": 15.022,
780
+ "eval_nb_samtale_steps_per_second": 0.479,
781
+ "eval_nb_samtale_wer": 0.21044921875,
782
+ "step": 28175
783
+ },
784
+ {
785
+ "epoch": 23.0,
786
+ "eval_bigbrother_loss": 2.346367835998535,
787
+ "eval_bigbrother_runtime": 39.6789,
788
+ "eval_bigbrother_samples_per_second": 34.527,
789
+ "eval_bigbrother_steps_per_second": 1.084,
790
+ "eval_bigbrother_wer": 0.5138161604769194,
791
+ "step": 28175
792
+ },
793
+ {
794
+ "epoch": 24.0,
795
+ "grad_norm": 3.352459669113159,
796
+ "learning_rate": 4.128631578947368e-05,
797
+ "loss": 0.1973,
798
+ "step": 29400
799
+ },
800
+ {
801
+ "epoch": 24.0,
802
+ "eval_rundkast_loss": 0.3300403654575348,
803
+ "eval_rundkast_runtime": 31.6022,
804
+ "eval_rundkast_samples_per_second": 42.56,
805
+ "eval_rundkast_steps_per_second": 1.361,
806
+ "eval_rundkast_wer": 0.1322780782691696,
807
+ "step": 29400
808
+ },
809
+ {
810
+ "epoch": 24.0,
811
+ "eval_nb_samtale_loss": 0.5806035995483398,
812
+ "eval_nb_samtale_runtime": 35.9632,
813
+ "eval_nb_samtale_samples_per_second": 14.821,
814
+ "eval_nb_samtale_steps_per_second": 0.473,
815
+ "eval_nb_samtale_wer": 0.21126302083333334,
816
+ "step": 29400
817
+ },
818
+ {
819
+ "epoch": 24.0,
820
+ "eval_bigbrother_loss": 2.317692518234253,
821
+ "eval_bigbrother_runtime": 40.1241,
822
+ "eval_bigbrother_samples_per_second": 34.144,
823
+ "eval_bigbrother_steps_per_second": 1.072,
824
+ "eval_bigbrother_wer": 0.5184081205188109,
825
+ "step": 29400
826
+ },
827
+ {
828
+ "epoch": 25.0,
829
+ "grad_norm": 2.7289795875549316,
830
+ "learning_rate": 3.870736842105263e-05,
831
+ "loss": 0.1962,
832
+ "step": 30625
833
+ },
834
+ {
835
+ "epoch": 25.0,
836
+ "eval_rundkast_loss": 0.34277400374412537,
837
+ "eval_rundkast_runtime": 32.0615,
838
+ "eval_rundkast_samples_per_second": 41.951,
839
+ "eval_rundkast_steps_per_second": 1.341,
840
+ "eval_rundkast_wer": 0.1319599109131403,
841
+ "step": 30625
842
+ },
843
+ {
844
+ "epoch": 25.0,
845
+ "eval_nb_samtale_loss": 0.6326170563697815,
846
+ "eval_nb_samtale_runtime": 35.8107,
847
+ "eval_nb_samtale_samples_per_second": 14.884,
848
+ "eval_nb_samtale_steps_per_second": 0.475,
849
+ "eval_nb_samtale_wer": 0.21183268229166666,
850
+ "step": 30625
851
+ },
852
+ {
853
+ "epoch": 25.0,
854
+ "eval_bigbrother_loss": 2.443657875061035,
855
+ "eval_bigbrother_runtime": 39.6514,
856
+ "eval_bigbrother_samples_per_second": 34.551,
857
+ "eval_bigbrother_steps_per_second": 1.084,
858
+ "eval_bigbrother_wer": 0.5142995246918554,
859
+ "step": 30625
860
+ },
861
+ {
862
+ "epoch": 26.0,
863
+ "grad_norm": 3.723717212677002,
864
+ "learning_rate": 3.612842105263158e-05,
865
+ "loss": 0.1887,
866
+ "step": 31850
867
+ },
868
+ {
869
+ "epoch": 26.0,
870
+ "eval_rundkast_loss": 0.32608622312545776,
871
+ "eval_rundkast_runtime": 31.9056,
872
+ "eval_rundkast_samples_per_second": 42.156,
873
+ "eval_rundkast_steps_per_second": 1.348,
874
+ "eval_rundkast_wer": 0.13267578746420616,
875
+ "step": 31850
876
+ },
877
+ {
878
+ "epoch": 26.0,
879
+ "eval_nb_samtale_loss": 0.6086393594741821,
880
+ "eval_nb_samtale_runtime": 35.8839,
881
+ "eval_nb_samtale_samples_per_second": 14.853,
882
+ "eval_nb_samtale_steps_per_second": 0.474,
883
+ "eval_nb_samtale_wer": 0.21004231770833334,
884
+ "step": 31850
885
+ },
886
+ {
887
+ "epoch": 26.0,
888
+ "eval_bigbrother_loss": 2.344693422317505,
889
+ "eval_bigbrother_runtime": 39.7842,
890
+ "eval_bigbrother_samples_per_second": 34.436,
891
+ "eval_bigbrother_steps_per_second": 1.081,
892
+ "eval_bigbrother_wer": 0.5134939176669621,
893
+ "step": 31850
894
+ },
895
+ {
896
+ "epoch": 27.0,
897
+ "grad_norm": 3.741575241088867,
898
+ "learning_rate": 3.3551578947368424e-05,
899
+ "loss": 0.1886,
900
+ "step": 33075
901
+ },
902
+ {
903
+ "epoch": 27.0,
904
+ "eval_rundkast_loss": 0.32595619559288025,
905
+ "eval_rundkast_runtime": 31.7292,
906
+ "eval_rundkast_samples_per_second": 42.39,
907
+ "eval_rundkast_steps_per_second": 1.355,
908
+ "eval_rundkast_wer": 0.13164174355711103,
909
+ "step": 33075
910
+ },
911
+ {
912
+ "epoch": 27.0,
913
+ "eval_nb_samtale_loss": 0.6121112704277039,
914
+ "eval_nb_samtale_runtime": 35.7885,
915
+ "eval_nb_samtale_samples_per_second": 14.893,
916
+ "eval_nb_samtale_steps_per_second": 0.475,
917
+ "eval_nb_samtale_wer": 0.20890299479166666,
918
+ "step": 33075
919
+ },
920
+ {
921
+ "epoch": 27.0,
922
+ "eval_bigbrother_loss": 2.368227005004883,
923
+ "eval_bigbrother_runtime": 39.9121,
924
+ "eval_bigbrother_samples_per_second": 34.325,
925
+ "eval_bigbrother_steps_per_second": 1.077,
926
+ "eval_bigbrother_wer": 0.511238217997261,
927
+ "step": 33075
928
+ },
929
+ {
930
+ "epoch": 28.0,
931
+ "grad_norm": 5.783115863800049,
932
+ "learning_rate": 3.097263157894737e-05,
933
+ "loss": 0.1836,
934
+ "step": 34300
935
+ },
936
+ {
937
+ "epoch": 28.0,
938
+ "eval_rundkast_loss": 0.33696532249450684,
939
+ "eval_rundkast_runtime": 31.5417,
940
+ "eval_rundkast_samples_per_second": 42.642,
941
+ "eval_rundkast_steps_per_second": 1.363,
942
+ "eval_rundkast_wer": 0.12949411390391347,
943
+ "step": 34300
944
+ },
945
+ {
946
+ "epoch": 28.0,
947
+ "eval_nb_samtale_loss": 0.6101709008216858,
948
+ "eval_nb_samtale_runtime": 35.522,
949
+ "eval_nb_samtale_samples_per_second": 15.005,
950
+ "eval_nb_samtale_steps_per_second": 0.479,
951
+ "eval_nb_samtale_wer": 0.21012369791666666,
952
+ "step": 34300
953
+ },
954
+ {
955
+ "epoch": 28.0,
956
+ "eval_bigbrother_loss": 2.353733777999878,
957
+ "eval_bigbrother_runtime": 39.5513,
958
+ "eval_bigbrother_samples_per_second": 34.639,
959
+ "eval_bigbrother_steps_per_second": 1.087,
960
+ "eval_bigbrother_wer": 0.5056795295254974,
961
+ "step": 34300
962
+ },
963
+ {
964
+ "epoch": 29.0,
965
+ "grad_norm": 8.664693832397461,
966
+ "learning_rate": 2.8395789473684216e-05,
967
+ "loss": 0.1804,
968
+ "step": 35525
969
+ },
970
+ {
971
+ "epoch": 29.0,
972
+ "eval_rundkast_loss": 0.3452693819999695,
973
+ "eval_rundkast_runtime": 31.2833,
974
+ "eval_rundkast_samples_per_second": 42.994,
975
+ "eval_rundkast_steps_per_second": 1.375,
976
+ "eval_rundkast_wer": 0.1309258670060452,
977
+ "step": 35525
978
+ },
979
+ {
980
+ "epoch": 29.0,
981
+ "eval_nb_samtale_loss": 0.6237297654151917,
982
+ "eval_nb_samtale_runtime": 35.8619,
983
+ "eval_nb_samtale_samples_per_second": 14.863,
984
+ "eval_nb_samtale_steps_per_second": 0.474,
985
+ "eval_nb_samtale_wer": 0.21134440104166666,
986
+ "step": 35525
987
+ },
988
+ {
989
+ "epoch": 29.0,
990
+ "eval_bigbrother_loss": 2.3944995403289795,
991
+ "eval_bigbrother_runtime": 39.4367,
992
+ "eval_bigbrother_samples_per_second": 34.739,
993
+ "eval_bigbrother_steps_per_second": 1.09,
994
+ "eval_bigbrother_wer": 0.5084185934101345,
995
+ "step": 35525
996
+ },
997
+ {
998
+ "epoch": 30.0,
999
+ "grad_norm": 4.139631748199463,
1000
+ "learning_rate": 2.5818947368421053e-05,
1001
+ "loss": 0.1766,
1002
+ "step": 36750
1003
+ },
1004
+ {
1005
+ "epoch": 30.0,
1006
+ "eval_rundkast_loss": 0.3432329297065735,
1007
+ "eval_rundkast_runtime": 31.3849,
1008
+ "eval_rundkast_samples_per_second": 42.855,
1009
+ "eval_rundkast_steps_per_second": 1.37,
1010
+ "eval_rundkast_wer": 0.13020999045497933,
1011
+ "step": 36750
1012
+ },
1013
+ {
1014
+ "epoch": 30.0,
1015
+ "eval_nb_samtale_loss": 0.6131173968315125,
1016
+ "eval_nb_samtale_runtime": 35.6634,
1017
+ "eval_nb_samtale_samples_per_second": 14.945,
1018
+ "eval_nb_samtale_steps_per_second": 0.477,
1019
+ "eval_nb_samtale_wer": 0.21199544270833334,
1020
+ "step": 36750
1021
+ },
1022
+ {
1023
+ "epoch": 30.0,
1024
+ "eval_bigbrother_loss": 2.3949081897735596,
1025
+ "eval_bigbrother_runtime": 39.8587,
1026
+ "eval_bigbrother_samples_per_second": 34.371,
1027
+ "eval_bigbrother_steps_per_second": 1.079,
1028
+ "eval_bigbrother_wer": 0.510271489567389,
1029
+ "step": 36750
1030
+ },
1031
+ {
1032
+ "epoch": 31.0,
1033
+ "grad_norm": 3.3099727630615234,
1034
+ "learning_rate": 2.324e-05,
1035
+ "loss": 0.1767,
1036
+ "step": 37975
1037
+ },
1038
+ {
1039
+ "epoch": 31.0,
1040
+ "eval_rundkast_loss": 0.3425343930721283,
1041
+ "eval_rundkast_runtime": 31.3869,
1042
+ "eval_rundkast_samples_per_second": 42.852,
1043
+ "eval_rundkast_steps_per_second": 1.37,
1044
+ "eval_rundkast_wer": 0.1291759465478842,
1045
+ "step": 37975
1046
+ },
1047
+ {
1048
+ "epoch": 31.0,
1049
+ "eval_nb_samtale_loss": 0.6133290529251099,
1050
+ "eval_nb_samtale_runtime": 35.2473,
1051
+ "eval_nb_samtale_samples_per_second": 15.122,
1052
+ "eval_nb_samtale_steps_per_second": 0.482,
1053
+ "eval_nb_samtale_wer": 0.21044921875,
1054
+ "step": 37975
1055
+ },
1056
+ {
1057
+ "epoch": 31.0,
1058
+ "eval_bigbrother_loss": 2.503601312637329,
1059
+ "eval_bigbrother_runtime": 39.2061,
1060
+ "eval_bigbrother_samples_per_second": 34.944,
1061
+ "eval_bigbrother_steps_per_second": 1.097,
1062
+ "eval_bigbrother_wer": 0.5097881253524531,
1063
+ "step": 37975
1064
+ },
1065
+ {
1066
+ "epoch": 32.0,
1067
+ "grad_norm": 3.798198938369751,
1068
+ "learning_rate": 2.0661052631578946e-05,
1069
+ "loss": 0.1712,
1070
+ "step": 39200
1071
+ },
1072
+ {
1073
+ "epoch": 32.0,
1074
+ "eval_rundkast_loss": 0.3596391975879669,
1075
+ "eval_rundkast_runtime": 31.2765,
1076
+ "eval_rundkast_samples_per_second": 43.004,
1077
+ "eval_rundkast_steps_per_second": 1.375,
1078
+ "eval_rundkast_wer": 0.128380528157811,
1079
+ "step": 39200
1080
+ },
1081
+ {
1082
+ "epoch": 32.0,
1083
+ "eval_nb_samtale_loss": 0.6345717906951904,
1084
+ "eval_nb_samtale_runtime": 36.1693,
1085
+ "eval_nb_samtale_samples_per_second": 14.736,
1086
+ "eval_nb_samtale_steps_per_second": 0.47,
1087
+ "eval_nb_samtale_wer": 0.21036783854166666,
1088
+ "step": 39200
1089
+ },
1090
+ {
1091
+ "epoch": 32.0,
1092
+ "eval_bigbrother_loss": 2.506143569946289,
1093
+ "eval_bigbrother_runtime": 39.8743,
1094
+ "eval_bigbrother_samples_per_second": 34.358,
1095
+ "eval_bigbrother_steps_per_second": 1.078,
1096
+ "eval_bigbrother_wer": 0.5095464432449851,
1097
+ "step": 39200
1098
+ },
1099
+ {
1100
+ "epoch": 33.0,
1101
+ "grad_norm": 3.5819003582000732,
1102
+ "learning_rate": 1.8082105263157895e-05,
1103
+ "loss": 0.1712,
1104
+ "step": 40425
1105
+ },
1106
+ {
1107
+ "epoch": 33.0,
1108
+ "eval_rundkast_loss": 0.3613539934158325,
1109
+ "eval_rundkast_runtime": 31.3392,
1110
+ "eval_rundkast_samples_per_second": 42.918,
1111
+ "eval_rundkast_steps_per_second": 1.372,
1112
+ "eval_rundkast_wer": 0.12615335666560612,
1113
+ "step": 40425
1114
+ },
1115
+ {
1116
+ "epoch": 33.0,
1117
+ "eval_nb_samtale_loss": 0.644898533821106,
1118
+ "eval_nb_samtale_runtime": 35.4393,
1119
+ "eval_nb_samtale_samples_per_second": 15.04,
1120
+ "eval_nb_samtale_steps_per_second": 0.48,
1121
+ "eval_nb_samtale_wer": 0.20914713541666666,
1122
+ "step": 40425
1123
+ },
1124
+ {
1125
+ "epoch": 33.0,
1126
+ "eval_bigbrother_loss": 2.489149570465088,
1127
+ "eval_bigbrother_runtime": 39.804,
1128
+ "eval_bigbrother_samples_per_second": 34.419,
1129
+ "eval_bigbrother_steps_per_second": 1.08,
1130
+ "eval_bigbrother_wer": 0.5090630790300491,
1131
+ "step": 40425
1132
+ },
1133
+ {
1134
+ "epoch": 34.0,
1135
+ "grad_norm": 2.6166694164276123,
1136
+ "learning_rate": 1.5505263157894735e-05,
1137
+ "loss": 0.1695,
1138
+ "step": 41650
1139
+ },
1140
+ {
1141
+ "epoch": 34.0,
1142
+ "eval_rundkast_loss": 0.35184982419013977,
1143
+ "eval_rundkast_runtime": 31.6077,
1144
+ "eval_rundkast_samples_per_second": 42.553,
1145
+ "eval_rundkast_steps_per_second": 1.36,
1146
+ "eval_rundkast_wer": 0.1270283168946866,
1147
+ "step": 41650
1148
+ },
1149
+ {
1150
+ "epoch": 34.0,
1151
+ "eval_nb_samtale_loss": 0.6456120610237122,
1152
+ "eval_nb_samtale_runtime": 35.3576,
1153
+ "eval_nb_samtale_samples_per_second": 15.075,
1154
+ "eval_nb_samtale_steps_per_second": 0.481,
1155
+ "eval_nb_samtale_wer": 0.20882161458333334,
1156
+ "step": 41650
1157
+ },
1158
+ {
1159
+ "epoch": 34.0,
1160
+ "eval_bigbrother_loss": 2.4751737117767334,
1161
+ "eval_bigbrother_runtime": 39.4345,
1162
+ "eval_bigbrother_samples_per_second": 34.741,
1163
+ "eval_bigbrother_steps_per_second": 1.09,
1164
+ "eval_bigbrother_wer": 0.5080963506001772,
1165
+ "step": 41650
1166
+ },
1167
+ {
1168
+ "epoch": 35.0,
1169
+ "grad_norm": 6.071230411529541,
1170
+ "learning_rate": 1.2926315789473683e-05,
1171
+ "loss": 0.1676,
1172
+ "step": 42875
1173
+ },
1174
+ {
1175
+ "epoch": 35.0,
1176
+ "eval_rundkast_loss": 0.35817253589630127,
1177
+ "eval_rundkast_runtime": 30.8776,
1178
+ "eval_rundkast_samples_per_second": 43.559,
1179
+ "eval_rundkast_steps_per_second": 1.393,
1180
+ "eval_rundkast_wer": 0.12750556792873052,
1181
+ "step": 42875
1182
+ },
1183
+ {
1184
+ "epoch": 35.0,
1185
+ "eval_nb_samtale_loss": 0.6497420072555542,
1186
+ "eval_nb_samtale_runtime": 34.7758,
1187
+ "eval_nb_samtale_samples_per_second": 15.327,
1188
+ "eval_nb_samtale_steps_per_second": 0.489,
1189
+ "eval_nb_samtale_wer": 0.20947265625,
1190
+ "step": 42875
1191
+ },
1192
+ {
1193
+ "epoch": 35.0,
1194
+ "eval_bigbrother_loss": 2.4820265769958496,
1195
+ "eval_bigbrother_runtime": 38.7694,
1196
+ "eval_bigbrother_samples_per_second": 35.337,
1197
+ "eval_bigbrother_steps_per_second": 1.109,
1198
+ "eval_bigbrother_wer": 0.5096270039474744,
1199
+ "step": 42875
1200
+ },
1201
+ {
1202
+ "epoch": 36.0,
1203
+ "grad_norm": 2.893402338027954,
1204
+ "learning_rate": 1.0349473684210527e-05,
1205
+ "loss": 0.1659,
1206
+ "step": 44100
1207
+ },
1208
+ {
1209
+ "epoch": 36.0,
1210
+ "eval_rundkast_loss": 0.34894150495529175,
1211
+ "eval_rundkast_runtime": 30.9604,
1212
+ "eval_rundkast_samples_per_second": 43.443,
1213
+ "eval_rundkast_steps_per_second": 1.389,
1214
+ "eval_rundkast_wer": 0.1292554883868915,
1215
+ "step": 44100
1216
+ },
1217
+ {
1218
+ "epoch": 36.0,
1219
+ "eval_nb_samtale_loss": 0.6365802884101868,
1220
+ "eval_nb_samtale_runtime": 34.8009,
1221
+ "eval_nb_samtale_samples_per_second": 15.316,
1222
+ "eval_nb_samtale_steps_per_second": 0.488,
1223
+ "eval_nb_samtale_wer": 0.209716796875,
1224
+ "step": 44100
1225
+ },
1226
+ {
1227
+ "epoch": 36.0,
1228
+ "eval_bigbrother_loss": 2.4620020389556885,
1229
+ "eval_bigbrother_runtime": 38.8018,
1230
+ "eval_bigbrother_samples_per_second": 35.308,
1231
+ "eval_bigbrother_steps_per_second": 1.108,
1232
+ "eval_bigbrother_wer": 0.506807379360348,
1233
+ "step": 44100
1234
+ },
1235
+ {
1236
+ "epoch": 37.0,
1237
+ "grad_norm": 5.454699993133545,
1238
+ "learning_rate": 7.772631578947369e-06,
1239
+ "loss": 0.1664,
1240
+ "step": 45325
1241
+ },
1242
+ {
1243
+ "epoch": 37.0,
1244
+ "eval_rundkast_loss": 0.3684549033641815,
1245
+ "eval_rundkast_runtime": 31.1693,
1246
+ "eval_rundkast_samples_per_second": 43.151,
1247
+ "eval_rundkast_steps_per_second": 1.38,
1248
+ "eval_rundkast_wer": 0.12774419344575247,
1249
+ "step": 45325
1250
+ },
1251
+ {
1252
+ "epoch": 37.0,
1253
+ "eval_nb_samtale_loss": 0.6549723148345947,
1254
+ "eval_nb_samtale_runtime": 35.1429,
1255
+ "eval_nb_samtale_samples_per_second": 15.167,
1256
+ "eval_nb_samtale_steps_per_second": 0.484,
1257
+ "eval_nb_samtale_wer": 0.20939127604166666,
1258
+ "step": 45325
1259
+ },
1260
+ {
1261
+ "epoch": 37.0,
1262
+ "eval_bigbrother_loss": 2.510341167449951,
1263
+ "eval_bigbrother_runtime": 40.0407,
1264
+ "eval_bigbrother_samples_per_second": 34.215,
1265
+ "eval_bigbrother_steps_per_second": 1.074,
1266
+ "eval_bigbrother_wer": 0.5084991541126238,
1267
+ "step": 45325
1268
+ },
1269
+ {
1270
+ "epoch": 38.0,
1271
+ "grad_norm": 9.69826889038086,
1272
+ "learning_rate": 5.195789473684211e-06,
1273
+ "loss": 0.1636,
1274
+ "step": 46550
1275
+ },
1276
+ {
1277
+ "epoch": 38.0,
1278
+ "eval_rundkast_loss": 0.3660584092140198,
1279
+ "eval_rundkast_runtime": 31.1586,
1280
+ "eval_rundkast_samples_per_second": 43.166,
1281
+ "eval_rundkast_steps_per_second": 1.38,
1282
+ "eval_rundkast_wer": 0.12822144447979636,
1283
+ "step": 46550
1284
+ },
1285
+ {
1286
+ "epoch": 38.0,
1287
+ "eval_nb_samtale_loss": 0.6603749394416809,
1288
+ "eval_nb_samtale_runtime": 34.814,
1289
+ "eval_nb_samtale_samples_per_second": 15.31,
1290
+ "eval_nb_samtale_steps_per_second": 0.488,
1291
+ "eval_nb_samtale_wer": 0.20979817708333334,
1292
+ "step": 46550
1293
+ },
1294
+ {
1295
+ "epoch": 38.0,
1296
+ "eval_bigbrother_loss": 2.5397305488586426,
1297
+ "eval_bigbrother_runtime": 38.941,
1298
+ "eval_bigbrother_samples_per_second": 35.181,
1299
+ "eval_bigbrother_steps_per_second": 1.104,
1300
+ "eval_bigbrother_wer": 0.5069685007653266,
1301
+ "step": 46550
1302
+ },
1303
+ {
1304
+ "epoch": 39.0,
1305
+ "grad_norm": 3.9994399547576904,
1306
+ "learning_rate": 2.616842105263158e-06,
1307
+ "loss": 0.164,
1308
+ "step": 47775
1309
+ },
1310
+ {
1311
+ "epoch": 39.0,
1312
+ "eval_rundkast_loss": 0.3598625063896179,
1313
+ "eval_rundkast_runtime": 31.5329,
1314
+ "eval_rundkast_samples_per_second": 42.654,
1315
+ "eval_rundkast_steps_per_second": 1.364,
1316
+ "eval_rundkast_wer": 0.1279032771237671,
1317
+ "step": 47775
1318
+ },
1319
+ {
1320
+ "epoch": 39.0,
1321
+ "eval_nb_samtale_loss": 0.648256242275238,
1322
+ "eval_nb_samtale_runtime": 35.1662,
1323
+ "eval_nb_samtale_samples_per_second": 15.157,
1324
+ "eval_nb_samtale_steps_per_second": 0.483,
1325
+ "eval_nb_samtale_wer": 0.21004231770833334,
1326
+ "step": 47775
1327
+ },
1328
+ {
1329
+ "epoch": 39.0,
1330
+ "eval_bigbrother_loss": 2.485541820526123,
1331
+ "eval_bigbrother_runtime": 39.2215,
1332
+ "eval_bigbrother_samples_per_second": 34.93,
1333
+ "eval_bigbrother_steps_per_second": 1.096,
1334
+ "eval_bigbrother_wer": 0.5073713042777733,
1335
+ "step": 47775
1336
+ },
1337
+ {
1338
+ "epoch": 40.0,
1339
+ "grad_norm": 2.848135471343994,
1340
+ "learning_rate": 3.7894736842105265e-08,
1341
+ "loss": 0.1637,
1342
+ "step": 49000
1343
+ },
1344
+ {
1345
+ "epoch": 40.0,
1346
+ "eval_rundkast_loss": 0.3625843822956085,
1347
+ "eval_rundkast_runtime": 30.7724,
1348
+ "eval_rundkast_samples_per_second": 43.708,
1349
+ "eval_rundkast_steps_per_second": 1.397,
1350
+ "eval_rundkast_wer": 0.12885777919185493,
1351
+ "step": 49000
1352
+ },
1353
+ {
1354
+ "epoch": 40.0,
1355
+ "eval_nb_samtale_loss": 0.6490209698677063,
1356
+ "eval_nb_samtale_runtime": 34.7701,
1357
+ "eval_nb_samtale_samples_per_second": 15.329,
1358
+ "eval_nb_samtale_steps_per_second": 0.489,
1359
+ "eval_nb_samtale_wer": 0.21036783854166666,
1360
+ "step": 49000
1361
+ },
1362
+ {
1363
+ "epoch": 40.0,
1364
+ "eval_bigbrother_loss": 2.497987985610962,
1365
+ "eval_bigbrother_runtime": 38.8915,
1366
+ "eval_bigbrother_samples_per_second": 35.226,
1367
+ "eval_bigbrother_steps_per_second": 1.106,
1368
+ "eval_bigbrother_wer": 0.5075324256827519,
1369
+ "step": 49000
1370
+ }
1371
+ ],
1372
+ "logging_steps": 500,
1373
+ "max_steps": 49000,
1374
+ "num_input_tokens_seen": 0,
1375
+ "num_train_epochs": 40,
1376
+ "save_steps": 500,
1377
+ "total_flos": 2.392992748655231e+20,
1378
+ "train_batch_size": 48,
1379
+ "trial_name": null,
1380
+ "trial_params": null
1381
+ }
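The trainer state recorded above logs, for every epoch, one training entry (loss, grad_norm, learning_rate) and one evaluation entry per test set (Rundkast, NB Samtale, Big Brother) inside its log_history list. A minimal sketch for pulling the per-epoch WER curves back out of the file, assuming a local clone of this repo and that the hunk above belongs to checkpoint-49000/trainer_state.json (the path is inferred from the neighbouring checkpoint-49000 files, not stated in this excerpt):

import json

# Read the Trainer state saved with the final checkpoint.
with open("checkpoint-49000/trainer_state.json", encoding="utf-8") as f:
    state = json.load(f)

# Group the reported word error rates by evaluation set.
wer_by_set = {}
for entry in state["log_history"]:
    for key, value in entry.items():
        if key.startswith("eval_") and key.endswith("_wer"):
            name = key[len("eval_"):-len("_wer")]
            wer_by_set.setdefault(name, []).append((entry["epoch"], value))

for name, points in sorted(wer_by_set.items()):
    best_epoch, best_wer = min(points, key=lambda p: p[1])
    print(f"{name}: best WER {best_wer:.4f} at epoch {best_epoch:.0f}")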
checkpoint-49000/training_args.bin ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76b1726f88a10b6122b423394ba676a6e1dc0ef8bf3b3a06cb5dae0ad5561656
3
+ size 4984
config.json ADDED
@@ -0,0 +1,116 @@
1
+ {
2
+ "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
3
+ "activation_dropout": 0.055,
4
+ "adapter_attn_dim": null,
5
+ "adapter_kernel_size": 3,
6
+ "adapter_stride": 2,
7
+ "add_adapter": false,
8
+ "apply_spec_augment": true,
9
+ "architectures": [
10
+ "Wav2Vec2ForCTC"
11
+ ],
12
+ "attention_dropout": 0.094,
13
+ "bos_token_id": 1,
14
+ "classifier_proj_size": 256,
15
+ "codevector_dim": 768,
16
+ "contrastive_logits_temperature": 0.1,
17
+ "conv_bias": true,
18
+ "conv_dim": [
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512,
25
+ 512
26
+ ],
27
+ "conv_kernel": [
28
+ 10,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 3,
33
+ 2,
34
+ 2
35
+ ],
36
+ "conv_stride": [
37
+ 5,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2,
43
+ 2
44
+ ],
45
+ "ctc_loss_reduction": "mean",
46
+ "ctc_zero_infinity": true,
47
+ "diversity_loss_weight": 0.1,
48
+ "do_stable_layer_norm": true,
49
+ "eos_token_id": 2,
50
+ "feat_extract_activation": "gelu",
51
+ "feat_extract_dropout": 0.0,
52
+ "feat_extract_norm": "layer",
53
+ "feat_proj_dropout": 0.04,
54
+ "feat_quantizer_dropout": 0.0,
55
+ "final_dropout": 0.0,
56
+ "hidden_act": "gelu",
57
+ "hidden_dropout": 0.047,
58
+ "hidden_size": 1024,
59
+ "initializer_range": 0.02,
60
+ "intermediate_size": 4096,
61
+ "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.041,
63
+ "mask_channel_length": 10,
64
+ "mask_channel_min_space": 1,
65
+ "mask_channel_other": 0.0,
66
+ "mask_channel_prob": 0.0,
67
+ "mask_channel_selection": "static",
68
+ "mask_feature_length": 64,
69
+ "mask_feature_min_masks": 0,
70
+ "mask_feature_prob": 0.25,
71
+ "mask_time_length": 10,
72
+ "mask_time_min_masks": 2,
73
+ "mask_time_min_space": 1,
74
+ "mask_time_other": 0.0,
75
+ "mask_time_prob": 0.082,
76
+ "mask_time_selection": "static",
77
+ "model_type": "wav2vec2",
78
+ "num_adapter_layers": 3,
79
+ "num_attention_heads": 16,
80
+ "num_codevector_groups": 2,
81
+ "num_codevectors_per_group": 320,
82
+ "num_conv_pos_embedding_groups": 16,
83
+ "num_conv_pos_embeddings": 128,
84
+ "num_feat_extract_layers": 7,
85
+ "num_hidden_layers": 24,
86
+ "num_negatives": 100,
87
+ "output_hidden_size": 1024,
88
+ "pad_token_id": 31,
89
+ "proj_codevector_dim": 768,
90
+ "tdnn_dilation": [
91
+ 1,
92
+ 2,
93
+ 3,
94
+ 1,
95
+ 1
96
+ ],
97
+ "tdnn_dim": [
98
+ 512,
99
+ 512,
100
+ 512,
101
+ 512,
102
+ 1500
103
+ ],
104
+ "tdnn_kernel": [
105
+ 5,
106
+ 3,
107
+ 3,
108
+ 1,
109
+ 1
110
+ ],
111
+ "torch_dtype": "float32",
112
+ "transformers_version": "4.38.1",
113
+ "use_weighted_layer_sum": false,
114
+ "vocab_size": 34,
115
+ "xvector_output_dim": 512
116
+ }
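For a quick sanity check of the architecture, the hyperparameters in config.json can be inspected without downloading any weights; a small sketch, assuming transformers is installed and the file is read from a local clone:

from transformers import Wav2Vec2Config

# Parse the JSON shown above into a config object.
cfg = Wav2Vec2Config.from_json_file("config.json")

# A 24-layer wav2vec 2.0 encoder with a 34-symbol CTC vocabulary,
# fine-tuned from NbAiLab/nb-wav2vec2-300m-bokmaal.
print(cfg.num_hidden_layers, cfg.hidden_size, cfg.vocab_size)   # 24 1024 34
print(cfg.ctc_loss_reduction, cfg.pad_token_id)                 # mean 31 ([PAD] acts as the CTC blank)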
language_model/5gram.bin ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b41c24c63f2f0585bea83666369593f3b3e6d047f327a90f36ebca2c35ef0ff
3
+ size 4243671427
language_model/attrs.json ADDED
@@ -0,0 +1 @@
1
+ {"alpha": 0.5, "beta": 0.1, "unk_score_offset": -10.0, "score_boundary": true}
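language_model/attrs.json carries the shallow-fusion weights for the KenLM decoder: alpha scales the language-model score, beta is the word-insertion bonus, unk_score_offset penalises out-of-vocabulary words, and score_boundary enables sentence-boundary scoring. Wav2Vec2ProcessorWithLM picks these values up automatically, but the same decoder can be rebuilt by hand with pyctcdecode; a rough sketch, assuming pyctcdecode and kenlm are installed, the LFS files have been pulled, and the labels are read from alphabet.json at the repo root:

import json
from pyctcdecode import build_ctcdecoder

# CTC labels in vocabulary order, as stored in alphabet.json.
with open("alphabet.json", encoding="utf-8") as f:
    labels = json.load(f)["labels"]

with open("language_model/unigrams.txt", encoding="utf-8") as f:
    unigrams = [line.strip() for line in f]

# Re-use the weights from language_model/attrs.json shown above.
decoder = build_ctcdecoder(
    labels,
    kenlm_model_path="language_model/5gram.bin",
    unigrams=unigrams,
    alpha=0.5,
    beta=0.1,
    unk_score_offset=-10.0,
    lm_score_boundary=True,
)
# decoder.decode(logits) then expects a (time, vocab) numpy array of CTC logits.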
language_model/unigrams.txt ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac3e71ca49838ca355df6fdcb8d89344a5a9bf9e1a76587cdf5df1367c19b9a9
3
+ size 16759269
model.safetensors ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7b5c2997f82b0ae7618c7c41aa32b4e6d27cdbfb713bd96b3970a416d72bd39
3
+ size 1261946880
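The model weights themselves live in model.safetensors; the three lines above are only the Git LFS pointer (sha256 and size), so the real ~1.26 GB file arrives after git lfs pull. Once present, the tensors can be inspected directly; a minimal sketch, assuming the safetensors package is installed:

from safetensors.torch import load_file

# Load the fine-tuned weights as a plain PyTorch state dict.
state_dict = load_file("model.safetensors")
print(f"{len(state_dict)} tensors")
for name in list(state_dict)[:5]:
    print(name, tuple(state_dict[name].shape))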
preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "processor_class": "Wav2Vec2ProcessorWithLM",
8
+ "return_attention_mask": true,
9
+ "sampling_rate": 16000
10
+ }
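preprocessor_config.json wires the feature extractor to Wav2Vec2ProcessorWithLM and fixes the expected input at normalised 16 kHz mono audio. A rough end-to-end inference sketch, assuming a local clone with the LFS files pulled and a 16 kHz WAV file named sample.wav (the filename is only a placeholder):

import soundfile as sf
import torch
from transformers import Wav2Vec2ForCTC, Wav2Vec2ProcessorWithLM

model_dir = "."  # local clone of this repository
processor = Wav2Vec2ProcessorWithLM.from_pretrained(model_dir)
model = Wav2Vec2ForCTC.from_pretrained(model_dir)
model.eval()

# Load a mono waveform; it must already be sampled at 16 kHz (resample first otherwise).
speech, sample_rate = sf.read("sample.wav")
inputs = processor(speech, sampling_rate=16000, return_tensors="pt")

with torch.no_grad():
    logits = model(**inputs).logits  # (batch, time, vocab_size=34)

# batch_decode runs beam search with the 5-gram LM under language_model/.
transcription = processor.batch_decode(logits.numpy()).text[0]
print(transcription)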
runs/May30_19-47-26_idun-04-10/events.out.tfevents.1717092397.idun-04-10.304569.0 ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ff38f44da21cc78b2ad3f8669b075097677ac839c137ba06d2d19eaaae04074
3
+ size 45019
runs/May31_15-59-49_idun-04-10/events.out.tfevents.1717165018.idun-04-10.1353968.0 ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a71c8400cc9e795bc8c710e74456717e59c2f8cbefbabedadb00cfd525ab929
3
+ size 60141
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
1
+ {
2
+ "bos_token": "<s>",
3
+ "eos_token": "</s>",
4
+ "pad_token": "[PAD]",
5
+ "unk_token": "[UNK]"
6
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,47 @@
1
+ {
2
+ "added_tokens_decoder": {
3
+ "30": {
4
+ "content": "[UNK]",
5
+ "lstrip": true,
6
+ "normalized": false,
7
+ "rstrip": true,
8
+ "single_word": false,
9
+ "special": false
10
+ },
11
+ "31": {
12
+ "content": "[PAD]",
13
+ "lstrip": true,
14
+ "normalized": false,
15
+ "rstrip": true,
16
+ "single_word": false,
17
+ "special": false
18
+ },
19
+ "32": {
20
+ "content": "<s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "33": {
28
+ "content": "</s>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ }
35
+ },
36
+ "bos_token": "<s>",
37
+ "clean_up_tokenization_spaces": true,
38
+ "do_lower_case": false,
39
+ "eos_token": "</s>",
40
+ "model_max_length": 1000000000000000019884624838656,
41
+ "pad_token": "[PAD]",
42
+ "replace_word_delimiter_char": " ",
43
+ "target_lang": null,
44
+ "tokenizer_class": "Wav2Vec2CTCTokenizer",
45
+ "unk_token": "[UNK]",
46
+ "word_delimiter_token": "|"
47
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76b1726f88a10b6122b423394ba676a6e1dc0ef8bf3b3a06cb5dae0ad5561656
3
+ size 4984
vocab.json ADDED
@@ -0,0 +1,34 @@
1
+ {
2
+ "[PAD]": 31,
3
+ "[UNK]": 30,
4
+ "a": 1,
5
+ "b": 2,
6
+ "c": 3,
7
+ "d": 4,
8
+ "e": 5,
9
+ "f": 6,
10
+ "g": 7,
11
+ "h": 8,
12
+ "i": 9,
13
+ "j": 10,
14
+ "k": 11,
15
+ "l": 12,
16
+ "m": 13,
17
+ "n": 14,
18
+ "o": 15,
19
+ "p": 16,
20
+ "q": 17,
21
+ "r": 18,
22
+ "s": 19,
23
+ "t": 20,
24
+ "u": 21,
25
+ "v": 22,
26
+ "w": 23,
27
+ "x": 24,
28
+ "y": 25,
29
+ "z": 26,
30
+ "|": 0,
31
+ "å": 27,
32
+ "æ": 28,
33
+ "ø": 29
34
+ }
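vocab.json maps the CTC symbols to ids: "|" (id 0) is the word delimiter that becomes a space on decoding, [UNK] is 30, and [PAD] (id 31, matching pad_token_id in config.json) doubles as the CTC blank. For illustration, a plain greedy (argmax) decode can be written directly against this mapping, without the language model; a small sketch in which the random logits only exercise the function:

import json
import numpy as np

with open("vocab.json", encoding="utf-8") as f:
    vocab = json.load(f)
id_to_token = {idx: tok for tok, idx in vocab.items()}

def greedy_ctc_decode(logits: np.ndarray, blank_id: int = 31) -> str:
    """Collapse repeated ids, drop blanks, and map '|' back to spaces."""
    ids = logits.argmax(axis=-1)
    chars = []
    prev = None
    for i in ids:
        if i != prev and i != blank_id:
            # Ids not present in vocab.json (e.g. added special tokens) fall back to "".
            chars.append(id_to_token.get(int(i), ""))
        prev = i
    return "".join(chars).replace("|", " ").strip()

print(greedy_ctc_decode(np.random.randn(50, 34)))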