Tflatval committed on Jun 21

Commit

c5d740f

•

1 Parent(s): 13fa854

Upload folder using huggingface_hub

Browse files

Files changed (30) hide show

.gitattributes +1 -0
added_tokens.json +4 -0
alphabet.json +1 -0
checkpoint-59237/config.json +116 -0
checkpoint-59237/model.safetensors +3 -0
checkpoint-59237/optimizer.pt +3 -0
checkpoint-59237/preprocessor_config.json +10 -0
checkpoint-59237/rng_state.pth +3 -0
checkpoint-59237/scheduler.pt +3 -0
checkpoint-59237/trainer_state.json +1612 -0
checkpoint-59237/training_args.bin +3 -0
checkpoint-64040/config.json +116 -0
checkpoint-64040/model.safetensors +3 -0
checkpoint-64040/optimizer.pt +3 -0
checkpoint-64040/preprocessor_config.json +10 -0
checkpoint-64040/rng_state.pth +3 -0
checkpoint-64040/scheduler.pt +3 -0
checkpoint-64040/trainer_state.json +1741 -0
checkpoint-64040/training_args.bin +3 -0
config.json +116 -0
language_model/5gram.bin +3 -0
language_model/attrs.json +1 -0
language_model/unigrams.txt +3 -0
model.safetensors +3 -0
preprocessor_config.json +10 -0
runs/May30_23-02-47_idun-04-08/events.out.tfevents.1717104232.idun-04-08.1448637.0 +3 -0
special_tokens_map.json +6 -0
tokenizer_config.json +47 -0
training_args.bin +3 -0
vocab.json +34 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+language_model/unigrams.txt filter=lfs diff=lfs merge=lfs -text

added_tokens.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "</s>": 33,
+  "<s>": 32
+}

alphabet.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e5", "\u00e6", "\u00f8" ,"\u2047", "", "<s>", "</s>"], "is_bpe": false}

checkpoint-59237/config.json ADDED Viewed

	@@ -0,0 +1,116 @@

+{
+  "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
+  "activation_dropout": 0.055,
+  "adapter_attn_dim": null,
+  "adapter_kernel_size": 3,
+  "adapter_stride": 2,
+  "add_adapter": false,
+  "apply_spec_augment": true,
+  "architectures": [
+    "Wav2Vec2ForCTC"
+  ],
+  "attention_dropout": 0.094,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 768,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": true,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "mean",
+  "ctc_zero_infinity": true,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": true,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_dropout": 0.0,
+  "feat_extract_norm": "layer",
+  "feat_proj_dropout": 0.04,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.047,
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.041,
+  "mask_channel_length": 10,
+  "mask_channel_min_space": 1,
+  "mask_channel_other": 0.0,
+  "mask_channel_prob": 0.0,
+  "mask_channel_selection": "static",
+  "mask_feature_length": 64,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.25,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_min_space": 1,
+  "mask_time_other": 0.0,
+  "mask_time_prob": 0.082,
+  "mask_time_selection": "static",
+  "model_type": "wav2vec2",
+  "num_adapter_layers": 3,
+  "num_attention_heads": 16,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 24,
+  "num_negatives": 100,
+  "output_hidden_size": 1024,
+  "pad_token_id": 31,
+  "proj_codevector_dim": 768,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 34,
+  "xvector_output_dim": 512
+}

checkpoint-59237/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f1b72a8661985e694d6249ad4fdebdffc86644e0140a80ac60f082cfeac4024
+size 1261946880

checkpoint-59237/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c2c3b047ddb1c29b2bcc8839961a0f59f822fcd59f2b7fb8db16b5b13ea7112e
+size 2490438582

checkpoint-59237/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "processor_class": "Wav2Vec2ProcessorWithLM",
+  "return_attention_mask": true,
+  "sampling_rate": 16000
+}

checkpoint-59237/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5f13c8b13dacbc68a95a5bb675bf2afe6ed6c8101888da97f31a0462591c0db
+size 14308

checkpoint-59237/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab370388164fb385032b67eff9f30477507323458cd5a60ff10a4d4cc5e8f3b0
+size 1064

checkpoint-59237/trainer_state.json ADDED Viewed

	@@ -0,0 +1,1612 @@

+{
+  "best_metric": 0.2507504502701621,
+  "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/Combined/BB-RUND/30.05/checkpoint-59237",
+  "epoch": 37.0,
+  "eval_steps": 500,
+  "global_step": 59237,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "grad_norm": 3.5616490840911865,
+      "learning_rate": 9.984170131116086e-05,
+      "loss": 0.9316,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_rundkast_loss": 0.3094605803489685,
+      "eval_rundkast_runtime": 31.7263,
+      "eval_rundkast_samples_per_second": 42.394,
+      "eval_rundkast_steps_per_second": 1.355,
+      "eval_rundkast_wer": 0.18334393891186765,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_nb_samtale_loss": 0.5153853297233582,
+      "eval_nb_samtale_runtime": 36.9199,
+      "eval_nb_samtale_samples_per_second": 14.437,
+      "eval_nb_samtale_steps_per_second": 0.46,
+      "eval_nb_samtale_wer": 0.2501627604166667,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_BB_RUND_loss": 0.8934017419815063,
+      "eval_BB_RUND_runtime": 74.2605,
+      "eval_BB_RUND_samples_per_second": 36.56,
+      "eval_BB_RUND_steps_per_second": 1.145,
+      "eval_BB_RUND_wer": 0.3665399239543726,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_bigbrother_loss": 1.4666274785995483,
+      "eval_bigbrother_runtime": 39.9935,
+      "eval_bigbrother_samples_per_second": 34.256,
+      "eval_bigbrother_steps_per_second": 1.075,
+      "eval_bigbrother_wer": 0.5517602513493918,
+      "step": 1601
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 1.8291858434677124,
+      "learning_rate": 9.728173968660058e-05,
+      "loss": 0.7975,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_rundkast_loss": 0.27037981152534485,
+      "eval_rundkast_runtime": 31.304,
+      "eval_rundkast_samples_per_second": 42.966,
+      "eval_rundkast_steps_per_second": 1.374,
+      "eval_rundkast_wer": 0.17968501431753103,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_nb_samtale_loss": 0.4818350672721863,
+      "eval_nb_samtale_runtime": 36.3495,
+      "eval_nb_samtale_samples_per_second": 14.663,
+      "eval_nb_samtale_steps_per_second": 0.468,
+      "eval_nb_samtale_wer": 0.2549641927083333,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_BB_RUND_loss": 0.7777431607246399,
+      "eval_BB_RUND_runtime": 74.0457,
+      "eval_BB_RUND_samples_per_second": 36.667,
+      "eval_BB_RUND_steps_per_second": 1.148,
+      "eval_BB_RUND_wer": 0.3568941364818891,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_bigbrother_loss": 1.2756603956222534,
+      "eval_bigbrother_runtime": 39.2125,
+      "eval_bigbrother_samples_per_second": 34.938,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.5356481108515266,
+      "step": 3202
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 1.1911417245864868,
+      "learning_rate": 9.472337703869524e-05,
+      "loss": 0.7318,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_rundkast_loss": 0.2820556163787842,
+      "eval_rundkast_runtime": 31.3992,
+      "eval_rundkast_samples_per_second": 42.835,
+      "eval_rundkast_steps_per_second": 1.369,
+      "eval_rundkast_wer": 0.16679923639834554,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_nb_samtale_loss": 0.4887722134590149,
+      "eval_nb_samtale_runtime": 36.3679,
+      "eval_nb_samtale_samples_per_second": 14.656,
+      "eval_nb_samtale_steps_per_second": 0.467,
+      "eval_nb_samtale_wer": 0.23697916666666666,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_BB_RUND_loss": 0.7739498615264893,
+      "eval_BB_RUND_runtime": 74.2643,
+      "eval_BB_RUND_samples_per_second": 36.559,
+      "eval_BB_RUND_steps_per_second": 1.145,
+      "eval_BB_RUND_wer": 0.3293976385831499,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_bigbrother_loss": 1.256850004196167,
+      "eval_bigbrother_runtime": 39.3324,
+      "eval_bigbrother_samples_per_second": 34.831,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.49343430274711997,
+      "step": 4803
+    },
+    {
+      "epoch": 4.0,
+      "grad_norm": 1.5012503862380981,
+      "learning_rate": 9.216341541413495e-05,
+      "loss": 0.6896,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_rundkast_loss": 0.2698061466217041,
+      "eval_rundkast_runtime": 31.5141,
+      "eval_rundkast_samples_per_second": 42.679,
+      "eval_rundkast_steps_per_second": 1.364,
+      "eval_rundkast_wer": 0.1590836780146357,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_nb_samtale_loss": 0.46429482102394104,
+      "eval_nb_samtale_runtime": 36.1366,
+      "eval_nb_samtale_samples_per_second": 14.75,
+      "eval_nb_samtale_steps_per_second": 0.47,
+      "eval_nb_samtale_wer": 0.22770182291666666,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_BB_RUND_loss": 0.7106366157531738,
+      "eval_BB_RUND_runtime": 74.1602,
+      "eval_BB_RUND_samples_per_second": 36.61,
+      "eval_BB_RUND_steps_per_second": 1.146,
+      "eval_BB_RUND_wer": 0.3115469281568941,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_bigbrother_loss": 1.1434192657470703,
+      "eval_bigbrother_runtime": 39.4465,
+      "eval_bigbrother_samples_per_second": 34.731,
+      "eval_bigbrother_steps_per_second": 1.09,
+      "eval_bigbrother_wer": 0.4657214210907919,
+      "step": 6404
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1.3953436613082886,
+      "learning_rate": 8.960345378957467e-05,
+      "loss": 0.6527,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_rundkast_loss": 0.3087877333164215,
+      "eval_rundkast_runtime": 31.2187,
+      "eval_rundkast_samples_per_second": 43.083,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.15717467387846007,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_nb_samtale_loss": 0.498180627822876,
+      "eval_nb_samtale_runtime": 36.0025,
+      "eval_nb_samtale_samples_per_second": 14.805,
+      "eval_nb_samtale_steps_per_second": 0.472,
+      "eval_nb_samtale_wer": 0.22737630208333334,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_BB_RUND_loss": 0.7562405467033386,
+      "eval_BB_RUND_runtime": 73.6895,
+      "eval_BB_RUND_samples_per_second": 36.844,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.3094656794076446,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_bigbrother_loss": 1.1955605745315552,
+      "eval_bigbrother_runtime": 39.2755,
+      "eval_bigbrother_samples_per_second": 34.882,
+      "eval_bigbrother_steps_per_second": 1.095,
+      "eval_bigbrother_wer": 0.4638685249335374,
+      "step": 8005
+    },
+    {
+      "epoch": 6.0,
+      "grad_norm": 1.5980861186981201,
+      "learning_rate": 8.704828909497922e-05,
+      "loss": 0.6237,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_rundkast_loss": 0.269611120223999,
+      "eval_rundkast_runtime": 31.4039,
+      "eval_rundkast_samples_per_second": 42.829,
+      "eval_rundkast_steps_per_second": 1.369,
+      "eval_rundkast_wer": 0.14675469296850144,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_nb_samtale_loss": 0.4713493287563324,
+      "eval_nb_samtale_runtime": 35.984,
+      "eval_nb_samtale_samples_per_second": 14.812,
+      "eval_nb_samtale_steps_per_second": 0.472,
+      "eval_nb_samtale_wer": 0.22029622395833334,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_BB_RUND_loss": 0.6956652998924255,
+      "eval_BB_RUND_runtime": 73.7058,
+      "eval_BB_RUND_samples_per_second": 36.836,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.29605763458074846,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_bigbrother_loss": 1.1138566732406616,
+      "eval_bigbrother_runtime": 39.5517,
+      "eval_bigbrother_samples_per_second": 34.638,
+      "eval_bigbrother_steps_per_second": 1.087,
+      "eval_bigbrother_wer": 0.4462257310883751,
+      "step": 9606
+    },
+    {
+      "epoch": 7.0,
+      "grad_norm": 4.422884941101074,
+      "learning_rate": 8.448832747041894e-05,
+      "loss": 0.5972,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_rundkast_loss": 0.25946080684661865,
+      "eval_rundkast_runtime": 31.4395,
+      "eval_rundkast_samples_per_second": 42.781,
+      "eval_rundkast_steps_per_second": 1.368,
+      "eval_rundkast_wer": 0.14428889595927458,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_nb_samtale_loss": 0.49012112617492676,
+      "eval_nb_samtale_runtime": 35.8902,
+      "eval_nb_samtale_samples_per_second": 14.851,
+      "eval_nb_samtale_steps_per_second": 0.474,
+      "eval_nb_samtale_wer": 0.21590169270833334,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_BB_RUND_loss": 0.7060232758522034,
+      "eval_BB_RUND_runtime": 73.9395,
+      "eval_BB_RUND_samples_per_second": 36.719,
+      "eval_BB_RUND_steps_per_second": 1.15,
+      "eval_BB_RUND_wer": 0.29153492095257155,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_bigbrother_loss": 1.1444189548492432,
+      "eval_bigbrother_runtime": 39.3579,
+      "eval_bigbrother_samples_per_second": 34.809,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.440264239104165,
+      "step": 11207
+    },
+    {
+      "epoch": 8.0,
+      "grad_norm": 1.6600903272628784,
+      "learning_rate": 8.192836584585866e-05,
+      "loss": 0.5771,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_rundkast_loss": 0.27805188298225403,
+      "eval_rundkast_runtime": 31.731,
+      "eval_rundkast_samples_per_second": 42.388,
+      "eval_rundkast_steps_per_second": 1.355,
+      "eval_rundkast_wer": 0.14945911549475024,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_nb_samtale_loss": 0.4692385196685791,
+      "eval_nb_samtale_runtime": 36.1624,
+      "eval_nb_samtale_samples_per_second": 14.739,
+      "eval_nb_samtale_steps_per_second": 0.47,
+      "eval_nb_samtale_wer": 0.22216796875,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_BB_RUND_loss": 0.7197623252868652,
+      "eval_BB_RUND_runtime": 92.436,
+      "eval_BB_RUND_samples_per_second": 29.372,
+      "eval_BB_RUND_steps_per_second": 0.92,
+      "eval_BB_RUND_wer": 0.2952971783069842,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_bigbrother_loss": 1.1536922454833984,
+      "eval_bigbrother_runtime": 39.1987,
+      "eval_bigbrother_samples_per_second": 34.95,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.44260049947635544,
+      "step": 12808
+    },
+    {
+      "epoch": 9.0,
+      "grad_norm": 1.0308187007904053,
+      "learning_rate": 7.936840422129838e-05,
+      "loss": 0.5567,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_rundkast_loss": 0.28997811675071716,
+      "eval_rundkast_runtime": 31.3398,
+      "eval_rundkast_samples_per_second": 42.917,
+      "eval_rundkast_steps_per_second": 1.372,
+      "eval_rundkast_wer": 0.1408685968819599,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_nb_samtale_loss": 0.46654534339904785,
+      "eval_nb_samtale_runtime": 35.7424,
+      "eval_nb_samtale_samples_per_second": 14.912,
+      "eval_nb_samtale_steps_per_second": 0.476,
+      "eval_nb_samtale_wer": 0.21126302083333334,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_BB_RUND_loss": 0.7060103416442871,
+      "eval_BB_RUND_runtime": 73.7474,
+      "eval_BB_RUND_samples_per_second": 36.815,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.28328997398439065,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_bigbrother_loss": 1.1144466400146484,
+      "eval_bigbrother_runtime": 39.254,
+      "eval_bigbrother_samples_per_second": 34.901,
+      "eval_bigbrother_steps_per_second": 1.095,
+      "eval_bigbrother_wer": 0.4277773302183195,
+      "step": 14409
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3.7091312408447266,
+      "learning_rate": 7.681004157339303e-05,
+      "loss": 0.5422,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_rundkast_loss": 0.292531818151474,
+      "eval_rundkast_runtime": 31.6718,
+      "eval_rundkast_samples_per_second": 42.467,
+      "eval_rundkast_steps_per_second": 1.358,
+      "eval_rundkast_wer": 0.14134584791600383,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_nb_samtale_loss": 0.4930917024612427,
+      "eval_nb_samtale_runtime": 35.8047,
+      "eval_nb_samtale_samples_per_second": 14.886,
+      "eval_nb_samtale_steps_per_second": 0.475,
+      "eval_nb_samtale_wer": 0.2080078125,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_BB_RUND_loss": 0.7012096643447876,
+      "eval_BB_RUND_runtime": 75.6789,
+      "eval_BB_RUND_samples_per_second": 35.875,
+      "eval_BB_RUND_steps_per_second": 1.123,
+      "eval_BB_RUND_wer": 0.28092855713428055,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_bigbrother_loss": 1.1022217273712158,
+      "eval_bigbrother_runtime": 39.334,
+      "eval_bigbrother_samples_per_second": 34.83,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.4221380810440667,
+      "step": 16010
+    },
+    {
+      "epoch": 11.0,
+      "grad_norm": 0.9090811014175415,
+      "learning_rate": 7.425167892548769e-05,
+      "loss": 0.5266,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_rundkast_loss": 0.30149751901626587,
+      "eval_rundkast_runtime": 31.3393,
+      "eval_rundkast_samples_per_second": 42.917,
+      "eval_rundkast_steps_per_second": 1.372,
+      "eval_rundkast_wer": 0.13935730194082088,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_nb_samtale_loss": 0.4974854290485382,
+      "eval_nb_samtale_runtime": 35.6974,
+      "eval_nb_samtale_samples_per_second": 14.931,
+      "eval_nb_samtale_steps_per_second": 0.476,
+      "eval_nb_samtale_wer": 0.20947265625,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_BB_RUND_loss": 0.7534126043319702,
+      "eval_BB_RUND_runtime": 73.8118,
+      "eval_BB_RUND_samples_per_second": 36.783,
+      "eval_BB_RUND_steps_per_second": 1.152,
+      "eval_BB_RUND_wer": 0.2830898539123474,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_bigbrother_loss": 1.1972620487213135,
+      "eval_bigbrother_runtime": 39.3175,
+      "eval_bigbrother_samples_per_second": 34.845,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.4285829372432128,
+      "step": 17611
+    },
+    {
+      "epoch": 12.0,
+      "grad_norm": 1.5719759464263916,
+      "learning_rate": 7.169331627758235e-05,
+      "loss": 0.5103,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_rundkast_loss": 0.2790067195892334,
+      "eval_rundkast_runtime": 31.604,
+      "eval_rundkast_samples_per_second": 42.558,
+      "eval_rundkast_steps_per_second": 1.361,
+      "eval_rundkast_wer": 0.13728921412663062,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_nb_samtale_loss": 0.47254645824432373,
+      "eval_nb_samtale_runtime": 36.6581,
+      "eval_nb_samtale_samples_per_second": 14.54,
+      "eval_nb_samtale_steps_per_second": 0.464,
+      "eval_nb_samtale_wer": 0.208740234375,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_BB_RUND_loss": 0.7001897096633911,
+      "eval_BB_RUND_runtime": 76.071,
+      "eval_BB_RUND_samples_per_second": 35.69,
+      "eval_BB_RUND_steps_per_second": 1.117,
+      "eval_BB_RUND_wer": 0.27512507504502703,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_bigbrother_loss": 1.1136471033096313,
+      "eval_bigbrother_runtime": 39.6183,
+      "eval_bigbrother_samples_per_second": 34.58,
+      "eval_bigbrother_steps_per_second": 1.085,
+      "eval_bigbrother_wer": 0.41456537501007007,
+      "step": 19212
+    },
+    {
+      "epoch": 13.0,
+      "grad_norm": 1.0063461065292358,
+      "learning_rate": 6.913495362967701e-05,
+      "loss": 0.4968,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_rundkast_loss": 0.29398083686828613,
+      "eval_rundkast_runtime": 31.5607,
+      "eval_rundkast_samples_per_second": 42.616,
+      "eval_rundkast_steps_per_second": 1.362,
+      "eval_rundkast_wer": 0.1381641743557111,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_nb_samtale_loss": 0.4911497235298157,
+      "eval_nb_samtale_runtime": 36.0599,
+      "eval_nb_samtale_samples_per_second": 14.781,
+      "eval_nb_samtale_steps_per_second": 0.471,
+      "eval_nb_samtale_wer": 0.212158203125,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_BB_RUND_loss": 0.729911208152771,
+      "eval_BB_RUND_runtime": 74.2919,
+      "eval_BB_RUND_samples_per_second": 36.545,
+      "eval_BB_RUND_steps_per_second": 1.144,
+      "eval_BB_RUND_wer": 0.2774864918951371,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_bigbrother_loss": 1.1584389209747314,
+      "eval_bigbrother_runtime": 39.483,
+      "eval_bigbrother_samples_per_second": 34.698,
+      "eval_bigbrother_steps_per_second": 1.089,
+      "eval_bigbrother_wer": 0.41786836381213244,
+      "step": 20813
+    },
+    {
+      "epoch": 14.0,
+      "grad_norm": 1.0339038372039795,
+      "learning_rate": 6.657499200511673e-05,
+      "loss": 0.4867,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_rundkast_loss": 0.2678089141845703,
+      "eval_rundkast_runtime": 31.9259,
+      "eval_rundkast_samples_per_second": 42.129,
+      "eval_rundkast_steps_per_second": 1.347,
+      "eval_rundkast_wer": 0.1390391345847916,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_nb_samtale_loss": 0.48425397276878357,
+      "eval_nb_samtale_runtime": 35.6709,
+      "eval_nb_samtale_samples_per_second": 14.942,
+      "eval_nb_samtale_steps_per_second": 0.477,
+      "eval_nb_samtale_wer": 0.21004231770833334,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_BB_RUND_loss": 0.6763830184936523,
+      "eval_BB_RUND_runtime": 75.1278,
+      "eval_BB_RUND_samples_per_second": 36.138,
+      "eval_BB_RUND_steps_per_second": 1.131,
+      "eval_BB_RUND_wer": 0.2732439463678207,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_bigbrother_loss": 1.0772405862808228,
+      "eval_bigbrother_runtime": 39.3624,
+      "eval_bigbrother_samples_per_second": 34.805,
+      "eval_bigbrother_steps_per_second": 1.092,
+      "eval_bigbrother_wer": 0.408845565133328,
+      "step": 22414
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 0.5528441667556763,
+      "learning_rate": 6.401662935721138e-05,
+      "loss": 0.4721,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_rundkast_loss": 0.2952366769313812,
+      "eval_rundkast_runtime": 31.7087,
+      "eval_rundkast_samples_per_second": 42.417,
+      "eval_rundkast_steps_per_second": 1.356,
+      "eval_rundkast_wer": 0.1345847916003818,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_nb_samtale_loss": 0.48395708203315735,
+      "eval_nb_samtale_runtime": 35.8001,
+      "eval_nb_samtale_samples_per_second": 14.888,
+      "eval_nb_samtale_steps_per_second": 0.475,
+      "eval_nb_samtale_wer": 0.20865885416666666,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_BB_RUND_loss": 0.7274541854858398,
+      "eval_BB_RUND_runtime": 74.0948,
+      "eval_BB_RUND_samples_per_second": 36.642,
+      "eval_BB_RUND_steps_per_second": 1.147,
+      "eval_BB_RUND_wer": 0.269481689013408,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_bigbrother_loss": 1.1518090963363647,
+      "eval_bigbrother_runtime": 39.2366,
+      "eval_bigbrother_samples_per_second": 34.916,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.4053008942237976,
+      "step": 24015
+    },
+    {
+      "epoch": 16.0,
+      "grad_norm": 0.9716380834579468,
+      "learning_rate": 6.14566677326511e-05,
+      "loss": 0.4626,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_rundkast_loss": 0.3125823736190796,
+      "eval_rundkast_runtime": 31.5106,
+      "eval_rundkast_samples_per_second": 42.684,
+      "eval_rundkast_steps_per_second": 1.365,
+      "eval_rundkast_wer": 0.13347120585427935,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_nb_samtale_loss": 0.5268623232841492,
+      "eval_nb_samtale_runtime": 35.7773,
+      "eval_nb_samtale_samples_per_second": 14.898,
+      "eval_nb_samtale_steps_per_second": 0.475,
+      "eval_nb_samtale_wer": 0.209228515625,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_BB_RUND_loss": 0.752697229385376,
+      "eval_BB_RUND_runtime": 75.4571,
+      "eval_BB_RUND_samples_per_second": 35.981,
+      "eval_BB_RUND_steps_per_second": 1.126,
+      "eval_BB_RUND_wer": 0.2700820492295377,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_bigbrother_loss": 1.1851829290390015,
+      "eval_bigbrother_runtime": 39.3085,
+      "eval_bigbrother_samples_per_second": 34.853,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.4079593974059454,
+      "step": 25616
+    },
+    {
+      "epoch": 17.0,
+      "grad_norm": 1.0000524520874023,
+      "learning_rate": 5.889830508474577e-05,
+      "loss": 0.4554,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_rundkast_loss": 0.28784507513046265,
+      "eval_rundkast_runtime": 31.1375,
+      "eval_rundkast_samples_per_second": 43.196,
+      "eval_rundkast_steps_per_second": 1.381,
+      "eval_rundkast_wer": 0.13140311804008908,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_nb_samtale_loss": 0.47152796387672424,
+      "eval_nb_samtale_runtime": 35.203,
+      "eval_nb_samtale_samples_per_second": 15.141,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.20361328125,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_BB_RUND_loss": 0.705199122428894,
+      "eval_BB_RUND_runtime": 73.2232,
+      "eval_BB_RUND_samples_per_second": 37.078,
+      "eval_BB_RUND_steps_per_second": 1.161,
+      "eval_BB_RUND_wer": 0.2690814488693216,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_bigbrother_loss": 1.1149847507476807,
+      "eval_bigbrother_runtime": 39.237,
+      "eval_bigbrother_samples_per_second": 34.916,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.40868444372834933,
+      "step": 27217
+    },
+    {
+      "epoch": 18.0,
+      "grad_norm": 0.8535083532333374,
+      "learning_rate": 5.6338343460185485e-05,
+      "loss": 0.4407,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_rundkast_loss": 0.29337021708488464,
+      "eval_rundkast_runtime": 31.587,
+      "eval_rundkast_samples_per_second": 42.581,
+      "eval_rundkast_steps_per_second": 1.361,
+      "eval_rundkast_wer": 0.13044861597200128,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_nb_samtale_loss": 0.5154338479042053,
+      "eval_nb_samtale_runtime": 35.5632,
+      "eval_nb_samtale_samples_per_second": 14.987,
+      "eval_nb_samtale_steps_per_second": 0.478,
+      "eval_nb_samtale_wer": 0.204345703125,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_BB_RUND_loss": 0.7406498789787292,
+      "eval_BB_RUND_runtime": 73.657,
+      "eval_BB_RUND_samples_per_second": 36.86,
+      "eval_BB_RUND_steps_per_second": 1.154,
+      "eval_BB_RUND_wer": 0.26812087252351413,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_bigbrother_loss": 1.1797504425048828,
+      "eval_bigbrother_runtime": 38.9311,
+      "eval_bigbrother_samples_per_second": 35.19,
+      "eval_bigbrother_steps_per_second": 1.105,
+      "eval_bigbrother_wer": 0.40699266897607345,
+      "step": 28818
+    },
+    {
+      "epoch": 19.0,
+      "grad_norm": 4.492996692657471,
+      "learning_rate": 5.378157978893509e-05,
+      "loss": 0.4361,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_rundkast_loss": 0.2833118140697479,
+      "eval_rundkast_runtime": 31.0219,
+      "eval_rundkast_samples_per_second": 43.357,
+      "eval_rundkast_steps_per_second": 1.386,
+      "eval_rundkast_wer": 0.13219853643016227,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_nb_samtale_loss": 0.4991215765476227,
+      "eval_nb_samtale_runtime": 35.3186,
+      "eval_nb_samtale_samples_per_second": 15.091,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.20638020833333334,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_BB_RUND_loss": 0.7097201347351074,
+      "eval_BB_RUND_runtime": 73.7433,
+      "eval_BB_RUND_samples_per_second": 36.817,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.26451871122673604,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_bigbrother_loss": 1.1280052661895752,
+      "eval_bigbrother_runtime": 38.9563,
+      "eval_bigbrother_samples_per_second": 35.168,
+      "eval_bigbrother_steps_per_second": 1.104,
+      "eval_bigbrother_wer": 0.39837267380971564,
+      "step": 30419
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 1.5283879041671753,
+      "learning_rate": 5.122161816437481e-05,
+      "loss": 0.4249,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_rundkast_loss": 0.309190571308136,
+      "eval_rundkast_runtime": 31.2274,
+      "eval_rundkast_samples_per_second": 43.071,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.13084632516703787,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_nb_samtale_loss": 0.49869558215141296,
+      "eval_nb_samtale_runtime": 35.2581,
+      "eval_nb_samtale_samples_per_second": 15.117,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.200927734375,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_BB_RUND_loss": 0.7553633451461792,
+      "eval_BB_RUND_runtime": 73.477,
+      "eval_BB_RUND_samples_per_second": 36.95,
+      "eval_BB_RUND_steps_per_second": 1.157,
+      "eval_BB_RUND_wer": 0.26575945567340403,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_bigbrother_loss": 1.1935659646987915,
+      "eval_bigbrother_runtime": 39.2084,
+      "eval_bigbrother_samples_per_second": 34.941,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.40248126963667125,
+      "step": 32020
+    },
+    {
+      "epoch": 21.0,
+      "grad_norm": 0.824657142162323,
+      "learning_rate": 4.866165653981452e-05,
+      "loss": 0.4167,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_rundkast_loss": 0.3222857415676117,
+      "eval_rundkast_runtime": 31.2353,
+      "eval_rundkast_samples_per_second": 43.06,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.1296531975819281,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_nb_samtale_loss": 0.533822774887085,
+      "eval_nb_samtale_runtime": 35.2167,
+      "eval_nb_samtale_samples_per_second": 15.135,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.201171875,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_BB_RUND_loss": 0.7721800804138184,
+      "eval_BB_RUND_runtime": 73.7086,
+      "eval_BB_RUND_samples_per_second": 36.834,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.2623574144486692,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_bigbrother_loss": 1.2132436037063599,
+      "eval_bigbrother_runtime": 39.1843,
+      "eval_bigbrother_samples_per_second": 34.963,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.39660033835495045,
+      "step": 33621
+    },
+    {
+      "epoch": 22.0,
+      "grad_norm": 1.1440060138702393,
+      "learning_rate": 4.6103293891909183e-05,
+      "loss": 0.4105,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_rundkast_loss": 0.31660783290863037,
+      "eval_rundkast_runtime": 31.6185,
+      "eval_rundkast_samples_per_second": 42.538,
+      "eval_rundkast_steps_per_second": 1.36,
+      "eval_rundkast_wer": 0.12893732103086222,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_nb_samtale_loss": 0.5133374929428101,
+      "eval_nb_samtale_runtime": 35.2449,
+      "eval_nb_samtale_samples_per_second": 15.123,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.20157877604166666,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_BB_RUND_loss": 0.7647114992141724,
+      "eval_BB_RUND_runtime": 73.4723,
+      "eval_BB_RUND_samples_per_second": 36.953,
+      "eval_BB_RUND_steps_per_second": 1.157,
+      "eval_BB_RUND_wer": 0.26255753452071245,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_bigbrother_loss": 1.2045847177505493,
+      "eval_bigbrother_runtime": 39.0811,
+      "eval_bigbrother_samples_per_second": 35.055,
+      "eval_bigbrother_steps_per_second": 1.1,
+      "eval_bigbrother_wer": 0.39813099170224764,
+      "step": 35222
+    },
+    {
+      "epoch": 23.0,
+      "grad_norm": 1.2679944038391113,
+      "learning_rate": 4.354493124400384e-05,
+      "loss": 0.4077,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_rundkast_loss": 0.32336536049842834,
+      "eval_rundkast_runtime": 31.2205,
+      "eval_rundkast_samples_per_second": 43.081,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.13156220171810373,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_nb_samtale_loss": 0.5165642499923706,
+      "eval_nb_samtale_runtime": 35.3263,
+      "eval_nb_samtale_samples_per_second": 15.088,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.20035807291666666,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_BB_RUND_loss": 0.7570832967758179,
+      "eval_BB_RUND_runtime": 90.621,
+      "eval_BB_RUND_samples_per_second": 29.96,
+      "eval_BB_RUND_steps_per_second": 0.938,
+      "eval_BB_RUND_wer": 0.26323794276565937,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_bigbrother_loss": 1.1831412315368652,
+      "eval_bigbrother_runtime": 39.2988,
+      "eval_bigbrother_samples_per_second": 34.861,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.3967614597599291,
+      "step": 36823
+    },
+    {
+      "epoch": 24.0,
+      "grad_norm": 6.380431175231934,
+      "learning_rate": 4.098496961944356e-05,
+      "loss": 0.4011,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_rundkast_loss": 0.3312782943248749,
+      "eval_rundkast_runtime": 31.4003,
+      "eval_rundkast_samples_per_second": 42.834,
+      "eval_rundkast_steps_per_second": 1.369,
+      "eval_rundkast_wer": 0.12853961183582566,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_nb_samtale_loss": 0.5143250823020935,
+      "eval_nb_samtale_runtime": 35.5114,
+      "eval_nb_samtale_samples_per_second": 15.009,
+      "eval_nb_samtale_steps_per_second": 0.479,
+      "eval_nb_samtale_wer": 0.19954427083333334,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_BB_RUND_loss": 0.7850114703178406,
+      "eval_BB_RUND_runtime": 74.2024,
+      "eval_BB_RUND_samples_per_second": 36.589,
+      "eval_BB_RUND_steps_per_second": 1.146,
+      "eval_BB_RUND_wer": 0.26135681408845307,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_bigbrother_loss": 1.2299407720565796,
+      "eval_bigbrother_runtime": 39.2032,
+      "eval_bigbrother_samples_per_second": 34.946,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.39595585273503586,
+      "step": 38424
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 0.8889333009719849,
+      "learning_rate": 3.842660697153822e-05,
+      "loss": 0.3946,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_rundkast_loss": 0.3259143829345703,
+      "eval_rundkast_runtime": 31.2371,
+      "eval_rundkast_samples_per_second": 43.058,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.12822144447979636,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_nb_samtale_loss": 0.5260791778564453,
+      "eval_nb_samtale_runtime": 35.2592,
+      "eval_nb_samtale_samples_per_second": 15.117,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.19742838541666666,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_BB_RUND_loss": 0.7829692959785461,
+      "eval_BB_RUND_runtime": 96.3242,
+      "eval_BB_RUND_samples_per_second": 28.186,
+      "eval_BB_RUND_steps_per_second": 0.882,
+      "eval_BB_RUND_wer": 0.25939563738242943,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_bigbrother_loss": 1.2314956188201904,
+      "eval_bigbrother_runtime": 39.2118,
+      "eval_bigbrother_samples_per_second": 34.938,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.3917666962055909,
+      "step": 40025
+    },
+    {
+      "epoch": 26.0,
+      "grad_norm": 2.6945877075195312,
+      "learning_rate": 3.5866645346977936e-05,
+      "loss": 0.3863,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_rundkast_loss": 0.3363383412361145,
+      "eval_rundkast_runtime": 31.3558,
+      "eval_rundkast_samples_per_second": 42.895,
+      "eval_rundkast_steps_per_second": 1.371,
+      "eval_rundkast_wer": 0.13124403436207446,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_nb_samtale_loss": 0.5427711009979248,
+      "eval_nb_samtale_runtime": 35.2067,
+      "eval_nb_samtale_samples_per_second": 15.139,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.20467122395833334,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_BB_RUND_loss": 0.8028616905212402,
+      "eval_BB_RUND_runtime": 73.6484,
+      "eval_BB_RUND_samples_per_second": 36.864,
+      "eval_BB_RUND_steps_per_second": 1.154,
+      "eval_BB_RUND_wer": 0.2621172703622173,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_bigbrother_loss": 1.2609052658081055,
+      "eval_bigbrother_runtime": 39.2296,
+      "eval_bigbrother_samples_per_second": 34.923,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.39506968500765327,
+      "step": 41626
+    },
+    {
+      "epoch": 27.0,
+      "grad_norm": 0.7852900624275208,
+      "learning_rate": 3.330828269907259e-05,
+      "loss": 0.3799,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_rundkast_loss": 0.3347199857234955,
+      "eval_rundkast_runtime": 31.2946,
+      "eval_rundkast_samples_per_second": 42.979,
+      "eval_rundkast_steps_per_second": 1.374,
+      "eval_rundkast_wer": 0.12893732103086222,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_nb_samtale_loss": 0.5341453552246094,
+      "eval_nb_samtale_runtime": 35.3834,
+      "eval_nb_samtale_samples_per_second": 15.064,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.20328776041666666,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_BB_RUND_loss": 0.7905371189117432,
+      "eval_BB_RUND_runtime": 74.2226,
+      "eval_BB_RUND_samples_per_second": 36.579,
+      "eval_BB_RUND_steps_per_second": 1.145,
+      "eval_BB_RUND_wer": 0.25959575745447266,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_bigbrother_loss": 1.2384859323501587,
+      "eval_bigbrother_runtime": 39.6106,
+      "eval_bigbrother_samples_per_second": 34.587,
+      "eval_bigbrother_steps_per_second": 1.086,
+      "eval_bigbrother_wer": 0.39192781761056955,
+      "step": 43227
+    },
+    {
+      "epoch": 28.0,
+      "grad_norm": 1.839573621749878,
+      "learning_rate": 3.074992005116725e-05,
+      "loss": 0.3782,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_rundkast_loss": 0.33070889115333557,
+      "eval_rundkast_runtime": 31.2558,
+      "eval_rundkast_samples_per_second": 43.032,
+      "eval_rundkast_steps_per_second": 1.376,
+      "eval_rundkast_wer": 0.12750556792873052,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_nb_samtale_loss": 0.5499075055122375,
+      "eval_nb_samtale_runtime": 35.4546,
+      "eval_nb_samtale_samples_per_second": 15.033,
+      "eval_nb_samtale_steps_per_second": 0.479,
+      "eval_nb_samtale_wer": 0.19881184895833334,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_BB_RUND_loss": 0.7748451232910156,
+      "eval_BB_RUND_runtime": 73.8572,
+      "eval_BB_RUND_samples_per_second": 36.76,
+      "eval_BB_RUND_steps_per_second": 1.151,
+      "eval_BB_RUND_wer": 0.25531318791274765,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_bigbrother_loss": 1.2108979225158691,
+      "eval_bigbrother_runtime": 39.3441,
+      "eval_bigbrother_samples_per_second": 34.821,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.3849995971964876,
+      "step": 44828
+    },
+    {
+      "epoch": 29.0,
+      "grad_norm": 1.2005807161331177,
+      "learning_rate": 2.8189958426606973e-05,
+      "loss": 0.3729,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_rundkast_loss": 0.3197638690471649,
+      "eval_rundkast_runtime": 31.5545,
+      "eval_rundkast_samples_per_second": 42.625,
+      "eval_rundkast_steps_per_second": 1.363,
+      "eval_rundkast_wer": 0.12671014953865734,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_nb_samtale_loss": 0.5454243421554565,
+      "eval_nb_samtale_runtime": 35.43,
+      "eval_nb_samtale_samples_per_second": 15.044,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.19832356770833334,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_BB_RUND_loss": 0.7797754406929016,
+      "eval_BB_RUND_runtime": 73.7244,
+      "eval_BB_RUND_samples_per_second": 36.826,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.25567340404242545,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_bigbrother_loss": 1.231561541557312,
+      "eval_bigbrother_runtime": 39.2468,
+      "eval_bigbrother_samples_per_second": 34.907,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.38620800773382746,
+      "step": 46429
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 1.4953359365463257,
+      "learning_rate": 2.562999680204669e-05,
+      "loss": 0.3718,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_rundkast_loss": 0.33351558446884155,
+      "eval_rundkast_runtime": 31.2627,
+      "eval_rundkast_samples_per_second": 43.023,
+      "eval_rundkast_steps_per_second": 1.375,
+      "eval_rundkast_wer": 0.12830098631880368,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_nb_samtale_loss": 0.5619927048683167,
+      "eval_nb_samtale_runtime": 35.2849,
+      "eval_nb_samtale_samples_per_second": 15.106,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.19986979166666666,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_BB_RUND_loss": 0.7934340238571167,
+      "eval_BB_RUND_runtime": 74.4083,
+      "eval_BB_RUND_samples_per_second": 36.488,
+      "eval_BB_RUND_steps_per_second": 1.142,
+      "eval_BB_RUND_wer": 0.25839503702221334,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_bigbrother_loss": 1.2452094554901123,
+      "eval_bigbrother_runtime": 39.1955,
+      "eval_bigbrother_samples_per_second": 34.953,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.39071940707322966,
+      "step": 48030
+    },
+    {
+      "epoch": 31.0,
+      "grad_norm": 2.022852659225464,
+      "learning_rate": 2.307163415414135e-05,
+      "loss": 0.3648,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_rundkast_loss": 0.32245931029319763,
+      "eval_rundkast_runtime": 31.3953,
+      "eval_rundkast_samples_per_second": 42.841,
+      "eval_rundkast_steps_per_second": 1.37,
+      "eval_rundkast_wer": 0.1252783964365256,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_nb_samtale_loss": 0.547818660736084,
+      "eval_nb_samtale_runtime": 35.3829,
+      "eval_nb_samtale_samples_per_second": 15.064,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.19913736979166666,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_BB_RUND_loss": 0.7814807295799255,
+      "eval_BB_RUND_runtime": 74.2777,
+      "eval_BB_RUND_samples_per_second": 36.552,
+      "eval_BB_RUND_steps_per_second": 1.144,
+      "eval_BB_RUND_wer": 0.25687412447468483,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_bigbrother_loss": 1.232583999633789,
+      "eval_bigbrother_runtime": 39.2964,
+      "eval_bigbrother_samples_per_second": 34.863,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.3895915572383791,
+      "step": 49631
+    },
+    {
+      "epoch": 32.0,
+      "grad_norm": 1.159850001335144,
+      "learning_rate": 2.051327150623601e-05,
+      "loss": 0.3556,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_rundkast_loss": 0.33501243591308594,
+      "eval_rundkast_runtime": 31.2712,
+      "eval_rundkast_samples_per_second": 43.011,
+      "eval_rundkast_steps_per_second": 1.375,
+      "eval_rundkast_wer": 0.12623289850461342,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_nb_samtale_loss": 0.5665200352668762,
+      "eval_nb_samtale_runtime": 35.0524,
+      "eval_nb_samtale_samples_per_second": 15.206,
+      "eval_nb_samtale_steps_per_second": 0.485,
+      "eval_nb_samtale_wer": 0.19685872395833334,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_BB_RUND_loss": 0.8201074004173279,
+      "eval_BB_RUND_runtime": 73.6889,
+      "eval_BB_RUND_samples_per_second": 36.844,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.2548328997398439,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_bigbrother_loss": 1.296426773071289,
+      "eval_bigbrother_runtime": 39.3283,
+      "eval_bigbrother_samples_per_second": 34.835,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.3852412793039555,
+      "step": 51232
+    },
+    {
+      "epoch": 33.0,
+      "grad_norm": 4.668502330780029,
+      "learning_rate": 1.7954908858330668e-05,
+      "loss": 0.3533,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_rundkast_loss": 0.33790138363838196,
+      "eval_rundkast_runtime": 31.5957,
+      "eval_rundkast_samples_per_second": 42.569,
+      "eval_rundkast_steps_per_second": 1.361,
+      "eval_rundkast_wer": 0.12623289850461342,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_nb_samtale_loss": 0.5643696784973145,
+      "eval_nb_samtale_runtime": 35.3499,
+      "eval_nb_samtale_samples_per_second": 15.078,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.19669596354166666,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_BB_RUND_loss": 0.8017848134040833,
+      "eval_BB_RUND_runtime": 74.5846,
+      "eval_BB_RUND_samples_per_second": 36.402,
+      "eval_BB_RUND_steps_per_second": 1.14,
+      "eval_BB_RUND_wer": 0.2553532119271563,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_bigbrother_loss": 1.2571812868118286,
+      "eval_bigbrother_runtime": 38.9999,
+      "eval_bigbrother_samples_per_second": 35.128,
+      "eval_bigbrother_steps_per_second": 1.103,
+      "eval_bigbrother_wer": 0.38508015789897687,
+      "step": 52833
+    },
+    {
+      "epoch": 34.0,
+      "grad_norm": 1.0839606523513794,
+      "learning_rate": 1.5394947233770386e-05,
+      "loss": 0.3524,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_rundkast_loss": 0.3482387959957123,
+      "eval_rundkast_runtime": 31.231,
+      "eval_rundkast_samples_per_second": 43.066,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.12496022908049634,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_nb_samtale_loss": 0.5782368779182434,
+      "eval_nb_samtale_runtime": 35.115,
+      "eval_nb_samtale_samples_per_second": 15.179,
+      "eval_nb_samtale_steps_per_second": 0.484,
+      "eval_nb_samtale_wer": 0.19881184895833334,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_BB_RUND_loss": 0.8167536854743958,
+      "eval_BB_RUND_runtime": 73.4659,
+      "eval_BB_RUND_samples_per_second": 36.956,
+      "eval_BB_RUND_steps_per_second": 1.157,
+      "eval_BB_RUND_wer": 0.2524314588753252,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_bigbrother_loss": 1.2767822742462158,
+      "eval_bigbrother_runtime": 39.0487,
+      "eval_bigbrother_samples_per_second": 35.084,
+      "eval_bigbrother_steps_per_second": 1.101,
+      "eval_bigbrother_wer": 0.38121324417948926,
+      "step": 54434
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 1.376759648323059,
+      "learning_rate": 1.2836584585865047e-05,
+      "loss": 0.3499,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_rundkast_loss": 0.3501284718513489,
+      "eval_rundkast_runtime": 32.4165,
+      "eval_rundkast_samples_per_second": 41.491,
+      "eval_rundkast_steps_per_second": 1.326,
+      "eval_rundkast_wer": 0.12575564747056953,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_nb_samtale_loss": 0.5841984152793884,
+      "eval_nb_samtale_runtime": 35.425,
+      "eval_nb_samtale_samples_per_second": 15.046,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.1982421875,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_BB_RUND_loss": 0.8236829042434692,
+      "eval_BB_RUND_runtime": 74.6418,
+      "eval_BB_RUND_samples_per_second": 36.374,
+      "eval_BB_RUND_steps_per_second": 1.139,
+      "eval_BB_RUND_wer": 0.25203121873123874,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_bigbrother_loss": 1.2888648509979248,
+      "eval_bigbrother_runtime": 39.2027,
+      "eval_bigbrother_samples_per_second": 34.947,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.38008539434463867,
+      "step": 56035
+    },
+    {
+      "epoch": 36.0,
+      "grad_norm": 1.6304969787597656,
+      "learning_rate": 1.0276622961304766e-05,
+      "loss": 0.349,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_rundkast_loss": 0.3395073413848877,
+      "eval_rundkast_runtime": 31.3594,
+      "eval_rundkast_samples_per_second": 42.89,
+      "eval_rundkast_steps_per_second": 1.371,
+      "eval_rundkast_wer": 0.12583518930957685,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_nb_samtale_loss": 0.5508641004562378,
+      "eval_nb_samtale_runtime": 35.3876,
+      "eval_nb_samtale_samples_per_second": 15.062,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.198974609375,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_BB_RUND_loss": 0.7999393939971924,
+      "eval_BB_RUND_runtime": 73.6053,
+      "eval_BB_RUND_samples_per_second": 36.886,
+      "eval_BB_RUND_steps_per_second": 1.155,
+      "eval_BB_RUND_wer": 0.25139083450070043,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_bigbrother_loss": 1.2519750595092773,
+      "eval_bigbrother_runtime": 38.9721,
+      "eval_bigbrother_samples_per_second": 35.153,
+      "eval_bigbrother_steps_per_second": 1.103,
+      "eval_bigbrother_wer": 0.3781519374848949,
+      "step": 57636
+    },
+    {
+      "epoch": 37.0,
+      "grad_norm": 0.9431388974189758,
+      "learning_rate": 7.718260313399425e-06,
+      "loss": 0.3443,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_rundkast_loss": 0.3431856632232666,
+      "eval_rundkast_runtime": 32.1917,
+      "eval_rundkast_samples_per_second": 41.781,
+      "eval_rundkast_steps_per_second": 1.336,
+      "eval_rundkast_wer": 0.12440343620744512,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_nb_samtale_loss": 0.5509617924690247,
+      "eval_nb_samtale_runtime": 35.3455,
+      "eval_nb_samtale_samples_per_second": 15.08,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.19669596354166666,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_BB_RUND_loss": 0.8117216229438782,
+      "eval_BB_RUND_runtime": 75.5514,
+      "eval_BB_RUND_samples_per_second": 35.936,
+      "eval_BB_RUND_steps_per_second": 1.125,
+      "eval_BB_RUND_wer": 0.2507504502701621,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_bigbrother_loss": 1.272763729095459,
+      "eval_bigbrother_runtime": 39.4053,
+      "eval_bigbrother_samples_per_second": 34.767,
+      "eval_bigbrother_steps_per_second": 1.091,
+      "eval_bigbrother_wer": 0.3785547409973415,
+      "step": 59237
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 64040,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 40,
+  "save_steps": 500,
+  "total_flos": 3.065538584603944e+20,
+  "train_batch_size": 48,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-59237/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b25133bdb24b039668b926e9e3f9c4343b5002d30a14ff9ac158220672a6f871
+size 4984

checkpoint-64040/config.json ADDED Viewed

	@@ -0,0 +1,116 @@

+{
+  "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
+  "activation_dropout": 0.055,
+  "adapter_attn_dim": null,
+  "adapter_kernel_size": 3,
+  "adapter_stride": 2,
+  "add_adapter": false,
+  "apply_spec_augment": true,
+  "architectures": [
+    "Wav2Vec2ForCTC"
+  ],
+  "attention_dropout": 0.094,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 768,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": true,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "mean",
+  "ctc_zero_infinity": true,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": true,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_dropout": 0.0,
+  "feat_extract_norm": "layer",
+  "feat_proj_dropout": 0.04,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.047,
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.041,
+  "mask_channel_length": 10,
+  "mask_channel_min_space": 1,
+  "mask_channel_other": 0.0,
+  "mask_channel_prob": 0.0,
+  "mask_channel_selection": "static",
+  "mask_feature_length": 64,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.25,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_min_space": 1,
+  "mask_time_other": 0.0,
+  "mask_time_prob": 0.082,
+  "mask_time_selection": "static",
+  "model_type": "wav2vec2",
+  "num_adapter_layers": 3,
+  "num_attention_heads": 16,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 24,
+  "num_negatives": 100,
+  "output_hidden_size": 1024,
+  "pad_token_id": 31,
+  "proj_codevector_dim": 768,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 34,
+  "xvector_output_dim": 512
+}

checkpoint-64040/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9fdd39709fe981bd7b0e964c8c1bb2da7ad17a4bb7f05e2b4b676ba51e9aefe9
+size 1261946880

checkpoint-64040/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ddee96e91cfe8010b081234c0e6a55d2b5a2131764bf2bd761c99ebbff519102
+size 2490438582

checkpoint-64040/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "processor_class": "Wav2Vec2ProcessorWithLM",
+  "return_attention_mask": true,
+  "sampling_rate": 16000
+}

checkpoint-64040/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fb97dd47ab1a1236fed22f9bdcfafcfb8420d1d9601f8d46dad23108923f319
+size 14308

checkpoint-64040/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:33594856a90c6ad7601d3393c45218d76a92a225c4bfc73e0c57225b8d75ee18
+size 1064

checkpoint-64040/trainer_state.json ADDED Viewed

	@@ -0,0 +1,1741 @@

+{
+  "best_metric": 0.2507504502701621,
+  "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/Combined/BB-RUND/30.05/checkpoint-59237",
+  "epoch": 40.0,
+  "eval_steps": 500,
+  "global_step": 64040,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "grad_norm": 3.5616490840911865,
+      "learning_rate": 9.984170131116086e-05,
+      "loss": 0.9316,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_rundkast_loss": 0.3094605803489685,
+      "eval_rundkast_runtime": 31.7263,
+      "eval_rundkast_samples_per_second": 42.394,
+      "eval_rundkast_steps_per_second": 1.355,
+      "eval_rundkast_wer": 0.18334393891186765,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_nb_samtale_loss": 0.5153853297233582,
+      "eval_nb_samtale_runtime": 36.9199,
+      "eval_nb_samtale_samples_per_second": 14.437,
+      "eval_nb_samtale_steps_per_second": 0.46,
+      "eval_nb_samtale_wer": 0.2501627604166667,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_BB_RUND_loss": 0.8934017419815063,
+      "eval_BB_RUND_runtime": 74.2605,
+      "eval_BB_RUND_samples_per_second": 36.56,
+      "eval_BB_RUND_steps_per_second": 1.145,
+      "eval_BB_RUND_wer": 0.3665399239543726,
+      "step": 1601
+    },
+    {
+      "epoch": 1.0,
+      "eval_bigbrother_loss": 1.4666274785995483,
+      "eval_bigbrother_runtime": 39.9935,
+      "eval_bigbrother_samples_per_second": 34.256,
+      "eval_bigbrother_steps_per_second": 1.075,
+      "eval_bigbrother_wer": 0.5517602513493918,
+      "step": 1601
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 1.8291858434677124,
+      "learning_rate": 9.728173968660058e-05,
+      "loss": 0.7975,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_rundkast_loss": 0.27037981152534485,
+      "eval_rundkast_runtime": 31.304,
+      "eval_rundkast_samples_per_second": 42.966,
+      "eval_rundkast_steps_per_second": 1.374,
+      "eval_rundkast_wer": 0.17968501431753103,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_nb_samtale_loss": 0.4818350672721863,
+      "eval_nb_samtale_runtime": 36.3495,
+      "eval_nb_samtale_samples_per_second": 14.663,
+      "eval_nb_samtale_steps_per_second": 0.468,
+      "eval_nb_samtale_wer": 0.2549641927083333,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_BB_RUND_loss": 0.7777431607246399,
+      "eval_BB_RUND_runtime": 74.0457,
+      "eval_BB_RUND_samples_per_second": 36.667,
+      "eval_BB_RUND_steps_per_second": 1.148,
+      "eval_BB_RUND_wer": 0.3568941364818891,
+      "step": 3202
+    },
+    {
+      "epoch": 2.0,
+      "eval_bigbrother_loss": 1.2756603956222534,
+      "eval_bigbrother_runtime": 39.2125,
+      "eval_bigbrother_samples_per_second": 34.938,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.5356481108515266,
+      "step": 3202
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 1.1911417245864868,
+      "learning_rate": 9.472337703869524e-05,
+      "loss": 0.7318,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_rundkast_loss": 0.2820556163787842,
+      "eval_rundkast_runtime": 31.3992,
+      "eval_rundkast_samples_per_second": 42.835,
+      "eval_rundkast_steps_per_second": 1.369,
+      "eval_rundkast_wer": 0.16679923639834554,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_nb_samtale_loss": 0.4887722134590149,
+      "eval_nb_samtale_runtime": 36.3679,
+      "eval_nb_samtale_samples_per_second": 14.656,
+      "eval_nb_samtale_steps_per_second": 0.467,
+      "eval_nb_samtale_wer": 0.23697916666666666,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_BB_RUND_loss": 0.7739498615264893,
+      "eval_BB_RUND_runtime": 74.2643,
+      "eval_BB_RUND_samples_per_second": 36.559,
+      "eval_BB_RUND_steps_per_second": 1.145,
+      "eval_BB_RUND_wer": 0.3293976385831499,
+      "step": 4803
+    },
+    {
+      "epoch": 3.0,
+      "eval_bigbrother_loss": 1.256850004196167,
+      "eval_bigbrother_runtime": 39.3324,
+      "eval_bigbrother_samples_per_second": 34.831,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.49343430274711997,
+      "step": 4803
+    },
+    {
+      "epoch": 4.0,
+      "grad_norm": 1.5012503862380981,
+      "learning_rate": 9.216341541413495e-05,
+      "loss": 0.6896,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_rundkast_loss": 0.2698061466217041,
+      "eval_rundkast_runtime": 31.5141,
+      "eval_rundkast_samples_per_second": 42.679,
+      "eval_rundkast_steps_per_second": 1.364,
+      "eval_rundkast_wer": 0.1590836780146357,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_nb_samtale_loss": 0.46429482102394104,
+      "eval_nb_samtale_runtime": 36.1366,
+      "eval_nb_samtale_samples_per_second": 14.75,
+      "eval_nb_samtale_steps_per_second": 0.47,
+      "eval_nb_samtale_wer": 0.22770182291666666,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_BB_RUND_loss": 0.7106366157531738,
+      "eval_BB_RUND_runtime": 74.1602,
+      "eval_BB_RUND_samples_per_second": 36.61,
+      "eval_BB_RUND_steps_per_second": 1.146,
+      "eval_BB_RUND_wer": 0.3115469281568941,
+      "step": 6404
+    },
+    {
+      "epoch": 4.0,
+      "eval_bigbrother_loss": 1.1434192657470703,
+      "eval_bigbrother_runtime": 39.4465,
+      "eval_bigbrother_samples_per_second": 34.731,
+      "eval_bigbrother_steps_per_second": 1.09,
+      "eval_bigbrother_wer": 0.4657214210907919,
+      "step": 6404
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1.3953436613082886,
+      "learning_rate": 8.960345378957467e-05,
+      "loss": 0.6527,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_rundkast_loss": 0.3087877333164215,
+      "eval_rundkast_runtime": 31.2187,
+      "eval_rundkast_samples_per_second": 43.083,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.15717467387846007,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_nb_samtale_loss": 0.498180627822876,
+      "eval_nb_samtale_runtime": 36.0025,
+      "eval_nb_samtale_samples_per_second": 14.805,
+      "eval_nb_samtale_steps_per_second": 0.472,
+      "eval_nb_samtale_wer": 0.22737630208333334,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_BB_RUND_loss": 0.7562405467033386,
+      "eval_BB_RUND_runtime": 73.6895,
+      "eval_BB_RUND_samples_per_second": 36.844,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.3094656794076446,
+      "step": 8005
+    },
+    {
+      "epoch": 5.0,
+      "eval_bigbrother_loss": 1.1955605745315552,
+      "eval_bigbrother_runtime": 39.2755,
+      "eval_bigbrother_samples_per_second": 34.882,
+      "eval_bigbrother_steps_per_second": 1.095,
+      "eval_bigbrother_wer": 0.4638685249335374,
+      "step": 8005
+    },
+    {
+      "epoch": 6.0,
+      "grad_norm": 1.5980861186981201,
+      "learning_rate": 8.704828909497922e-05,
+      "loss": 0.6237,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_rundkast_loss": 0.269611120223999,
+      "eval_rundkast_runtime": 31.4039,
+      "eval_rundkast_samples_per_second": 42.829,
+      "eval_rundkast_steps_per_second": 1.369,
+      "eval_rundkast_wer": 0.14675469296850144,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_nb_samtale_loss": 0.4713493287563324,
+      "eval_nb_samtale_runtime": 35.984,
+      "eval_nb_samtale_samples_per_second": 14.812,
+      "eval_nb_samtale_steps_per_second": 0.472,
+      "eval_nb_samtale_wer": 0.22029622395833334,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_BB_RUND_loss": 0.6956652998924255,
+      "eval_BB_RUND_runtime": 73.7058,
+      "eval_BB_RUND_samples_per_second": 36.836,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.29605763458074846,
+      "step": 9606
+    },
+    {
+      "epoch": 6.0,
+      "eval_bigbrother_loss": 1.1138566732406616,
+      "eval_bigbrother_runtime": 39.5517,
+      "eval_bigbrother_samples_per_second": 34.638,
+      "eval_bigbrother_steps_per_second": 1.087,
+      "eval_bigbrother_wer": 0.4462257310883751,
+      "step": 9606
+    },
+    {
+      "epoch": 7.0,
+      "grad_norm": 4.422884941101074,
+      "learning_rate": 8.448832747041894e-05,
+      "loss": 0.5972,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_rundkast_loss": 0.25946080684661865,
+      "eval_rundkast_runtime": 31.4395,
+      "eval_rundkast_samples_per_second": 42.781,
+      "eval_rundkast_steps_per_second": 1.368,
+      "eval_rundkast_wer": 0.14428889595927458,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_nb_samtale_loss": 0.49012112617492676,
+      "eval_nb_samtale_runtime": 35.8902,
+      "eval_nb_samtale_samples_per_second": 14.851,
+      "eval_nb_samtale_steps_per_second": 0.474,
+      "eval_nb_samtale_wer": 0.21590169270833334,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_BB_RUND_loss": 0.7060232758522034,
+      "eval_BB_RUND_runtime": 73.9395,
+      "eval_BB_RUND_samples_per_second": 36.719,
+      "eval_BB_RUND_steps_per_second": 1.15,
+      "eval_BB_RUND_wer": 0.29153492095257155,
+      "step": 11207
+    },
+    {
+      "epoch": 7.0,
+      "eval_bigbrother_loss": 1.1444189548492432,
+      "eval_bigbrother_runtime": 39.3579,
+      "eval_bigbrother_samples_per_second": 34.809,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.440264239104165,
+      "step": 11207
+    },
+    {
+      "epoch": 8.0,
+      "grad_norm": 1.6600903272628784,
+      "learning_rate": 8.192836584585866e-05,
+      "loss": 0.5771,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_rundkast_loss": 0.27805188298225403,
+      "eval_rundkast_runtime": 31.731,
+      "eval_rundkast_samples_per_second": 42.388,
+      "eval_rundkast_steps_per_second": 1.355,
+      "eval_rundkast_wer": 0.14945911549475024,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_nb_samtale_loss": 0.4692385196685791,
+      "eval_nb_samtale_runtime": 36.1624,
+      "eval_nb_samtale_samples_per_second": 14.739,
+      "eval_nb_samtale_steps_per_second": 0.47,
+      "eval_nb_samtale_wer": 0.22216796875,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_BB_RUND_loss": 0.7197623252868652,
+      "eval_BB_RUND_runtime": 92.436,
+      "eval_BB_RUND_samples_per_second": 29.372,
+      "eval_BB_RUND_steps_per_second": 0.92,
+      "eval_BB_RUND_wer": 0.2952971783069842,
+      "step": 12808
+    },
+    {
+      "epoch": 8.0,
+      "eval_bigbrother_loss": 1.1536922454833984,
+      "eval_bigbrother_runtime": 39.1987,
+      "eval_bigbrother_samples_per_second": 34.95,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.44260049947635544,
+      "step": 12808
+    },
+    {
+      "epoch": 9.0,
+      "grad_norm": 1.0308187007904053,
+      "learning_rate": 7.936840422129838e-05,
+      "loss": 0.5567,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_rundkast_loss": 0.28997811675071716,
+      "eval_rundkast_runtime": 31.3398,
+      "eval_rundkast_samples_per_second": 42.917,
+      "eval_rundkast_steps_per_second": 1.372,
+      "eval_rundkast_wer": 0.1408685968819599,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_nb_samtale_loss": 0.46654534339904785,
+      "eval_nb_samtale_runtime": 35.7424,
+      "eval_nb_samtale_samples_per_second": 14.912,
+      "eval_nb_samtale_steps_per_second": 0.476,
+      "eval_nb_samtale_wer": 0.21126302083333334,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_BB_RUND_loss": 0.7060103416442871,
+      "eval_BB_RUND_runtime": 73.7474,
+      "eval_BB_RUND_samples_per_second": 36.815,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.28328997398439065,
+      "step": 14409
+    },
+    {
+      "epoch": 9.0,
+      "eval_bigbrother_loss": 1.1144466400146484,
+      "eval_bigbrother_runtime": 39.254,
+      "eval_bigbrother_samples_per_second": 34.901,
+      "eval_bigbrother_steps_per_second": 1.095,
+      "eval_bigbrother_wer": 0.4277773302183195,
+      "step": 14409
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3.7091312408447266,
+      "learning_rate": 7.681004157339303e-05,
+      "loss": 0.5422,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_rundkast_loss": 0.292531818151474,
+      "eval_rundkast_runtime": 31.6718,
+      "eval_rundkast_samples_per_second": 42.467,
+      "eval_rundkast_steps_per_second": 1.358,
+      "eval_rundkast_wer": 0.14134584791600383,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_nb_samtale_loss": 0.4930917024612427,
+      "eval_nb_samtale_runtime": 35.8047,
+      "eval_nb_samtale_samples_per_second": 14.886,
+      "eval_nb_samtale_steps_per_second": 0.475,
+      "eval_nb_samtale_wer": 0.2080078125,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_BB_RUND_loss": 0.7012096643447876,
+      "eval_BB_RUND_runtime": 75.6789,
+      "eval_BB_RUND_samples_per_second": 35.875,
+      "eval_BB_RUND_steps_per_second": 1.123,
+      "eval_BB_RUND_wer": 0.28092855713428055,
+      "step": 16010
+    },
+    {
+      "epoch": 10.0,
+      "eval_bigbrother_loss": 1.1022217273712158,
+      "eval_bigbrother_runtime": 39.334,
+      "eval_bigbrother_samples_per_second": 34.83,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.4221380810440667,
+      "step": 16010
+    },
+    {
+      "epoch": 11.0,
+      "grad_norm": 0.9090811014175415,
+      "learning_rate": 7.425167892548769e-05,
+      "loss": 0.5266,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_rundkast_loss": 0.30149751901626587,
+      "eval_rundkast_runtime": 31.3393,
+      "eval_rundkast_samples_per_second": 42.917,
+      "eval_rundkast_steps_per_second": 1.372,
+      "eval_rundkast_wer": 0.13935730194082088,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_nb_samtale_loss": 0.4974854290485382,
+      "eval_nb_samtale_runtime": 35.6974,
+      "eval_nb_samtale_samples_per_second": 14.931,
+      "eval_nb_samtale_steps_per_second": 0.476,
+      "eval_nb_samtale_wer": 0.20947265625,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_BB_RUND_loss": 0.7534126043319702,
+      "eval_BB_RUND_runtime": 73.8118,
+      "eval_BB_RUND_samples_per_second": 36.783,
+      "eval_BB_RUND_steps_per_second": 1.152,
+      "eval_BB_RUND_wer": 0.2830898539123474,
+      "step": 17611
+    },
+    {
+      "epoch": 11.0,
+      "eval_bigbrother_loss": 1.1972620487213135,
+      "eval_bigbrother_runtime": 39.3175,
+      "eval_bigbrother_samples_per_second": 34.845,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.4285829372432128,
+      "step": 17611
+    },
+    {
+      "epoch": 12.0,
+      "grad_norm": 1.5719759464263916,
+      "learning_rate": 7.169331627758235e-05,
+      "loss": 0.5103,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_rundkast_loss": 0.2790067195892334,
+      "eval_rundkast_runtime": 31.604,
+      "eval_rundkast_samples_per_second": 42.558,
+      "eval_rundkast_steps_per_second": 1.361,
+      "eval_rundkast_wer": 0.13728921412663062,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_nb_samtale_loss": 0.47254645824432373,
+      "eval_nb_samtale_runtime": 36.6581,
+      "eval_nb_samtale_samples_per_second": 14.54,
+      "eval_nb_samtale_steps_per_second": 0.464,
+      "eval_nb_samtale_wer": 0.208740234375,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_BB_RUND_loss": 0.7001897096633911,
+      "eval_BB_RUND_runtime": 76.071,
+      "eval_BB_RUND_samples_per_second": 35.69,
+      "eval_BB_RUND_steps_per_second": 1.117,
+      "eval_BB_RUND_wer": 0.27512507504502703,
+      "step": 19212
+    },
+    {
+      "epoch": 12.0,
+      "eval_bigbrother_loss": 1.1136471033096313,
+      "eval_bigbrother_runtime": 39.6183,
+      "eval_bigbrother_samples_per_second": 34.58,
+      "eval_bigbrother_steps_per_second": 1.085,
+      "eval_bigbrother_wer": 0.41456537501007007,
+      "step": 19212
+    },
+    {
+      "epoch": 13.0,
+      "grad_norm": 1.0063461065292358,
+      "learning_rate": 6.913495362967701e-05,
+      "loss": 0.4968,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_rundkast_loss": 0.29398083686828613,
+      "eval_rundkast_runtime": 31.5607,
+      "eval_rundkast_samples_per_second": 42.616,
+      "eval_rundkast_steps_per_second": 1.362,
+      "eval_rundkast_wer": 0.1381641743557111,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_nb_samtale_loss": 0.4911497235298157,
+      "eval_nb_samtale_runtime": 36.0599,
+      "eval_nb_samtale_samples_per_second": 14.781,
+      "eval_nb_samtale_steps_per_second": 0.471,
+      "eval_nb_samtale_wer": 0.212158203125,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_BB_RUND_loss": 0.729911208152771,
+      "eval_BB_RUND_runtime": 74.2919,
+      "eval_BB_RUND_samples_per_second": 36.545,
+      "eval_BB_RUND_steps_per_second": 1.144,
+      "eval_BB_RUND_wer": 0.2774864918951371,
+      "step": 20813
+    },
+    {
+      "epoch": 13.0,
+      "eval_bigbrother_loss": 1.1584389209747314,
+      "eval_bigbrother_runtime": 39.483,
+      "eval_bigbrother_samples_per_second": 34.698,
+      "eval_bigbrother_steps_per_second": 1.089,
+      "eval_bigbrother_wer": 0.41786836381213244,
+      "step": 20813
+    },
+    {
+      "epoch": 14.0,
+      "grad_norm": 1.0339038372039795,
+      "learning_rate": 6.657499200511673e-05,
+      "loss": 0.4867,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_rundkast_loss": 0.2678089141845703,
+      "eval_rundkast_runtime": 31.9259,
+      "eval_rundkast_samples_per_second": 42.129,
+      "eval_rundkast_steps_per_second": 1.347,
+      "eval_rundkast_wer": 0.1390391345847916,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_nb_samtale_loss": 0.48425397276878357,
+      "eval_nb_samtale_runtime": 35.6709,
+      "eval_nb_samtale_samples_per_second": 14.942,
+      "eval_nb_samtale_steps_per_second": 0.477,
+      "eval_nb_samtale_wer": 0.21004231770833334,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_BB_RUND_loss": 0.6763830184936523,
+      "eval_BB_RUND_runtime": 75.1278,
+      "eval_BB_RUND_samples_per_second": 36.138,
+      "eval_BB_RUND_steps_per_second": 1.131,
+      "eval_BB_RUND_wer": 0.2732439463678207,
+      "step": 22414
+    },
+    {
+      "epoch": 14.0,
+      "eval_bigbrother_loss": 1.0772405862808228,
+      "eval_bigbrother_runtime": 39.3624,
+      "eval_bigbrother_samples_per_second": 34.805,
+      "eval_bigbrother_steps_per_second": 1.092,
+      "eval_bigbrother_wer": 0.408845565133328,
+      "step": 22414
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 0.5528441667556763,
+      "learning_rate": 6.401662935721138e-05,
+      "loss": 0.4721,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_rundkast_loss": 0.2952366769313812,
+      "eval_rundkast_runtime": 31.7087,
+      "eval_rundkast_samples_per_second": 42.417,
+      "eval_rundkast_steps_per_second": 1.356,
+      "eval_rundkast_wer": 0.1345847916003818,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_nb_samtale_loss": 0.48395708203315735,
+      "eval_nb_samtale_runtime": 35.8001,
+      "eval_nb_samtale_samples_per_second": 14.888,
+      "eval_nb_samtale_steps_per_second": 0.475,
+      "eval_nb_samtale_wer": 0.20865885416666666,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_BB_RUND_loss": 0.7274541854858398,
+      "eval_BB_RUND_runtime": 74.0948,
+      "eval_BB_RUND_samples_per_second": 36.642,
+      "eval_BB_RUND_steps_per_second": 1.147,
+      "eval_BB_RUND_wer": 0.269481689013408,
+      "step": 24015
+    },
+    {
+      "epoch": 15.0,
+      "eval_bigbrother_loss": 1.1518090963363647,
+      "eval_bigbrother_runtime": 39.2366,
+      "eval_bigbrother_samples_per_second": 34.916,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.4053008942237976,
+      "step": 24015
+    },
+    {
+      "epoch": 16.0,
+      "grad_norm": 0.9716380834579468,
+      "learning_rate": 6.14566677326511e-05,
+      "loss": 0.4626,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_rundkast_loss": 0.3125823736190796,
+      "eval_rundkast_runtime": 31.5106,
+      "eval_rundkast_samples_per_second": 42.684,
+      "eval_rundkast_steps_per_second": 1.365,
+      "eval_rundkast_wer": 0.13347120585427935,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_nb_samtale_loss": 0.5268623232841492,
+      "eval_nb_samtale_runtime": 35.7773,
+      "eval_nb_samtale_samples_per_second": 14.898,
+      "eval_nb_samtale_steps_per_second": 0.475,
+      "eval_nb_samtale_wer": 0.209228515625,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_BB_RUND_loss": 0.752697229385376,
+      "eval_BB_RUND_runtime": 75.4571,
+      "eval_BB_RUND_samples_per_second": 35.981,
+      "eval_BB_RUND_steps_per_second": 1.126,
+      "eval_BB_RUND_wer": 0.2700820492295377,
+      "step": 25616
+    },
+    {
+      "epoch": 16.0,
+      "eval_bigbrother_loss": 1.1851829290390015,
+      "eval_bigbrother_runtime": 39.3085,
+      "eval_bigbrother_samples_per_second": 34.853,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.4079593974059454,
+      "step": 25616
+    },
+    {
+      "epoch": 17.0,
+      "grad_norm": 1.0000524520874023,
+      "learning_rate": 5.889830508474577e-05,
+      "loss": 0.4554,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_rundkast_loss": 0.28784507513046265,
+      "eval_rundkast_runtime": 31.1375,
+      "eval_rundkast_samples_per_second": 43.196,
+      "eval_rundkast_steps_per_second": 1.381,
+      "eval_rundkast_wer": 0.13140311804008908,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_nb_samtale_loss": 0.47152796387672424,
+      "eval_nb_samtale_runtime": 35.203,
+      "eval_nb_samtale_samples_per_second": 15.141,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.20361328125,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_BB_RUND_loss": 0.705199122428894,
+      "eval_BB_RUND_runtime": 73.2232,
+      "eval_BB_RUND_samples_per_second": 37.078,
+      "eval_BB_RUND_steps_per_second": 1.161,
+      "eval_BB_RUND_wer": 0.2690814488693216,
+      "step": 27217
+    },
+    {
+      "epoch": 17.0,
+      "eval_bigbrother_loss": 1.1149847507476807,
+      "eval_bigbrother_runtime": 39.237,
+      "eval_bigbrother_samples_per_second": 34.916,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.40868444372834933,
+      "step": 27217
+    },
+    {
+      "epoch": 18.0,
+      "grad_norm": 0.8535083532333374,
+      "learning_rate": 5.6338343460185485e-05,
+      "loss": 0.4407,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_rundkast_loss": 0.29337021708488464,
+      "eval_rundkast_runtime": 31.587,
+      "eval_rundkast_samples_per_second": 42.581,
+      "eval_rundkast_steps_per_second": 1.361,
+      "eval_rundkast_wer": 0.13044861597200128,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_nb_samtale_loss": 0.5154338479042053,
+      "eval_nb_samtale_runtime": 35.5632,
+      "eval_nb_samtale_samples_per_second": 14.987,
+      "eval_nb_samtale_steps_per_second": 0.478,
+      "eval_nb_samtale_wer": 0.204345703125,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_BB_RUND_loss": 0.7406498789787292,
+      "eval_BB_RUND_runtime": 73.657,
+      "eval_BB_RUND_samples_per_second": 36.86,
+      "eval_BB_RUND_steps_per_second": 1.154,
+      "eval_BB_RUND_wer": 0.26812087252351413,
+      "step": 28818
+    },
+    {
+      "epoch": 18.0,
+      "eval_bigbrother_loss": 1.1797504425048828,
+      "eval_bigbrother_runtime": 38.9311,
+      "eval_bigbrother_samples_per_second": 35.19,
+      "eval_bigbrother_steps_per_second": 1.105,
+      "eval_bigbrother_wer": 0.40699266897607345,
+      "step": 28818
+    },
+    {
+      "epoch": 19.0,
+      "grad_norm": 4.492996692657471,
+      "learning_rate": 5.378157978893509e-05,
+      "loss": 0.4361,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_rundkast_loss": 0.2833118140697479,
+      "eval_rundkast_runtime": 31.0219,
+      "eval_rundkast_samples_per_second": 43.357,
+      "eval_rundkast_steps_per_second": 1.386,
+      "eval_rundkast_wer": 0.13219853643016227,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_nb_samtale_loss": 0.4991215765476227,
+      "eval_nb_samtale_runtime": 35.3186,
+      "eval_nb_samtale_samples_per_second": 15.091,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.20638020833333334,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_BB_RUND_loss": 0.7097201347351074,
+      "eval_BB_RUND_runtime": 73.7433,
+      "eval_BB_RUND_samples_per_second": 36.817,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.26451871122673604,
+      "step": 30419
+    },
+    {
+      "epoch": 19.0,
+      "eval_bigbrother_loss": 1.1280052661895752,
+      "eval_bigbrother_runtime": 38.9563,
+      "eval_bigbrother_samples_per_second": 35.168,
+      "eval_bigbrother_steps_per_second": 1.104,
+      "eval_bigbrother_wer": 0.39837267380971564,
+      "step": 30419
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 1.5283879041671753,
+      "learning_rate": 5.122161816437481e-05,
+      "loss": 0.4249,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_rundkast_loss": 0.309190571308136,
+      "eval_rundkast_runtime": 31.2274,
+      "eval_rundkast_samples_per_second": 43.071,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.13084632516703787,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_nb_samtale_loss": 0.49869558215141296,
+      "eval_nb_samtale_runtime": 35.2581,
+      "eval_nb_samtale_samples_per_second": 15.117,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.200927734375,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_BB_RUND_loss": 0.7553633451461792,
+      "eval_BB_RUND_runtime": 73.477,
+      "eval_BB_RUND_samples_per_second": 36.95,
+      "eval_BB_RUND_steps_per_second": 1.157,
+      "eval_BB_RUND_wer": 0.26575945567340403,
+      "step": 32020
+    },
+    {
+      "epoch": 20.0,
+      "eval_bigbrother_loss": 1.1935659646987915,
+      "eval_bigbrother_runtime": 39.2084,
+      "eval_bigbrother_samples_per_second": 34.941,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.40248126963667125,
+      "step": 32020
+    },
+    {
+      "epoch": 21.0,
+      "grad_norm": 0.824657142162323,
+      "learning_rate": 4.866165653981452e-05,
+      "loss": 0.4167,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_rundkast_loss": 0.3222857415676117,
+      "eval_rundkast_runtime": 31.2353,
+      "eval_rundkast_samples_per_second": 43.06,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.1296531975819281,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_nb_samtale_loss": 0.533822774887085,
+      "eval_nb_samtale_runtime": 35.2167,
+      "eval_nb_samtale_samples_per_second": 15.135,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.201171875,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_BB_RUND_loss": 0.7721800804138184,
+      "eval_BB_RUND_runtime": 73.7086,
+      "eval_BB_RUND_samples_per_second": 36.834,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.2623574144486692,
+      "step": 33621
+    },
+    {
+      "epoch": 21.0,
+      "eval_bigbrother_loss": 1.2132436037063599,
+      "eval_bigbrother_runtime": 39.1843,
+      "eval_bigbrother_samples_per_second": 34.963,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.39660033835495045,
+      "step": 33621
+    },
+    {
+      "epoch": 22.0,
+      "grad_norm": 1.1440060138702393,
+      "learning_rate": 4.6103293891909183e-05,
+      "loss": 0.4105,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_rundkast_loss": 0.31660783290863037,
+      "eval_rundkast_runtime": 31.6185,
+      "eval_rundkast_samples_per_second": 42.538,
+      "eval_rundkast_steps_per_second": 1.36,
+      "eval_rundkast_wer": 0.12893732103086222,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_nb_samtale_loss": 0.5133374929428101,
+      "eval_nb_samtale_runtime": 35.2449,
+      "eval_nb_samtale_samples_per_second": 15.123,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.20157877604166666,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_BB_RUND_loss": 0.7647114992141724,
+      "eval_BB_RUND_runtime": 73.4723,
+      "eval_BB_RUND_samples_per_second": 36.953,
+      "eval_BB_RUND_steps_per_second": 1.157,
+      "eval_BB_RUND_wer": 0.26255753452071245,
+      "step": 35222
+    },
+    {
+      "epoch": 22.0,
+      "eval_bigbrother_loss": 1.2045847177505493,
+      "eval_bigbrother_runtime": 39.0811,
+      "eval_bigbrother_samples_per_second": 35.055,
+      "eval_bigbrother_steps_per_second": 1.1,
+      "eval_bigbrother_wer": 0.39813099170224764,
+      "step": 35222
+    },
+    {
+      "epoch": 23.0,
+      "grad_norm": 1.2679944038391113,
+      "learning_rate": 4.354493124400384e-05,
+      "loss": 0.4077,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_rundkast_loss": 0.32336536049842834,
+      "eval_rundkast_runtime": 31.2205,
+      "eval_rundkast_samples_per_second": 43.081,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.13156220171810373,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_nb_samtale_loss": 0.5165642499923706,
+      "eval_nb_samtale_runtime": 35.3263,
+      "eval_nb_samtale_samples_per_second": 15.088,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.20035807291666666,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_BB_RUND_loss": 0.7570832967758179,
+      "eval_BB_RUND_runtime": 90.621,
+      "eval_BB_RUND_samples_per_second": 29.96,
+      "eval_BB_RUND_steps_per_second": 0.938,
+      "eval_BB_RUND_wer": 0.26323794276565937,
+      "step": 36823
+    },
+    {
+      "epoch": 23.0,
+      "eval_bigbrother_loss": 1.1831412315368652,
+      "eval_bigbrother_runtime": 39.2988,
+      "eval_bigbrother_samples_per_second": 34.861,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.3967614597599291,
+      "step": 36823
+    },
+    {
+      "epoch": 24.0,
+      "grad_norm": 6.380431175231934,
+      "learning_rate": 4.098496961944356e-05,
+      "loss": 0.4011,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_rundkast_loss": 0.3312782943248749,
+      "eval_rundkast_runtime": 31.4003,
+      "eval_rundkast_samples_per_second": 42.834,
+      "eval_rundkast_steps_per_second": 1.369,
+      "eval_rundkast_wer": 0.12853961183582566,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_nb_samtale_loss": 0.5143250823020935,
+      "eval_nb_samtale_runtime": 35.5114,
+      "eval_nb_samtale_samples_per_second": 15.009,
+      "eval_nb_samtale_steps_per_second": 0.479,
+      "eval_nb_samtale_wer": 0.19954427083333334,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_BB_RUND_loss": 0.7850114703178406,
+      "eval_BB_RUND_runtime": 74.2024,
+      "eval_BB_RUND_samples_per_second": 36.589,
+      "eval_BB_RUND_steps_per_second": 1.146,
+      "eval_BB_RUND_wer": 0.26135681408845307,
+      "step": 38424
+    },
+    {
+      "epoch": 24.0,
+      "eval_bigbrother_loss": 1.2299407720565796,
+      "eval_bigbrother_runtime": 39.2032,
+      "eval_bigbrother_samples_per_second": 34.946,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.39595585273503586,
+      "step": 38424
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 0.8889333009719849,
+      "learning_rate": 3.842660697153822e-05,
+      "loss": 0.3946,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_rundkast_loss": 0.3259143829345703,
+      "eval_rundkast_runtime": 31.2371,
+      "eval_rundkast_samples_per_second": 43.058,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.12822144447979636,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_nb_samtale_loss": 0.5260791778564453,
+      "eval_nb_samtale_runtime": 35.2592,
+      "eval_nb_samtale_samples_per_second": 15.117,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.19742838541666666,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_BB_RUND_loss": 0.7829692959785461,
+      "eval_BB_RUND_runtime": 96.3242,
+      "eval_BB_RUND_samples_per_second": 28.186,
+      "eval_BB_RUND_steps_per_second": 0.882,
+      "eval_BB_RUND_wer": 0.25939563738242943,
+      "step": 40025
+    },
+    {
+      "epoch": 25.0,
+      "eval_bigbrother_loss": 1.2314956188201904,
+      "eval_bigbrother_runtime": 39.2118,
+      "eval_bigbrother_samples_per_second": 34.938,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.3917666962055909,
+      "step": 40025
+    },
+    {
+      "epoch": 26.0,
+      "grad_norm": 2.6945877075195312,
+      "learning_rate": 3.5866645346977936e-05,
+      "loss": 0.3863,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_rundkast_loss": 0.3363383412361145,
+      "eval_rundkast_runtime": 31.3558,
+      "eval_rundkast_samples_per_second": 42.895,
+      "eval_rundkast_steps_per_second": 1.371,
+      "eval_rundkast_wer": 0.13124403436207446,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_nb_samtale_loss": 0.5427711009979248,
+      "eval_nb_samtale_runtime": 35.2067,
+      "eval_nb_samtale_samples_per_second": 15.139,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.20467122395833334,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_BB_RUND_loss": 0.8028616905212402,
+      "eval_BB_RUND_runtime": 73.6484,
+      "eval_BB_RUND_samples_per_second": 36.864,
+      "eval_BB_RUND_steps_per_second": 1.154,
+      "eval_BB_RUND_wer": 0.2621172703622173,
+      "step": 41626
+    },
+    {
+      "epoch": 26.0,
+      "eval_bigbrother_loss": 1.2609052658081055,
+      "eval_bigbrother_runtime": 39.2296,
+      "eval_bigbrother_samples_per_second": 34.923,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.39506968500765327,
+      "step": 41626
+    },
+    {
+      "epoch": 27.0,
+      "grad_norm": 0.7852900624275208,
+      "learning_rate": 3.330828269907259e-05,
+      "loss": 0.3799,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_rundkast_loss": 0.3347199857234955,
+      "eval_rundkast_runtime": 31.2946,
+      "eval_rundkast_samples_per_second": 42.979,
+      "eval_rundkast_steps_per_second": 1.374,
+      "eval_rundkast_wer": 0.12893732103086222,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_nb_samtale_loss": 0.5341453552246094,
+      "eval_nb_samtale_runtime": 35.3834,
+      "eval_nb_samtale_samples_per_second": 15.064,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.20328776041666666,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_BB_RUND_loss": 0.7905371189117432,
+      "eval_BB_RUND_runtime": 74.2226,
+      "eval_BB_RUND_samples_per_second": 36.579,
+      "eval_BB_RUND_steps_per_second": 1.145,
+      "eval_BB_RUND_wer": 0.25959575745447266,
+      "step": 43227
+    },
+    {
+      "epoch": 27.0,
+      "eval_bigbrother_loss": 1.2384859323501587,
+      "eval_bigbrother_runtime": 39.6106,
+      "eval_bigbrother_samples_per_second": 34.587,
+      "eval_bigbrother_steps_per_second": 1.086,
+      "eval_bigbrother_wer": 0.39192781761056955,
+      "step": 43227
+    },
+    {
+      "epoch": 28.0,
+      "grad_norm": 1.839573621749878,
+      "learning_rate": 3.074992005116725e-05,
+      "loss": 0.3782,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_rundkast_loss": 0.33070889115333557,
+      "eval_rundkast_runtime": 31.2558,
+      "eval_rundkast_samples_per_second": 43.032,
+      "eval_rundkast_steps_per_second": 1.376,
+      "eval_rundkast_wer": 0.12750556792873052,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_nb_samtale_loss": 0.5499075055122375,
+      "eval_nb_samtale_runtime": 35.4546,
+      "eval_nb_samtale_samples_per_second": 15.033,
+      "eval_nb_samtale_steps_per_second": 0.479,
+      "eval_nb_samtale_wer": 0.19881184895833334,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_BB_RUND_loss": 0.7748451232910156,
+      "eval_BB_RUND_runtime": 73.8572,
+      "eval_BB_RUND_samples_per_second": 36.76,
+      "eval_BB_RUND_steps_per_second": 1.151,
+      "eval_BB_RUND_wer": 0.25531318791274765,
+      "step": 44828
+    },
+    {
+      "epoch": 28.0,
+      "eval_bigbrother_loss": 1.2108979225158691,
+      "eval_bigbrother_runtime": 39.3441,
+      "eval_bigbrother_samples_per_second": 34.821,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.3849995971964876,
+      "step": 44828
+    },
+    {
+      "epoch": 29.0,
+      "grad_norm": 1.2005807161331177,
+      "learning_rate": 2.8189958426606973e-05,
+      "loss": 0.3729,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_rundkast_loss": 0.3197638690471649,
+      "eval_rundkast_runtime": 31.5545,
+      "eval_rundkast_samples_per_second": 42.625,
+      "eval_rundkast_steps_per_second": 1.363,
+      "eval_rundkast_wer": 0.12671014953865734,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_nb_samtale_loss": 0.5454243421554565,
+      "eval_nb_samtale_runtime": 35.43,
+      "eval_nb_samtale_samples_per_second": 15.044,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.19832356770833334,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_BB_RUND_loss": 0.7797754406929016,
+      "eval_BB_RUND_runtime": 73.7244,
+      "eval_BB_RUND_samples_per_second": 36.826,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.25567340404242545,
+      "step": 46429
+    },
+    {
+      "epoch": 29.0,
+      "eval_bigbrother_loss": 1.231561541557312,
+      "eval_bigbrother_runtime": 39.2468,
+      "eval_bigbrother_samples_per_second": 34.907,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.38620800773382746,
+      "step": 46429
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 1.4953359365463257,
+      "learning_rate": 2.562999680204669e-05,
+      "loss": 0.3718,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_rundkast_loss": 0.33351558446884155,
+      "eval_rundkast_runtime": 31.2627,
+      "eval_rundkast_samples_per_second": 43.023,
+      "eval_rundkast_steps_per_second": 1.375,
+      "eval_rundkast_wer": 0.12830098631880368,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_nb_samtale_loss": 0.5619927048683167,
+      "eval_nb_samtale_runtime": 35.2849,
+      "eval_nb_samtale_samples_per_second": 15.106,
+      "eval_nb_samtale_steps_per_second": 0.482,
+      "eval_nb_samtale_wer": 0.19986979166666666,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_BB_RUND_loss": 0.7934340238571167,
+      "eval_BB_RUND_runtime": 74.4083,
+      "eval_BB_RUND_samples_per_second": 36.488,
+      "eval_BB_RUND_steps_per_second": 1.142,
+      "eval_BB_RUND_wer": 0.25839503702221334,
+      "step": 48030
+    },
+    {
+      "epoch": 30.0,
+      "eval_bigbrother_loss": 1.2452094554901123,
+      "eval_bigbrother_runtime": 39.1955,
+      "eval_bigbrother_samples_per_second": 34.953,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.39071940707322966,
+      "step": 48030
+    },
+    {
+      "epoch": 31.0,
+      "grad_norm": 2.022852659225464,
+      "learning_rate": 2.307163415414135e-05,
+      "loss": 0.3648,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_rundkast_loss": 0.32245931029319763,
+      "eval_rundkast_runtime": 31.3953,
+      "eval_rundkast_samples_per_second": 42.841,
+      "eval_rundkast_steps_per_second": 1.37,
+      "eval_rundkast_wer": 0.1252783964365256,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_nb_samtale_loss": 0.547818660736084,
+      "eval_nb_samtale_runtime": 35.3829,
+      "eval_nb_samtale_samples_per_second": 15.064,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.19913736979166666,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_BB_RUND_loss": 0.7814807295799255,
+      "eval_BB_RUND_runtime": 74.2777,
+      "eval_BB_RUND_samples_per_second": 36.552,
+      "eval_BB_RUND_steps_per_second": 1.144,
+      "eval_BB_RUND_wer": 0.25687412447468483,
+      "step": 49631
+    },
+    {
+      "epoch": 31.0,
+      "eval_bigbrother_loss": 1.232583999633789,
+      "eval_bigbrother_runtime": 39.2964,
+      "eval_bigbrother_samples_per_second": 34.863,
+      "eval_bigbrother_steps_per_second": 1.094,
+      "eval_bigbrother_wer": 0.3895915572383791,
+      "step": 49631
+    },
+    {
+      "epoch": 32.0,
+      "grad_norm": 1.159850001335144,
+      "learning_rate": 2.051327150623601e-05,
+      "loss": 0.3556,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_rundkast_loss": 0.33501243591308594,
+      "eval_rundkast_runtime": 31.2712,
+      "eval_rundkast_samples_per_second": 43.011,
+      "eval_rundkast_steps_per_second": 1.375,
+      "eval_rundkast_wer": 0.12623289850461342,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_nb_samtale_loss": 0.5665200352668762,
+      "eval_nb_samtale_runtime": 35.0524,
+      "eval_nb_samtale_samples_per_second": 15.206,
+      "eval_nb_samtale_steps_per_second": 0.485,
+      "eval_nb_samtale_wer": 0.19685872395833334,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_BB_RUND_loss": 0.8201074004173279,
+      "eval_BB_RUND_runtime": 73.6889,
+      "eval_BB_RUND_samples_per_second": 36.844,
+      "eval_BB_RUND_steps_per_second": 1.153,
+      "eval_BB_RUND_wer": 0.2548328997398439,
+      "step": 51232
+    },
+    {
+      "epoch": 32.0,
+      "eval_bigbrother_loss": 1.296426773071289,
+      "eval_bigbrother_runtime": 39.3283,
+      "eval_bigbrother_samples_per_second": 34.835,
+      "eval_bigbrother_steps_per_second": 1.093,
+      "eval_bigbrother_wer": 0.3852412793039555,
+      "step": 51232
+    },
+    {
+      "epoch": 33.0,
+      "grad_norm": 4.668502330780029,
+      "learning_rate": 1.7954908858330668e-05,
+      "loss": 0.3533,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_rundkast_loss": 0.33790138363838196,
+      "eval_rundkast_runtime": 31.5957,
+      "eval_rundkast_samples_per_second": 42.569,
+      "eval_rundkast_steps_per_second": 1.361,
+      "eval_rundkast_wer": 0.12623289850461342,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_nb_samtale_loss": 0.5643696784973145,
+      "eval_nb_samtale_runtime": 35.3499,
+      "eval_nb_samtale_samples_per_second": 15.078,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.19669596354166666,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_BB_RUND_loss": 0.8017848134040833,
+      "eval_BB_RUND_runtime": 74.5846,
+      "eval_BB_RUND_samples_per_second": 36.402,
+      "eval_BB_RUND_steps_per_second": 1.14,
+      "eval_BB_RUND_wer": 0.2553532119271563,
+      "step": 52833
+    },
+    {
+      "epoch": 33.0,
+      "eval_bigbrother_loss": 1.2571812868118286,
+      "eval_bigbrother_runtime": 38.9999,
+      "eval_bigbrother_samples_per_second": 35.128,
+      "eval_bigbrother_steps_per_second": 1.103,
+      "eval_bigbrother_wer": 0.38508015789897687,
+      "step": 52833
+    },
+    {
+      "epoch": 34.0,
+      "grad_norm": 1.0839606523513794,
+      "learning_rate": 1.5394947233770386e-05,
+      "loss": 0.3524,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_rundkast_loss": 0.3482387959957123,
+      "eval_rundkast_runtime": 31.231,
+      "eval_rundkast_samples_per_second": 43.066,
+      "eval_rundkast_steps_per_second": 1.377,
+      "eval_rundkast_wer": 0.12496022908049634,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_nb_samtale_loss": 0.5782368779182434,
+      "eval_nb_samtale_runtime": 35.115,
+      "eval_nb_samtale_samples_per_second": 15.179,
+      "eval_nb_samtale_steps_per_second": 0.484,
+      "eval_nb_samtale_wer": 0.19881184895833334,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_BB_RUND_loss": 0.8167536854743958,
+      "eval_BB_RUND_runtime": 73.4659,
+      "eval_BB_RUND_samples_per_second": 36.956,
+      "eval_BB_RUND_steps_per_second": 1.157,
+      "eval_BB_RUND_wer": 0.2524314588753252,
+      "step": 54434
+    },
+    {
+      "epoch": 34.0,
+      "eval_bigbrother_loss": 1.2767822742462158,
+      "eval_bigbrother_runtime": 39.0487,
+      "eval_bigbrother_samples_per_second": 35.084,
+      "eval_bigbrother_steps_per_second": 1.101,
+      "eval_bigbrother_wer": 0.38121324417948926,
+      "step": 54434
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 1.376759648323059,
+      "learning_rate": 1.2836584585865047e-05,
+      "loss": 0.3499,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_rundkast_loss": 0.3501284718513489,
+      "eval_rundkast_runtime": 32.4165,
+      "eval_rundkast_samples_per_second": 41.491,
+      "eval_rundkast_steps_per_second": 1.326,
+      "eval_rundkast_wer": 0.12575564747056953,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_nb_samtale_loss": 0.5841984152793884,
+      "eval_nb_samtale_runtime": 35.425,
+      "eval_nb_samtale_samples_per_second": 15.046,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.1982421875,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_BB_RUND_loss": 0.8236829042434692,
+      "eval_BB_RUND_runtime": 74.6418,
+      "eval_BB_RUND_samples_per_second": 36.374,
+      "eval_BB_RUND_steps_per_second": 1.139,
+      "eval_BB_RUND_wer": 0.25203121873123874,
+      "step": 56035
+    },
+    {
+      "epoch": 35.0,
+      "eval_bigbrother_loss": 1.2888648509979248,
+      "eval_bigbrother_runtime": 39.2027,
+      "eval_bigbrother_samples_per_second": 34.947,
+      "eval_bigbrother_steps_per_second": 1.097,
+      "eval_bigbrother_wer": 0.38008539434463867,
+      "step": 56035
+    },
+    {
+      "epoch": 36.0,
+      "grad_norm": 1.6304969787597656,
+      "learning_rate": 1.0276622961304766e-05,
+      "loss": 0.349,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_rundkast_loss": 0.3395073413848877,
+      "eval_rundkast_runtime": 31.3594,
+      "eval_rundkast_samples_per_second": 42.89,
+      "eval_rundkast_steps_per_second": 1.371,
+      "eval_rundkast_wer": 0.12583518930957685,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_nb_samtale_loss": 0.5508641004562378,
+      "eval_nb_samtale_runtime": 35.3876,
+      "eval_nb_samtale_samples_per_second": 15.062,
+      "eval_nb_samtale_steps_per_second": 0.48,
+      "eval_nb_samtale_wer": 0.198974609375,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_BB_RUND_loss": 0.7999393939971924,
+      "eval_BB_RUND_runtime": 73.6053,
+      "eval_BB_RUND_samples_per_second": 36.886,
+      "eval_BB_RUND_steps_per_second": 1.155,
+      "eval_BB_RUND_wer": 0.25139083450070043,
+      "step": 57636
+    },
+    {
+      "epoch": 36.0,
+      "eval_bigbrother_loss": 1.2519750595092773,
+      "eval_bigbrother_runtime": 38.9721,
+      "eval_bigbrother_samples_per_second": 35.153,
+      "eval_bigbrother_steps_per_second": 1.103,
+      "eval_bigbrother_wer": 0.3781519374848949,
+      "step": 57636
+    },
+    {
+      "epoch": 37.0,
+      "grad_norm": 0.9431388974189758,
+      "learning_rate": 7.718260313399425e-06,
+      "loss": 0.3443,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_rundkast_loss": 0.3431856632232666,
+      "eval_rundkast_runtime": 32.1917,
+      "eval_rundkast_samples_per_second": 41.781,
+      "eval_rundkast_steps_per_second": 1.336,
+      "eval_rundkast_wer": 0.12440343620744512,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_nb_samtale_loss": 0.5509617924690247,
+      "eval_nb_samtale_runtime": 35.3455,
+      "eval_nb_samtale_samples_per_second": 15.08,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.19669596354166666,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_BB_RUND_loss": 0.8117216229438782,
+      "eval_BB_RUND_runtime": 75.5514,
+      "eval_BB_RUND_samples_per_second": 35.936,
+      "eval_BB_RUND_steps_per_second": 1.125,
+      "eval_BB_RUND_wer": 0.2507504502701621,
+      "step": 59237
+    },
+    {
+      "epoch": 37.0,
+      "eval_bigbrother_loss": 1.272763729095459,
+      "eval_bigbrother_runtime": 39.4053,
+      "eval_bigbrother_samples_per_second": 34.767,
+      "eval_bigbrother_steps_per_second": 1.091,
+      "eval_bigbrother_wer": 0.3785547409973415,
+      "step": 59237
+    },
+    {
+      "epoch": 38.0,
+      "grad_norm": 0.7018219232559204,
+      "learning_rate": 5.158298688839143e-06,
+      "loss": 0.3417,
+      "step": 60838
+    },
+    {
+      "epoch": 38.0,
+      "eval_rundkast_loss": 0.3419778645038605,
+      "eval_rundkast_runtime": 31.3896,
+      "eval_rundkast_samples_per_second": 42.849,
+      "eval_rundkast_steps_per_second": 1.37,
+      "eval_rundkast_wer": 0.12376710149538657,
+      "step": 60838
+    },
+    {
+      "epoch": 38.0,
+      "eval_nb_samtale_loss": 0.5525389909744263,
+      "eval_nb_samtale_runtime": 35.2018,
+      "eval_nb_samtale_samples_per_second": 15.141,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.19669596354166666,
+      "step": 60838
+    },
+    {
+      "epoch": 38.0,
+      "eval_BB_RUND_loss": 0.8073983192443848,
+      "eval_BB_RUND_runtime": 73.835,
+      "eval_BB_RUND_samples_per_second": 36.771,
+      "eval_BB_RUND_steps_per_second": 1.151,
+      "eval_BB_RUND_wer": 0.250870522313388,
+      "step": 60838
+    },
+    {
+      "epoch": 38.0,
+      "eval_bigbrother_loss": 1.2644871473312378,
+      "eval_bigbrother_runtime": 39.1416,
+      "eval_bigbrother_samples_per_second": 35.001,
+      "eval_bigbrother_steps_per_second": 1.099,
+      "eval_bigbrother_wer": 0.3788769838072988,
+      "step": 60838
+    },
+    {
+      "epoch": 39.0,
+      "grad_norm": 2.0295908451080322,
+      "learning_rate": 2.5999360409338027e-06,
+      "loss": 0.3442,
+      "step": 62439
+    },
+    {
+      "epoch": 39.0,
+      "eval_rundkast_loss": 0.3452610671520233,
+      "eval_rundkast_runtime": 32.4113,
+      "eval_rundkast_samples_per_second": 41.498,
+      "eval_rundkast_steps_per_second": 1.327,
+      "eval_rundkast_wer": 0.12376710149538657,
+      "step": 62439
+    },
+    {
+      "epoch": 39.0,
+      "eval_nb_samtale_loss": 0.5602259039878845,
+      "eval_nb_samtale_runtime": 35.342,
+      "eval_nb_samtale_samples_per_second": 15.081,
+      "eval_nb_samtale_steps_per_second": 0.481,
+      "eval_nb_samtale_wer": 0.195556640625,
+      "step": 62439
+    },
+    {
+      "epoch": 39.0,
+      "eval_BB_RUND_loss": 0.8162434101104736,
+      "eval_BB_RUND_runtime": 75.0912,
+      "eval_BB_RUND_samples_per_second": 36.156,
+      "eval_BB_RUND_steps_per_second": 1.132,
+      "eval_BB_RUND_wer": 0.2508304982989794,
+      "step": 62439
+    },
+    {
+      "epoch": 39.0,
+      "eval_bigbrother_loss": 1.2785000801086426,
+      "eval_bigbrother_runtime": 39.2508,
+      "eval_bigbrother_samples_per_second": 34.904,
+      "eval_bigbrother_steps_per_second": 1.096,
+      "eval_bigbrother_wer": 0.37903810521227743,
+      "step": 62439
+    },
+    {
+      "epoch": 40.0,
+      "grad_norm": 0.7962198257446289,
+      "learning_rate": 4.1573393028461783e-08,
+      "loss": 0.341,
+      "step": 64040
+    },
+    {
+      "epoch": 40.0,
+      "eval_rundkast_loss": 0.3451217710971832,
+      "eval_rundkast_runtime": 31.3475,
+      "eval_rundkast_samples_per_second": 42.906,
+      "eval_rundkast_steps_per_second": 1.372,
+      "eval_rundkast_wer": 0.12368755965637926,
+      "step": 64040
+    },
+    {
+      "epoch": 40.0,
+      "eval_nb_samtale_loss": 0.561275839805603,
+      "eval_nb_samtale_runtime": 35.2131,
+      "eval_nb_samtale_samples_per_second": 15.136,
+      "eval_nb_samtale_steps_per_second": 0.483,
+      "eval_nb_samtale_wer": 0.19588216145833334,
+      "step": 64040
+    },
+    {
+      "epoch": 40.0,
+      "eval_BB_RUND_loss": 0.8131784796714783,
+      "eval_BB_RUND_runtime": 74.2866,
+      "eval_BB_RUND_samples_per_second": 36.548,
+      "eval_BB_RUND_steps_per_second": 1.144,
+      "eval_BB_RUND_wer": 0.2511907144286572,
+      "step": 64040
+    },
+    {
+      "epoch": 40.0,
+      "eval_bigbrother_loss": 1.2729395627975464,
+      "eval_bigbrother_runtime": 39.0913,
+      "eval_bigbrother_samples_per_second": 35.046,
+      "eval_bigbrother_steps_per_second": 1.1,
+      "eval_bigbrother_wer": 0.3802465157496173,
+      "step": 64040
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 64040,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 40,
+  "save_steps": 500,
+  "total_flos": 3.314074430916319e+20,
+  "train_batch_size": 48,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-64040/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b25133bdb24b039668b926e9e3f9c4343b5002d30a14ff9ac158220672a6f871
+size 4984

config.json ADDED Viewed

	@@ -0,0 +1,116 @@

+{
+  "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
+  "activation_dropout": 0.055,
+  "adapter_attn_dim": null,
+  "adapter_kernel_size": 3,
+  "adapter_stride": 2,
+  "add_adapter": false,
+  "apply_spec_augment": true,
+  "architectures": [
+    "Wav2Vec2ForCTC"
+  ],
+  "attention_dropout": 0.094,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 768,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": true,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "mean",
+  "ctc_zero_infinity": true,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": true,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_dropout": 0.0,
+  "feat_extract_norm": "layer",
+  "feat_proj_dropout": 0.04,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.047,
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.041,
+  "mask_channel_length": 10,
+  "mask_channel_min_space": 1,
+  "mask_channel_other": 0.0,
+  "mask_channel_prob": 0.0,
+  "mask_channel_selection": "static",
+  "mask_feature_length": 64,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.25,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_min_space": 1,
+  "mask_time_other": 0.0,
+  "mask_time_prob": 0.082,
+  "mask_time_selection": "static",
+  "model_type": "wav2vec2",
+  "num_adapter_layers": 3,
+  "num_attention_heads": 16,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 24,
+  "num_negatives": 100,
+  "output_hidden_size": 1024,
+  "pad_token_id": 31,
+  "proj_codevector_dim": 768,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 34,
+  "xvector_output_dim": 512
+}

language_model/5gram.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b41c24c63f2f0585bea83666369593f3b3e6d047f327a90f36ebca2c35ef0ff
+size 4243671427

language_model/attrs.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"alpha": 0.5, "beta": 0.1, "unk_score_offset": -10.0, "score_boundary": true}

language_model/unigrams.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ac3e71ca49838ca355df6fdcb8d89344a5a9bf9e1a76587cdf5df1367c19b9a9
+size 16759269

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f1b72a8661985e694d6249ad4fdebdffc86644e0140a80ac60f082cfeac4024
+size 1261946880

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "processor_class": "Wav2Vec2ProcessorWithLM",
+  "return_attention_mask": true,
+  "sampling_rate": 16000
+}

runs/May30_23-02-47_idun-04-08/events.out.tfevents.1717104232.idun-04-08.1448637.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7db8a40bdbd50fbbe4cba63ee7d8049f7adf2cd8fd8952b7aa9bb4d847bb341e
+size 74721

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "pad_token": "[PAD]",
+  "unk_token": "[UNK]"
+}

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "added_tokens_decoder": {
+    "30": {
+      "content": "[UNK]",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": true,
+      "single_word": false,
+      "special": false
+    },
+    "31": {
+      "content": "[PAD]",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": true,
+      "single_word": false,
+      "special": false
+    },
+    "32": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "33": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "do_lower_case": false,
+  "eos_token": "</s>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "replace_word_delimiter_char": " ",
+  "target_lang": null,
+  "tokenizer_class": "Wav2Vec2CTCTokenizer",
+  "unk_token": "[UNK]",
+  "word_delimiter_token": "|"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b25133bdb24b039668b926e9e3f9c4343b5002d30a14ff9ac158220672a6f871
+size 4984

vocab.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "[PAD]": 31,
+  "[UNK]": 30,
+  "a": 1,
+  "b": 2,
+  "c": 3,
+  "d": 4,
+  "e": 5,
+  "f": 6,
+  "g": 7,
+  "h": 8,
+  "i": 9,
+  "j": 10,
+  "k": 11,
+  "l": 12,
+  "m": 13,
+  "n": 14,
+  "o": 15,
+  "p": 16,
+  "q": 17,
+  "r": 18,
+  "s": 19,
+  "t": 20,
+  "u": 21,
+  "v": 22,
+  "w": 23,
+  "x": 24,
+  "y": 25,
+  "z": 26,
+  "|": 0,
+  "å": 27,
+  "æ": 28,
+  "ø": 29
+}