Tflatval committed on
Commit
29f5e83
1 Parent(s): 3328607

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ language_model/unigrams.txt filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "</s>": 33,
3
+ "<s>": 32
4
+ }
alphabet.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e5", "\u00e6", "\u00f8" ,"\u2047", "", "<s>", "</s>"], "is_bpe": false}
checkpoint-65871/config.json ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
3
+ "activation_dropout": 0.055,
4
+ "adapter_attn_dim": null,
5
+ "adapter_kernel_size": 3,
6
+ "adapter_stride": 2,
7
+ "add_adapter": false,
8
+ "apply_spec_augment": true,
9
+ "architectures": [
10
+ "Wav2Vec2ForCTC"
11
+ ],
12
+ "attention_dropout": 0.094,
13
+ "bos_token_id": 1,
14
+ "classifier_proj_size": 256,
15
+ "codevector_dim": 768,
16
+ "contrastive_logits_temperature": 0.1,
17
+ "conv_bias": true,
18
+ "conv_dim": [
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512,
25
+ 512
26
+ ],
27
+ "conv_kernel": [
28
+ 10,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 3,
33
+ 2,
34
+ 2
35
+ ],
36
+ "conv_stride": [
37
+ 5,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2,
43
+ 2
44
+ ],
45
+ "ctc_loss_reduction": "mean",
46
+ "ctc_zero_infinity": true,
47
+ "diversity_loss_weight": 0.1,
48
+ "do_stable_layer_norm": true,
49
+ "eos_token_id": 2,
50
+ "feat_extract_activation": "gelu",
51
+ "feat_extract_dropout": 0.0,
52
+ "feat_extract_norm": "layer",
53
+ "feat_proj_dropout": 0.04,
54
+ "feat_quantizer_dropout": 0.0,
55
+ "final_dropout": 0.0,
56
+ "hidden_act": "gelu",
57
+ "hidden_dropout": 0.047,
58
+ "hidden_size": 1024,
59
+ "initializer_range": 0.02,
60
+ "intermediate_size": 4096,
61
+ "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.041,
63
+ "mask_channel_length": 10,
64
+ "mask_channel_min_space": 1,
65
+ "mask_channel_other": 0.0,
66
+ "mask_channel_prob": 0.0,
67
+ "mask_channel_selection": "static",
68
+ "mask_feature_length": 64,
69
+ "mask_feature_min_masks": 0,
70
+ "mask_feature_prob": 0.25,
71
+ "mask_time_length": 10,
72
+ "mask_time_min_masks": 2,
73
+ "mask_time_min_space": 1,
74
+ "mask_time_other": 0.0,
75
+ "mask_time_prob": 0.082,
76
+ "mask_time_selection": "static",
77
+ "model_type": "wav2vec2",
78
+ "num_adapter_layers": 3,
79
+ "num_attention_heads": 16,
80
+ "num_codevector_groups": 2,
81
+ "num_codevectors_per_group": 320,
82
+ "num_conv_pos_embedding_groups": 16,
83
+ "num_conv_pos_embeddings": 128,
84
+ "num_feat_extract_layers": 7,
85
+ "num_hidden_layers": 24,
86
+ "num_negatives": 100,
87
+ "output_hidden_size": 1024,
88
+ "pad_token_id": 31,
89
+ "proj_codevector_dim": 768,
90
+ "tdnn_dilation": [
91
+ 1,
92
+ 2,
93
+ 3,
94
+ 1,
95
+ 1
96
+ ],
97
+ "tdnn_dim": [
98
+ 512,
99
+ 512,
100
+ 512,
101
+ 512,
102
+ 1500
103
+ ],
104
+ "tdnn_kernel": [
105
+ 5,
106
+ 3,
107
+ 3,
108
+ 1,
109
+ 1
110
+ ],
111
+ "torch_dtype": "float32",
112
+ "transformers_version": "4.38.1",
113
+ "use_weighted_layer_sum": false,
114
+ "vocab_size": 34,
115
+ "xvector_output_dim": 512
116
+ }
checkpoint-65871/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6f2cb9759090ff3e4f9ed9a8800e2008d2c3ca13063af3457dea658c88a0b1a
3
+ size 1261946880
checkpoint-65871/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10263e0e1d8ba434df3cad1ccad26c2dde097656e3cd954e7d0eb9f26aa80ef6
3
+ size 2490438582
checkpoint-65871/preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "processor_class": "Wav2Vec2ProcessorWithLM",
8
+ "return_attention_mask": true,
9
+ "sampling_rate": 16000
10
+ }
checkpoint-65871/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:838ef37a988d80a33b67380e4197e8fd92eabfc665f59d1401eee6787873b549
3
+ size 14244
checkpoint-65871/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42b41e6855efa3a52786891fb57f47ab6782d9c03141030a4fb4f037b4f4bde6
3
+ size 1064
checkpoint-65871/trainer_state.json ADDED
@@ -0,0 +1,1698 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.22021302283154026,
3
+ "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/Combined/BB-NB-RUND/30.05/checkpoint-65871",
4
+ "epoch": 39.0,
5
+ "eval_steps": 500,
6
+ "global_step": 65871,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 5.23741340637207,
14
+ "learning_rate": 9.971692400847715e-05,
15
+ "loss": 0.9222,
16
+ "step": 1689
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_bigbrother_loss": 1.5889759063720703,
21
+ "eval_bigbrother_runtime": 41.228,
22
+ "eval_bigbrother_samples_per_second": 33.23,
23
+ "eval_bigbrother_steps_per_second": 1.043,
24
+ "eval_bigbrother_wer": 0.5449931523402884,
25
+ "step": 1689
26
+ },
27
+ {
28
+ "epoch": 1.0,
29
+ "eval_BB_NB_RUND_loss": 0.9018728137016296,
30
+ "eval_BB_NB_RUND_runtime": 133.4774,
31
+ "eval_BB_NB_RUND_samples_per_second": 24.334,
32
+ "eval_BB_NB_RUND_steps_per_second": 0.764,
33
+ "eval_BB_NB_RUND_wer": 0.32291471038016795,
34
+ "step": 1689
35
+ },
36
+ {
37
+ "epoch": 1.0,
38
+ "eval_rundkast_loss": 0.3399111032485962,
39
+ "eval_rundkast_runtime": 32.978,
40
+ "eval_rundkast_samples_per_second": 40.785,
41
+ "eval_rundkast_steps_per_second": 1.304,
42
+ "eval_rundkast_wer": 0.1885937002863506,
43
+ "step": 1689
44
+ },
45
+ {
46
+ "epoch": 1.0,
47
+ "eval_nb_samtale_loss": 0.5534453988075256,
48
+ "eval_nb_samtale_runtime": 38.0417,
49
+ "eval_nb_samtale_samples_per_second": 14.011,
50
+ "eval_nb_samtale_steps_per_second": 0.447,
51
+ "eval_nb_samtale_wer": 0.235595703125,
52
+ "step": 1689
53
+ },
54
+ {
55
+ "epoch": 2.0,
56
+ "grad_norm": 3.7305831909179688,
57
+ "learning_rate": 9.716167120799274e-05,
58
+ "loss": 0.7821,
59
+ "step": 3378
60
+ },
61
+ {
62
+ "epoch": 2.0,
63
+ "eval_bigbrother_loss": 1.4070501327514648,
64
+ "eval_bigbrother_runtime": 41.1443,
65
+ "eval_bigbrother_samples_per_second": 33.297,
66
+ "eval_bigbrother_steps_per_second": 1.045,
67
+ "eval_bigbrother_wer": 0.510271489567389,
68
+ "step": 3378
69
+ },
70
+ {
71
+ "epoch": 2.0,
72
+ "eval_BB_NB_RUND_loss": 0.8076683282852173,
73
+ "eval_BB_NB_RUND_runtime": 129.6259,
74
+ "eval_BB_NB_RUND_samples_per_second": 25.057,
75
+ "eval_BB_NB_RUND_steps_per_second": 0.787,
76
+ "eval_BB_NB_RUND_wer": 0.30147828186623027,
77
+ "step": 3378
78
+ },
79
+ {
80
+ "epoch": 2.0,
81
+ "eval_rundkast_loss": 0.317608118057251,
82
+ "eval_rundkast_runtime": 32.5347,
83
+ "eval_rundkast_samples_per_second": 41.34,
84
+ "eval_rundkast_steps_per_second": 1.322,
85
+ "eval_rundkast_wer": 0.16775373846643335,
86
+ "step": 3378
87
+ },
88
+ {
89
+ "epoch": 2.0,
90
+ "eval_nb_samtale_loss": 0.5036561489105225,
91
+ "eval_nb_samtale_runtime": 37.1369,
92
+ "eval_nb_samtale_samples_per_second": 14.352,
93
+ "eval_nb_samtale_steps_per_second": 0.458,
94
+ "eval_nb_samtale_wer": 0.22639973958333334,
95
+ "step": 3378
96
+ },
97
+ {
98
+ "epoch": 3.0,
99
+ "grad_norm": 4.790787696838379,
100
+ "learning_rate": 9.460490463215258e-05,
101
+ "loss": 0.7185,
102
+ "step": 5067
103
+ },
104
+ {
105
+ "epoch": 3.0,
106
+ "eval_bigbrother_loss": 1.203812837600708,
107
+ "eval_bigbrother_runtime": 41.1237,
108
+ "eval_bigbrother_samples_per_second": 33.314,
109
+ "eval_bigbrother_steps_per_second": 1.046,
110
+ "eval_bigbrother_wer": 0.49714009506162893,
111
+ "step": 5067
112
+ },
113
+ {
114
+ "epoch": 3.0,
115
+ "eval_BB_NB_RUND_loss": 0.6942233443260193,
116
+ "eval_BB_NB_RUND_runtime": 132.6472,
117
+ "eval_BB_NB_RUND_samples_per_second": 24.486,
118
+ "eval_BB_NB_RUND_steps_per_second": 0.769,
119
+ "eval_BB_NB_RUND_wer": 0.2955222278861374,
120
+ "step": 5067
121
+ },
122
+ {
123
+ "epoch": 3.0,
124
+ "eval_rundkast_loss": 0.27395445108413696,
125
+ "eval_rundkast_runtime": 32.6467,
126
+ "eval_rundkast_samples_per_second": 41.199,
127
+ "eval_rundkast_steps_per_second": 1.317,
128
+ "eval_rundkast_wer": 0.16481069042316257,
129
+ "step": 5067
130
+ },
131
+ {
132
+ "epoch": 3.0,
133
+ "eval_nb_samtale_loss": 0.44476863741874695,
134
+ "eval_nb_samtale_runtime": 37.2129,
135
+ "eval_nb_samtale_samples_per_second": 14.323,
136
+ "eval_nb_samtale_steps_per_second": 0.457,
137
+ "eval_nb_samtale_wer": 0.225830078125,
138
+ "step": 5067
139
+ },
140
+ {
141
+ "epoch": 4.0,
142
+ "grad_norm": 4.615499496459961,
143
+ "learning_rate": 9.204965183166818e-05,
144
+ "loss": 0.6788,
145
+ "step": 6756
146
+ },
147
+ {
148
+ "epoch": 4.0,
149
+ "eval_bigbrother_loss": 1.1682614088058472,
150
+ "eval_bigbrother_runtime": 41.2735,
151
+ "eval_bigbrother_samples_per_second": 33.193,
152
+ "eval_bigbrother_steps_per_second": 1.042,
153
+ "eval_bigbrother_wer": 0.46934665270281156,
154
+ "step": 6756
155
+ },
156
+ {
157
+ "epoch": 4.0,
158
+ "eval_BB_NB_RUND_loss": 0.6765461564064026,
159
+ "eval_BB_NB_RUND_runtime": 128.689,
160
+ "eval_BB_NB_RUND_samples_per_second": 25.239,
161
+ "eval_BB_NB_RUND_steps_per_second": 0.793,
162
+ "eval_BB_NB_RUND_wer": 0.27942478469669735,
163
+ "step": 6756
164
+ },
165
+ {
166
+ "epoch": 4.0,
167
+ "eval_rundkast_loss": 0.2691804766654968,
168
+ "eval_rundkast_runtime": 32.6511,
169
+ "eval_rundkast_samples_per_second": 41.193,
170
+ "eval_rundkast_steps_per_second": 1.317,
171
+ "eval_rundkast_wer": 0.15566337893732102,
172
+ "step": 6756
173
+ },
174
+ {
175
+ "epoch": 4.0,
176
+ "eval_nb_samtale_loss": 0.4400266706943512,
177
+ "eval_nb_samtale_runtime": 37.139,
178
+ "eval_nb_samtale_samples_per_second": 14.351,
179
+ "eval_nb_samtale_steps_per_second": 0.458,
180
+ "eval_nb_samtale_wer": 0.21329752604166666,
181
+ "step": 6756
182
+ },
183
+ {
184
+ "epoch": 5.0,
185
+ "grad_norm": 5.309389591217041,
186
+ "learning_rate": 8.949288525582804e-05,
187
+ "loss": 0.6442,
188
+ "step": 8445
189
+ },
190
+ {
191
+ "epoch": 5.0,
192
+ "eval_bigbrother_loss": 1.163558006286621,
193
+ "eval_bigbrother_runtime": 41.5596,
194
+ "eval_bigbrother_samples_per_second": 32.965,
195
+ "eval_bigbrother_steps_per_second": 1.035,
196
+ "eval_bigbrother_wer": 0.46080721823894305,
197
+ "step": 8445
198
+ },
199
+ {
200
+ "epoch": 5.0,
201
+ "eval_BB_NB_RUND_loss": 0.6712897419929504,
202
+ "eval_BB_NB_RUND_runtime": 199.5442,
203
+ "eval_BB_NB_RUND_samples_per_second": 16.277,
204
+ "eval_BB_NB_RUND_steps_per_second": 0.511,
205
+ "eval_BB_NB_RUND_wer": 0.2733345853566925,
206
+ "step": 8445
207
+ },
208
+ {
209
+ "epoch": 5.0,
210
+ "eval_rundkast_loss": 0.26304560899734497,
211
+ "eval_rundkast_runtime": 32.653,
212
+ "eval_rundkast_samples_per_second": 41.191,
213
+ "eval_rundkast_steps_per_second": 1.317,
214
+ "eval_rundkast_wer": 0.15224307986000638,
215
+ "step": 8445
216
+ },
217
+ {
218
+ "epoch": 5.0,
219
+ "eval_nb_samtale_loss": 0.4362596273422241,
220
+ "eval_nb_samtale_runtime": 37.3619,
221
+ "eval_nb_samtale_samples_per_second": 14.266,
222
+ "eval_nb_samtale_steps_per_second": 0.455,
223
+ "eval_nb_samtale_wer": 0.20719401041666666,
224
+ "step": 8445
225
+ },
226
+ {
227
+ "epoch": 6.0,
228
+ "grad_norm": 3.735290050506592,
229
+ "learning_rate": 8.69361186799879e-05,
230
+ "loss": 0.6167,
231
+ "step": 10134
232
+ },
233
+ {
234
+ "epoch": 6.0,
235
+ "eval_bigbrother_loss": 1.111521601676941,
236
+ "eval_bigbrother_runtime": 41.747,
237
+ "eval_bigbrother_samples_per_second": 32.817,
238
+ "eval_bigbrother_steps_per_second": 1.03,
239
+ "eval_bigbrother_wer": 0.44960928059292676,
240
+ "step": 10134
241
+ },
242
+ {
243
+ "epoch": 6.0,
244
+ "eval_BB_NB_RUND_loss": 0.6480989456176758,
245
+ "eval_BB_NB_RUND_runtime": 129.1077,
246
+ "eval_BB_NB_RUND_samples_per_second": 25.157,
247
+ "eval_BB_NB_RUND_steps_per_second": 0.79,
248
+ "eval_BB_NB_RUND_wer": 0.2680224291041773,
249
+ "step": 10134
250
+ },
251
+ {
252
+ "epoch": 6.0,
253
+ "eval_rundkast_loss": 0.260196715593338,
254
+ "eval_rundkast_runtime": 32.8953,
255
+ "eval_rundkast_samples_per_second": 40.887,
256
+ "eval_rundkast_steps_per_second": 1.307,
257
+ "eval_rundkast_wer": 0.15001590836780146,
258
+ "step": 10134
259
+ },
260
+ {
261
+ "epoch": 6.0,
262
+ "eval_nb_samtale_loss": 0.4358641803264618,
263
+ "eval_nb_samtale_runtime": 37.2416,
264
+ "eval_nb_samtale_samples_per_second": 14.312,
265
+ "eval_nb_samtale_steps_per_second": 0.456,
266
+ "eval_nb_samtale_wer": 0.20475260416666666,
267
+ "step": 10134
268
+ },
269
+ {
270
+ "epoch": 7.0,
271
+ "grad_norm": 3.0601396560668945,
272
+ "learning_rate": 8.438086587950349e-05,
273
+ "loss": 0.5897,
274
+ "step": 11823
275
+ },
276
+ {
277
+ "epoch": 7.0,
278
+ "eval_bigbrother_loss": 1.1370279788970947,
279
+ "eval_bigbrother_runtime": 40.9127,
280
+ "eval_bigbrother_samples_per_second": 33.486,
281
+ "eval_bigbrother_steps_per_second": 1.051,
282
+ "eval_bigbrother_wer": 0.4386530250543785,
283
+ "step": 11823
284
+ },
285
+ {
286
+ "epoch": 7.0,
287
+ "eval_BB_NB_RUND_loss": 0.6591894626617432,
288
+ "eval_BB_NB_RUND_runtime": 131.1395,
289
+ "eval_BB_NB_RUND_samples_per_second": 24.768,
290
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
291
+ "eval_BB_NB_RUND_wer": 0.26238832398787326,
292
+ "step": 11823
293
+ },
294
+ {
295
+ "epoch": 7.0,
296
+ "eval_rundkast_loss": 0.268062025308609,
297
+ "eval_rundkast_runtime": 33.0258,
298
+ "eval_rundkast_samples_per_second": 40.726,
299
+ "eval_rundkast_steps_per_second": 1.302,
300
+ "eval_rundkast_wer": 0.14762965319758192,
301
+ "step": 11823
302
+ },
303
+ {
304
+ "epoch": 7.0,
305
+ "eval_nb_samtale_loss": 0.4182298183441162,
306
+ "eval_nb_samtale_runtime": 37.1616,
307
+ "eval_nb_samtale_samples_per_second": 14.343,
308
+ "eval_nb_samtale_steps_per_second": 0.457,
309
+ "eval_nb_samtale_wer": 0.20149739583333334,
310
+ "step": 11823
311
+ },
312
+ {
313
+ "epoch": 8.0,
314
+ "grad_norm": 5.5860819816589355,
315
+ "learning_rate": 8.182561307901908e-05,
316
+ "loss": 0.5683,
317
+ "step": 13512
318
+ },
319
+ {
320
+ "epoch": 8.0,
321
+ "eval_bigbrother_loss": 1.1404756307601929,
322
+ "eval_bigbrother_runtime": 40.7715,
323
+ "eval_bigbrother_samples_per_second": 33.602,
324
+ "eval_bigbrother_steps_per_second": 1.055,
325
+ "eval_bigbrother_wer": 0.429388544268106,
326
+ "step": 13512
327
+ },
328
+ {
329
+ "epoch": 8.0,
330
+ "eval_BB_NB_RUND_loss": 0.6637564897537231,
331
+ "eval_BB_NB_RUND_runtime": 129.0461,
332
+ "eval_BB_NB_RUND_samples_per_second": 25.169,
333
+ "eval_BB_NB_RUND_steps_per_second": 0.79,
334
+ "eval_BB_NB_RUND_wer": 0.255466423416414,
335
+ "step": 13512
336
+ },
337
+ {
338
+ "epoch": 8.0,
339
+ "eval_rundkast_loss": 0.26927700638771057,
340
+ "eval_rundkast_runtime": 32.7194,
341
+ "eval_rundkast_samples_per_second": 41.107,
342
+ "eval_rundkast_steps_per_second": 1.314,
343
+ "eval_rundkast_wer": 0.14230034998409163,
344
+ "step": 13512
345
+ },
346
+ {
347
+ "epoch": 8.0,
348
+ "eval_nb_samtale_loss": 0.43339914083480835,
349
+ "eval_nb_samtale_runtime": 37.1014,
350
+ "eval_nb_samtale_samples_per_second": 14.366,
351
+ "eval_nb_samtale_steps_per_second": 0.458,
352
+ "eval_nb_samtale_wer": 0.19539388020833334,
353
+ "step": 13512
354
+ },
355
+ {
356
+ "epoch": 9.0,
357
+ "grad_norm": 6.843884468078613,
358
+ "learning_rate": 7.927036027853467e-05,
359
+ "loss": 0.5532,
360
+ "step": 15201
361
+ },
362
+ {
363
+ "epoch": 9.0,
364
+ "eval_bigbrother_loss": 1.1039360761642456,
365
+ "eval_bigbrother_runtime": 41.1161,
366
+ "eval_bigbrother_samples_per_second": 33.32,
367
+ "eval_bigbrother_steps_per_second": 1.046,
368
+ "eval_bigbrother_wer": 0.42600499476355436,
369
+ "step": 15201
370
+ },
371
+ {
372
+ "epoch": 9.0,
373
+ "eval_BB_NB_RUND_loss": 0.6467078924179077,
374
+ "eval_BB_NB_RUND_runtime": 131.0223,
375
+ "eval_BB_NB_RUND_samples_per_second": 24.79,
376
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
377
+ "eval_BB_NB_RUND_wer": 0.2532664395138572,
378
+ "step": 15201
379
+ },
380
+ {
381
+ "epoch": 9.0,
382
+ "eval_rundkast_loss": 0.27150803804397583,
383
+ "eval_rundkast_runtime": 32.7213,
384
+ "eval_rundkast_samples_per_second": 41.105,
385
+ "eval_rundkast_steps_per_second": 1.314,
386
+ "eval_rundkast_wer": 0.14317531021317212,
387
+ "step": 15201
388
+ },
389
+ {
390
+ "epoch": 9.0,
391
+ "eval_nb_samtale_loss": 0.4183700680732727,
392
+ "eval_nb_samtale_runtime": 37.0058,
393
+ "eval_nb_samtale_samples_per_second": 14.403,
394
+ "eval_nb_samtale_steps_per_second": 0.459,
395
+ "eval_nb_samtale_wer": 0.19173177083333334,
396
+ "step": 15201
397
+ },
398
+ {
399
+ "epoch": 10.0,
400
+ "grad_norm": 4.194594860076904,
401
+ "learning_rate": 7.671359370269452e-05,
402
+ "loss": 0.5346,
403
+ "step": 16890
404
+ },
405
+ {
406
+ "epoch": 10.0,
407
+ "eval_bigbrother_loss": 1.1744848489761353,
408
+ "eval_bigbrother_runtime": 41.0112,
409
+ "eval_bigbrother_samples_per_second": 33.405,
410
+ "eval_bigbrother_steps_per_second": 1.048,
411
+ "eval_bigbrother_wer": 0.4209296705067268,
412
+ "step": 16890
413
+ },
414
+ {
415
+ "epoch": 10.0,
416
+ "eval_BB_NB_RUND_loss": 0.6952946782112122,
417
+ "eval_BB_NB_RUND_runtime": 128.204,
418
+ "eval_BB_NB_RUND_samples_per_second": 25.335,
419
+ "eval_BB_NB_RUND_steps_per_second": 0.796,
420
+ "eval_BB_NB_RUND_wer": 0.2505298741716524,
421
+ "step": 16890
422
+ },
423
+ {
424
+ "epoch": 10.0,
425
+ "eval_rundkast_loss": 0.2990908622741699,
426
+ "eval_rundkast_runtime": 32.6803,
427
+ "eval_rundkast_samples_per_second": 41.156,
428
+ "eval_rundkast_steps_per_second": 1.316,
429
+ "eval_rundkast_wer": 0.1403118040089087,
430
+ "step": 16890
431
+ },
432
+ {
433
+ "epoch": 10.0,
434
+ "eval_nb_samtale_loss": 0.46227914094924927,
435
+ "eval_nb_samtale_runtime": 37.038,
436
+ "eval_nb_samtale_samples_per_second": 14.391,
437
+ "eval_nb_samtale_steps_per_second": 0.459,
438
+ "eval_nb_samtale_wer": 0.19010416666666666,
439
+ "step": 16890
440
+ },
441
+ {
442
+ "epoch": 11.0,
443
+ "grad_norm": 4.1977338790893555,
444
+ "learning_rate": 7.415682712685438e-05,
445
+ "loss": 0.5173,
446
+ "step": 18579
447
+ },
448
+ {
449
+ "epoch": 11.0,
450
+ "eval_bigbrother_loss": 1.2221542596817017,
451
+ "eval_bigbrother_runtime": 40.9814,
452
+ "eval_bigbrother_samples_per_second": 33.43,
453
+ "eval_bigbrother_steps_per_second": 1.049,
454
+ "eval_bigbrother_wer": 0.4190767743494723,
455
+ "step": 18579
456
+ },
457
+ {
458
+ "epoch": 11.0,
459
+ "eval_BB_NB_RUND_loss": 0.7245953679084778,
460
+ "eval_BB_NB_RUND_runtime": 131.2027,
461
+ "eval_BB_NB_RUND_samples_per_second": 24.756,
462
+ "eval_BB_NB_RUND_steps_per_second": 0.777,
463
+ "eval_BB_NB_RUND_wer": 0.2488128135647788,
464
+ "step": 18579
465
+ },
466
+ {
467
+ "epoch": 11.0,
468
+ "eval_rundkast_loss": 0.3232197165489197,
469
+ "eval_rundkast_runtime": 32.6557,
470
+ "eval_rundkast_samples_per_second": 41.187,
471
+ "eval_rundkast_steps_per_second": 1.317,
472
+ "eval_rundkast_wer": 0.14237989182309896,
473
+ "step": 18579
474
+ },
475
+ {
476
+ "epoch": 11.0,
477
+ "eval_nb_samtale_loss": 0.4594550132751465,
478
+ "eval_nb_samtale_runtime": 37.0192,
479
+ "eval_nb_samtale_samples_per_second": 14.398,
480
+ "eval_nb_samtale_steps_per_second": 0.459,
481
+ "eval_nb_samtale_wer": 0.185302734375,
482
+ "step": 18579
483
+ },
484
+ {
485
+ "epoch": 12.0,
486
+ "grad_norm": 3.211408853530884,
487
+ "learning_rate": 7.160157432636997e-05,
488
+ "loss": 0.5034,
489
+ "step": 20268
490
+ },
491
+ {
492
+ "epoch": 12.0,
493
+ "eval_bigbrother_loss": 1.1385760307312012,
494
+ "eval_bigbrother_runtime": 40.816,
495
+ "eval_bigbrother_samples_per_second": 33.565,
496
+ "eval_bigbrother_steps_per_second": 1.054,
497
+ "eval_bigbrother_wer": 0.40981229356319987,
498
+ "step": 20268
499
+ },
500
+ {
501
+ "epoch": 12.0,
502
+ "eval_BB_NB_RUND_loss": 0.6762681603431702,
503
+ "eval_BB_NB_RUND_runtime": 128.7262,
504
+ "eval_BB_NB_RUND_samples_per_second": 25.232,
505
+ "eval_BB_NB_RUND_steps_per_second": 0.792,
506
+ "eval_BB_NB_RUND_wer": 0.24229334907305555,
507
+ "step": 20268
508
+ },
509
+ {
510
+ "epoch": 12.0,
511
+ "eval_rundkast_loss": 0.2944062352180481,
512
+ "eval_rundkast_runtime": 32.5788,
513
+ "eval_rundkast_samples_per_second": 41.284,
514
+ "eval_rundkast_steps_per_second": 1.32,
515
+ "eval_rundkast_wer": 0.1358574610244989,
516
+ "step": 20268
517
+ },
518
+ {
519
+ "epoch": 12.0,
520
+ "eval_nb_samtale_loss": 0.451029509305954,
521
+ "eval_nb_samtale_runtime": 36.6243,
522
+ "eval_nb_samtale_samples_per_second": 14.553,
523
+ "eval_nb_samtale_steps_per_second": 0.464,
524
+ "eval_nb_samtale_wer": 0.18172200520833334,
525
+ "step": 20268
526
+ },
527
+ {
528
+ "epoch": 13.0,
529
+ "grad_norm": 4.915965557098389,
530
+ "learning_rate": 6.904783530124131e-05,
531
+ "loss": 0.4922,
532
+ "step": 21957
533
+ },
534
+ {
535
+ "epoch": 13.0,
536
+ "eval_bigbrother_loss": 1.070022702217102,
537
+ "eval_bigbrother_runtime": 41.6248,
538
+ "eval_bigbrother_samples_per_second": 32.913,
539
+ "eval_bigbrother_steps_per_second": 1.033,
540
+ "eval_bigbrother_wer": 0.408845565133328,
541
+ "step": 21957
542
+ },
543
+ {
544
+ "epoch": 13.0,
545
+ "eval_BB_NB_RUND_loss": 0.641231894493103,
546
+ "eval_BB_NB_RUND_runtime": 130.0831,
547
+ "eval_BB_NB_RUND_samples_per_second": 24.969,
548
+ "eval_BB_NB_RUND_steps_per_second": 0.784,
549
+ "eval_BB_NB_RUND_wer": 0.24320553752045718,
550
+ "step": 21957
551
+ },
552
+ {
553
+ "epoch": 13.0,
554
+ "eval_rundkast_loss": 0.28888097405433655,
555
+ "eval_rundkast_runtime": 32.35,
556
+ "eval_rundkast_samples_per_second": 41.577,
557
+ "eval_rundkast_steps_per_second": 1.329,
558
+ "eval_rundkast_wer": 0.14023226216990137,
559
+ "step": 21957
560
+ },
561
+ {
562
+ "epoch": 13.0,
563
+ "eval_nb_samtale_loss": 0.4279041886329651,
564
+ "eval_nb_samtale_runtime": 36.6119,
565
+ "eval_nb_samtale_samples_per_second": 14.558,
566
+ "eval_nb_samtale_steps_per_second": 0.464,
567
+ "eval_nb_samtale_wer": 0.18180338541666666,
568
+ "step": 21957
569
+ },
570
+ {
571
+ "epoch": 14.0,
572
+ "grad_norm": 7.668597221374512,
573
+ "learning_rate": 6.649106872540115e-05,
574
+ "loss": 0.4787,
575
+ "step": 23646
576
+ },
577
+ {
578
+ "epoch": 14.0,
579
+ "eval_bigbrother_loss": 1.123586893081665,
580
+ "eval_bigbrother_runtime": 40.9041,
581
+ "eval_bigbrother_samples_per_second": 33.493,
582
+ "eval_bigbrother_steps_per_second": 1.051,
583
+ "eval_bigbrother_wer": 0.4079593974059454,
584
+ "step": 23646
585
+ },
586
+ {
587
+ "epoch": 14.0,
588
+ "eval_BB_NB_RUND_loss": 0.6701177358627319,
589
+ "eval_BB_NB_RUND_runtime": 128.6687,
590
+ "eval_BB_NB_RUND_samples_per_second": 25.243,
591
+ "eval_BB_NB_RUND_steps_per_second": 0.793,
592
+ "eval_BB_NB_RUND_wer": 0.24256163979287956,
593
+ "step": 23646
594
+ },
595
+ {
596
+ "epoch": 14.0,
597
+ "eval_rundkast_loss": 0.2999539077281952,
598
+ "eval_rundkast_runtime": 33.5296,
599
+ "eval_rundkast_samples_per_second": 40.114,
600
+ "eval_rundkast_steps_per_second": 1.282,
601
+ "eval_rundkast_wer": 0.13697104677060135,
602
+ "step": 23646
603
+ },
604
+ {
605
+ "epoch": 14.0,
606
+ "eval_nb_samtale_loss": 0.43806180357933044,
607
+ "eval_nb_samtale_runtime": 36.6824,
608
+ "eval_nb_samtale_samples_per_second": 14.53,
609
+ "eval_nb_samtale_steps_per_second": 0.463,
610
+ "eval_nb_samtale_wer": 0.18375651041666666,
611
+ "step": 23646
612
+ },
613
+ {
614
+ "epoch": 15.0,
615
+ "grad_norm": 8.808441162109375,
616
+ "learning_rate": 6.393430214956101e-05,
617
+ "loss": 0.4663,
618
+ "step": 25335
619
+ },
620
+ {
621
+ "epoch": 15.0,
622
+ "eval_bigbrother_loss": 1.160325050354004,
623
+ "eval_bigbrother_runtime": 41.0537,
624
+ "eval_bigbrother_samples_per_second": 33.371,
625
+ "eval_bigbrother_steps_per_second": 1.047,
626
+ "eval_bigbrother_wer": 0.3999033271570128,
627
+ "step": 25335
628
+ },
629
+ {
630
+ "epoch": 15.0,
631
+ "eval_BB_NB_RUND_loss": 0.6799572706222534,
632
+ "eval_BB_NB_RUND_runtime": 185.9813,
633
+ "eval_BB_NB_RUND_samples_per_second": 17.464,
634
+ "eval_BB_NB_RUND_steps_per_second": 0.548,
635
+ "eval_BB_NB_RUND_wer": 0.23767874869208275,
636
+ "step": 25335
637
+ },
638
+ {
639
+ "epoch": 15.0,
640
+ "eval_rundkast_loss": 0.2853633463382721,
641
+ "eval_rundkast_runtime": 32.9208,
642
+ "eval_rundkast_samples_per_second": 40.856,
643
+ "eval_rundkast_steps_per_second": 1.306,
644
+ "eval_rundkast_wer": 0.1345847916003818,
645
+ "step": 25335
646
+ },
647
+ {
648
+ "epoch": 15.0,
649
+ "eval_nb_samtale_loss": 0.4409109652042389,
650
+ "eval_nb_samtale_runtime": 36.4232,
651
+ "eval_nb_samtale_samples_per_second": 14.634,
652
+ "eval_nb_samtale_steps_per_second": 0.467,
653
+ "eval_nb_samtale_wer": 0.178466796875,
654
+ "step": 25335
655
+ },
656
+ {
657
+ "epoch": 16.0,
658
+ "grad_norm": 4.101474761962891,
659
+ "learning_rate": 6.137753557372086e-05,
660
+ "loss": 0.4579,
661
+ "step": 27024
662
+ },
663
+ {
664
+ "epoch": 16.0,
665
+ "eval_bigbrother_loss": 1.155598759651184,
666
+ "eval_bigbrother_runtime": 42.3097,
667
+ "eval_bigbrother_samples_per_second": 32.38,
668
+ "eval_bigbrother_steps_per_second": 1.016,
669
+ "eval_bigbrother_wer": 0.3999033271570128,
670
+ "step": 27024
671
+ },
672
+ {
673
+ "epoch": 16.0,
674
+ "eval_BB_NB_RUND_loss": 0.6771286129951477,
675
+ "eval_BB_NB_RUND_runtime": 128.4569,
676
+ "eval_BB_NB_RUND_samples_per_second": 25.285,
677
+ "eval_BB_NB_RUND_steps_per_second": 0.794,
678
+ "eval_BB_NB_RUND_wer": 0.23773240683604754,
679
+ "step": 27024
680
+ },
681
+ {
682
+ "epoch": 16.0,
683
+ "eval_rundkast_loss": 0.27949705719947815,
684
+ "eval_rundkast_runtime": 32.5865,
685
+ "eval_rundkast_samples_per_second": 41.275,
686
+ "eval_rundkast_steps_per_second": 1.32,
687
+ "eval_rundkast_wer": 0.13450524976137448,
688
+ "step": 27024
689
+ },
690
+ {
691
+ "epoch": 16.0,
692
+ "eval_nb_samtale_loss": 0.4515434503555298,
693
+ "eval_nb_samtale_runtime": 37.0041,
694
+ "eval_nb_samtale_samples_per_second": 14.404,
695
+ "eval_nb_samtale_steps_per_second": 0.459,
696
+ "eval_nb_samtale_wer": 0.17936197916666666,
697
+ "step": 27024
698
+ },
699
+ {
700
+ "epoch": 17.0,
701
+ "grad_norm": 9.384012222290039,
702
+ "learning_rate": 5.882379654859219e-05,
703
+ "loss": 0.4469,
704
+ "step": 28713
705
+ },
706
+ {
707
+ "epoch": 17.0,
708
+ "eval_bigbrother_loss": 1.1895906925201416,
709
+ "eval_bigbrother_runtime": 40.9285,
710
+ "eval_bigbrother_samples_per_second": 33.473,
711
+ "eval_bigbrother_steps_per_second": 1.051,
712
+ "eval_bigbrother_wer": 0.40167566261177795,
713
+ "step": 28713
714
+ },
715
+ {
716
+ "epoch": 17.0,
717
+ "eval_BB_NB_RUND_loss": 0.6978138089179993,
718
+ "eval_BB_NB_RUND_runtime": 169.0105,
719
+ "eval_BB_NB_RUND_samples_per_second": 19.218,
720
+ "eval_BB_NB_RUND_steps_per_second": 0.604,
721
+ "eval_BB_NB_RUND_wer": 0.23837630456362516,
722
+ "step": 28713
723
+ },
724
+ {
725
+ "epoch": 17.0,
726
+ "eval_rundkast_loss": 0.29528018832206726,
727
+ "eval_rundkast_runtime": 32.6968,
728
+ "eval_rundkast_samples_per_second": 41.136,
729
+ "eval_rundkast_steps_per_second": 1.315,
730
+ "eval_rundkast_wer": 0.1377664651606745,
731
+ "step": 28713
732
+ },
733
+ {
734
+ "epoch": 17.0,
735
+ "eval_nb_samtale_loss": 0.4508727788925171,
736
+ "eval_nb_samtale_runtime": 36.4289,
737
+ "eval_nb_samtale_samples_per_second": 14.631,
738
+ "eval_nb_samtale_steps_per_second": 0.467,
739
+ "eval_nb_samtale_wer": 0.17667643229166666,
740
+ "step": 28713
741
+ },
742
+ {
743
+ "epoch": 18.0,
744
+ "grad_norm": 3.587054491043091,
745
+ "learning_rate": 5.626702997275205e-05,
746
+ "loss": 0.4399,
747
+ "step": 30402
748
+ },
749
+ {
750
+ "epoch": 18.0,
751
+ "eval_bigbrother_loss": 1.1661101579666138,
752
+ "eval_bigbrother_runtime": 41.0139,
753
+ "eval_bigbrother_samples_per_second": 33.403,
754
+ "eval_bigbrother_steps_per_second": 1.048,
755
+ "eval_bigbrother_wer": 0.3982921131072263,
756
+ "step": 30402
757
+ },
758
+ {
759
+ "epoch": 18.0,
760
+ "eval_BB_NB_RUND_loss": 0.6934623718261719,
761
+ "eval_BB_NB_RUND_runtime": 127.79,
762
+ "eval_BB_NB_RUND_samples_per_second": 25.417,
763
+ "eval_BB_NB_RUND_steps_per_second": 0.798,
764
+ "eval_BB_NB_RUND_wer": 0.23443243098221234,
765
+ "step": 30402
766
+ },
767
+ {
768
+ "epoch": 18.0,
769
+ "eval_rundkast_loss": 0.3097790777683258,
770
+ "eval_rundkast_runtime": 32.5419,
771
+ "eval_rundkast_samples_per_second": 41.331,
772
+ "eval_rundkast_steps_per_second": 1.321,
773
+ "eval_rundkast_wer": 0.13307349665924276,
774
+ "step": 30402
775
+ },
776
+ {
777
+ "epoch": 18.0,
778
+ "eval_nb_samtale_loss": 0.4466961622238159,
779
+ "eval_nb_samtale_runtime": 36.4501,
780
+ "eval_nb_samtale_samples_per_second": 14.623,
781
+ "eval_nb_samtale_steps_per_second": 0.466,
782
+ "eval_nb_samtale_wer": 0.17268880208333334,
783
+ "step": 30402
784
+ },
785
+ {
786
+ "epoch": 19.0,
787
+ "grad_norm": 4.3045973777771,
788
+ "learning_rate": 5.371177717226764e-05,
789
+ "loss": 0.4313,
790
+ "step": 32091
791
+ },
792
+ {
793
+ "epoch": 19.0,
794
+ "eval_bigbrother_loss": 1.1764683723449707,
795
+ "eval_bigbrother_runtime": 41.1081,
796
+ "eval_bigbrother_samples_per_second": 33.327,
797
+ "eval_bigbrother_steps_per_second": 1.046,
798
+ "eval_bigbrother_wer": 0.3935390316603561,
799
+ "step": 32091
800
+ },
801
+ {
802
+ "epoch": 19.0,
803
+ "eval_BB_NB_RUND_loss": 0.6927400231361389,
804
+ "eval_BB_NB_RUND_runtime": 131.0803,
805
+ "eval_BB_NB_RUND_samples_per_second": 24.779,
806
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
807
+ "eval_BB_NB_RUND_wer": 0.23349341346282831,
808
+ "step": 32091
809
+ },
810
+ {
811
+ "epoch": 19.0,
812
+ "eval_rundkast_loss": 0.296793133020401,
813
+ "eval_rundkast_runtime": 32.4376,
814
+ "eval_rundkast_samples_per_second": 41.464,
815
+ "eval_rundkast_steps_per_second": 1.326,
816
+ "eval_rundkast_wer": 0.13355074769328668,
817
+ "step": 32091
818
+ },
819
+ {
820
+ "epoch": 19.0,
821
+ "eval_nb_samtale_loss": 0.44873738288879395,
822
+ "eval_nb_samtale_runtime": 36.5729,
823
+ "eval_nb_samtale_samples_per_second": 14.574,
824
+ "eval_nb_samtale_steps_per_second": 0.465,
825
+ "eval_nb_samtale_wer": 0.17415364583333334,
826
+ "step": 32091
827
+ },
828
+ {
829
+ "epoch": 20.0,
830
+ "grad_norm": 2.650940418243408,
831
+ "learning_rate": 5.115501059642749e-05,
832
+ "loss": 0.4229,
833
+ "step": 33780
834
+ },
835
+ {
836
+ "epoch": 20.0,
837
+ "eval_bigbrother_loss": 1.1612807512283325,
838
+ "eval_bigbrother_runtime": 41.2062,
839
+ "eval_bigbrother_samples_per_second": 33.247,
840
+ "eval_bigbrother_steps_per_second": 1.044,
841
+ "eval_bigbrother_wer": 0.39402239587529203,
842
+ "step": 33780
843
+ },
844
+ {
845
+ "epoch": 20.0,
846
+ "eval_BB_NB_RUND_loss": 0.6827826499938965,
847
+ "eval_BB_NB_RUND_runtime": 326.107,
848
+ "eval_BB_NB_RUND_samples_per_second": 9.96,
849
+ "eval_BB_NB_RUND_steps_per_second": 0.313,
850
+ "eval_BB_NB_RUND_wer": 0.23164220749604272,
851
+ "step": 33780
852
+ },
853
+ {
854
+ "epoch": 20.0,
855
+ "eval_rundkast_loss": 0.29459282755851746,
856
+ "eval_rundkast_runtime": 36.3812,
857
+ "eval_rundkast_samples_per_second": 36.97,
858
+ "eval_rundkast_steps_per_second": 1.182,
859
+ "eval_rundkast_wer": 0.12957365574292076,
860
+ "step": 33780
861
+ },
862
+ {
863
+ "epoch": 20.0,
864
+ "eval_nb_samtale_loss": 0.4326167404651642,
865
+ "eval_nb_samtale_runtime": 39.3019,
866
+ "eval_nb_samtale_samples_per_second": 13.562,
867
+ "eval_nb_samtale_steps_per_second": 0.433,
868
+ "eval_nb_samtale_wer": 0.17252604166666666,
869
+ "step": 33780
870
+ },
871
+ {
872
+ "epoch": 21.0,
873
+ "grad_norm": 6.971451282501221,
874
+ "learning_rate": 4.859975779594308e-05,
875
+ "loss": 0.4173,
876
+ "step": 35469
877
+ },
878
+ {
879
+ "epoch": 21.0,
880
+ "eval_bigbrother_loss": 1.18746018409729,
881
+ "eval_bigbrother_runtime": 42.6131,
882
+ "eval_bigbrother_samples_per_second": 32.15,
883
+ "eval_bigbrother_steps_per_second": 1.009,
884
+ "eval_bigbrother_wer": 0.3920889390155482,
885
+ "step": 35469
886
+ },
887
+ {
888
+ "epoch": 21.0,
889
+ "eval_BB_NB_RUND_loss": 0.6960651874542236,
890
+ "eval_BB_NB_RUND_runtime": 153.2803,
891
+ "eval_BB_NB_RUND_samples_per_second": 21.19,
892
+ "eval_BB_NB_RUND_steps_per_second": 0.665,
893
+ "eval_BB_NB_RUND_wer": 0.23126660048828912,
894
+ "step": 35469
895
+ },
896
+ {
897
+ "epoch": 21.0,
898
+ "eval_rundkast_loss": 0.2939074635505676,
899
+ "eval_rundkast_runtime": 161.3899,
900
+ "eval_rundkast_samples_per_second": 8.334,
901
+ "eval_rundkast_steps_per_second": 0.266,
902
+ "eval_rundkast_wer": 0.13084632516703787,
903
+ "step": 35469
904
+ },
905
+ {
906
+ "epoch": 21.0,
907
+ "eval_nb_samtale_loss": 0.44757071137428284,
908
+ "eval_nb_samtale_runtime": 49.4947,
909
+ "eval_nb_samtale_samples_per_second": 10.769,
910
+ "eval_nb_samtale_steps_per_second": 0.343,
911
+ "eval_nb_samtale_wer": 0.17244466145833334,
912
+ "step": 35469
913
+ },
914
+ {
915
+ "epoch": 22.0,
916
+ "grad_norm": 7.361974716186523,
917
+ "learning_rate": 4.6042991220102936e-05,
918
+ "loss": 0.4101,
919
+ "step": 37158
920
+ },
921
+ {
922
+ "epoch": 22.0,
923
+ "eval_bigbrother_loss": 1.2487200498580933,
924
+ "eval_bigbrother_runtime": 44.9933,
925
+ "eval_bigbrother_samples_per_second": 30.449,
926
+ "eval_bigbrother_steps_per_second": 0.956,
927
+ "eval_bigbrother_wer": 0.39152501409812296,
928
+ "step": 37158
929
+ },
930
+ {
931
+ "epoch": 22.0,
932
+ "eval_BB_NB_RUND_loss": 0.7247402667999268,
933
+ "eval_BB_NB_RUND_runtime": 182.0939,
934
+ "eval_BB_NB_RUND_samples_per_second": 17.837,
935
+ "eval_BB_NB_RUND_steps_per_second": 0.56,
936
+ "eval_BB_NB_RUND_wer": 0.2308105062645883,
937
+ "step": 37158
938
+ },
939
+ {
940
+ "epoch": 22.0,
941
+ "eval_rundkast_loss": 0.2898001968860626,
942
+ "eval_rundkast_runtime": 38.6925,
943
+ "eval_rundkast_samples_per_second": 34.761,
944
+ "eval_rundkast_steps_per_second": 1.111,
945
+ "eval_rundkast_wer": 0.13084632516703787,
946
+ "step": 37158
947
+ },
948
+ {
949
+ "epoch": 22.0,
950
+ "eval_nb_samtale_loss": 0.4750688672065735,
951
+ "eval_nb_samtale_runtime": 42.0801,
952
+ "eval_nb_samtale_samples_per_second": 12.666,
953
+ "eval_nb_samtale_steps_per_second": 0.404,
954
+ "eval_nb_samtale_wer": 0.1708984375,
955
+ "step": 37158
956
+ },
957
+ {
958
+ "epoch": 23.0,
959
+ "grad_norm": 3.2216553688049316,
960
+ "learning_rate": 4.348773841961853e-05,
961
+ "loss": 0.3985,
962
+ "step": 38847
963
+ },
964
+ {
965
+ "epoch": 23.0,
966
+ "eval_bigbrother_loss": 1.1696597337722778,
967
+ "eval_bigbrother_runtime": 41.468,
968
+ "eval_bigbrother_samples_per_second": 33.038,
969
+ "eval_bigbrother_steps_per_second": 1.037,
970
+ "eval_bigbrother_wer": 0.3846773543865302,
971
+ "step": 38847
972
+ },
973
+ {
974
+ "epoch": 23.0,
975
+ "eval_BB_NB_RUND_loss": 0.6836020350456238,
976
+ "eval_BB_NB_RUND_runtime": 175.228,
977
+ "eval_BB_NB_RUND_samples_per_second": 18.536,
978
+ "eval_BB_NB_RUND_steps_per_second": 0.582,
979
+ "eval_BB_NB_RUND_wer": 0.2291739328736619,
980
+ "step": 38847
981
+ },
982
+ {
983
+ "epoch": 23.0,
984
+ "eval_rundkast_loss": 0.2838425934314728,
985
+ "eval_rundkast_runtime": 32.5363,
986
+ "eval_rundkast_samples_per_second": 41.338,
987
+ "eval_rundkast_steps_per_second": 1.322,
988
+ "eval_rundkast_wer": 0.1319599109131403,
989
+ "step": 38847
990
+ },
991
+ {
992
+ "epoch": 23.0,
993
+ "eval_nb_samtale_loss": 0.442909300327301,
994
+ "eval_nb_samtale_runtime": 36.3978,
995
+ "eval_nb_samtale_samples_per_second": 14.644,
996
+ "eval_nb_samtale_steps_per_second": 0.467,
997
+ "eval_nb_samtale_wer": 0.17203776041666666,
998
+ "step": 38847
999
+ },
1000
+ {
1001
+ "epoch": 24.0,
1002
+ "grad_norm": 8.511246681213379,
1003
+ "learning_rate": 4.0933999394489856e-05,
1004
+ "loss": 0.3943,
1005
+ "step": 40536
1006
+ },
1007
+ {
1008
+ "epoch": 24.0,
1009
+ "eval_bigbrother_loss": 1.1965091228485107,
1010
+ "eval_bigbrother_runtime": 41.19,
1011
+ "eval_bigbrother_samples_per_second": 33.26,
1012
+ "eval_bigbrother_steps_per_second": 1.044,
1013
+ "eval_bigbrother_wer": 0.38363006525416904,
1014
+ "step": 40536
1015
+ },
1016
+ {
1017
+ "epoch": 24.0,
1018
+ "eval_BB_NB_RUND_loss": 0.7099454402923584,
1019
+ "eval_BB_NB_RUND_runtime": 129.9149,
1020
+ "eval_BB_NB_RUND_samples_per_second": 25.001,
1021
+ "eval_BB_NB_RUND_steps_per_second": 0.785,
1022
+ "eval_BB_NB_RUND_wer": 0.2286910095779787,
1023
+ "step": 40536
1024
+ },
1025
+ {
1026
+ "epoch": 24.0,
1027
+ "eval_rundkast_loss": 0.31351616978645325,
1028
+ "eval_rundkast_runtime": 32.5656,
1029
+ "eval_rundkast_samples_per_second": 41.301,
1030
+ "eval_rundkast_steps_per_second": 1.32,
1031
+ "eval_rundkast_wer": 0.13108495068405981,
1032
+ "step": 40536
1033
+ },
1034
+ {
1035
+ "epoch": 24.0,
1036
+ "eval_nb_samtale_loss": 0.4599841833114624,
1037
+ "eval_nb_samtale_runtime": 36.637,
1038
+ "eval_nb_samtale_samples_per_second": 14.548,
1039
+ "eval_nb_samtale_steps_per_second": 0.464,
1040
+ "eval_nb_samtale_wer": 0.17154947916666666,
1041
+ "step": 40536
1042
+ },
1043
+ {
1044
+ "epoch": 25.0,
1045
+ "grad_norm": 3.3434505462646484,
1046
+ "learning_rate": 3.837723281864972e-05,
1047
+ "loss": 0.3902,
1048
+ "step": 42225
1049
+ },
1050
+ {
1051
+ "epoch": 25.0,
1052
+ "eval_bigbrother_loss": 1.194956660270691,
1053
+ "eval_bigbrother_runtime": 41.082,
1054
+ "eval_bigbrother_samples_per_second": 33.348,
1055
+ "eval_bigbrother_steps_per_second": 1.047,
1056
+ "eval_bigbrother_wer": 0.38193829050189315,
1057
+ "step": 42225
1058
+ },
1059
+ {
1060
+ "epoch": 25.0,
1061
+ "eval_BB_NB_RUND_loss": 0.7117018103599548,
1062
+ "eval_BB_NB_RUND_runtime": 129.0515,
1063
+ "eval_BB_NB_RUND_samples_per_second": 25.168,
1064
+ "eval_BB_NB_RUND_steps_per_second": 0.79,
1065
+ "eval_BB_NB_RUND_wer": 0.2270812652590347,
1066
+ "step": 42225
1067
+ },
1068
+ {
1069
+ "epoch": 25.0,
1070
+ "eval_rundkast_loss": 0.31047695875167847,
1071
+ "eval_rundkast_runtime": 32.4929,
1072
+ "eval_rundkast_samples_per_second": 41.394,
1073
+ "eval_rundkast_steps_per_second": 1.323,
1074
+ "eval_rundkast_wer": 0.13124403436207446,
1075
+ "step": 42225
1076
+ },
1077
+ {
1078
+ "epoch": 25.0,
1079
+ "eval_nb_samtale_loss": 0.48264163732528687,
1080
+ "eval_nb_samtale_runtime": 36.4332,
1081
+ "eval_nb_samtale_samples_per_second": 14.63,
1082
+ "eval_nb_samtale_steps_per_second": 0.467,
1083
+ "eval_nb_samtale_wer": 0.16878255208333334,
1084
+ "step": 42225
1085
+ },
1086
+ {
1087
+ "epoch": 26.0,
1088
+ "grad_norm": 3.0726335048675537,
1089
+ "learning_rate": 3.582046624280957e-05,
1090
+ "loss": 0.3836,
1091
+ "step": 43914
1092
+ },
1093
+ {
1094
+ "epoch": 26.0,
1095
+ "eval_bigbrother_loss": 1.2235493659973145,
1096
+ "eval_bigbrother_runtime": 41.1244,
1097
+ "eval_bigbrother_samples_per_second": 33.314,
1098
+ "eval_bigbrother_steps_per_second": 1.046,
1099
+ "eval_bigbrother_wer": 0.3832272617417224,
1100
+ "step": 43914
1101
+ },
1102
+ {
1103
+ "epoch": 26.0,
1104
+ "eval_BB_NB_RUND_loss": 0.7329136729240417,
1105
+ "eval_BB_NB_RUND_runtime": 153.8243,
1106
+ "eval_BB_NB_RUND_samples_per_second": 21.115,
1107
+ "eval_BB_NB_RUND_steps_per_second": 0.663,
1108
+ "eval_BB_NB_RUND_wer": 0.22842271885815468,
1109
+ "step": 43914
1110
+ },
1111
+ {
1112
+ "epoch": 26.0,
1113
+ "eval_rundkast_loss": 0.3316984474658966,
1114
+ "eval_rundkast_runtime": 32.4356,
1115
+ "eval_rundkast_samples_per_second": 41.467,
1116
+ "eval_rundkast_steps_per_second": 1.326,
1117
+ "eval_rundkast_wer": 0.13434616608335984,
1118
+ "step": 43914
1119
+ },
1120
+ {
1121
+ "epoch": 26.0,
1122
+ "eval_nb_samtale_loss": 0.48570868372917175,
1123
+ "eval_nb_samtale_runtime": 36.6552,
1124
+ "eval_nb_samtale_samples_per_second": 14.541,
1125
+ "eval_nb_samtale_steps_per_second": 0.464,
1126
+ "eval_nb_samtale_wer": 0.16731770833333334,
1127
+ "step": 43914
1128
+ },
1129
+ {
1130
+ "epoch": 27.0,
1131
+ "grad_norm": 15.335138320922852,
1132
+ "learning_rate": 3.3263699666969425e-05,
1133
+ "loss": 0.3786,
1134
+ "step": 45603
1135
+ },
1136
+ {
1137
+ "epoch": 27.0,
1138
+ "eval_bigbrother_loss": 1.205081820487976,
1139
+ "eval_bigbrother_runtime": 40.4664,
1140
+ "eval_bigbrother_samples_per_second": 33.855,
1141
+ "eval_bigbrother_steps_per_second": 1.063,
1142
+ "eval_bigbrother_wer": 0.3794409087247241,
1143
+ "step": 45603
1144
+ },
1145
+ {
1146
+ "epoch": 27.0,
1147
+ "eval_BB_NB_RUND_loss": 0.7199556231498718,
1148
+ "eval_BB_NB_RUND_runtime": 130.4204,
1149
+ "eval_BB_NB_RUND_samples_per_second": 24.904,
1150
+ "eval_BB_NB_RUND_steps_per_second": 0.782,
1151
+ "eval_BB_NB_RUND_wer": 0.22506908486035468,
1152
+ "step": 45603
1153
+ },
1154
+ {
1155
+ "epoch": 27.0,
1156
+ "eval_rundkast_loss": 0.31949692964553833,
1157
+ "eval_rundkast_runtime": 32.7387,
1158
+ "eval_rundkast_samples_per_second": 41.083,
1159
+ "eval_rundkast_steps_per_second": 1.313,
1160
+ "eval_rundkast_wer": 0.12846006999681833,
1161
+ "step": 45603
1162
+ },
1163
+ {
1164
+ "epoch": 27.0,
1165
+ "eval_nb_samtale_loss": 0.48315760493278503,
1166
+ "eval_nb_samtale_runtime": 36.3915,
1167
+ "eval_nb_samtale_samples_per_second": 14.646,
1168
+ "eval_nb_samtale_steps_per_second": 0.467,
1169
+ "eval_nb_samtale_wer": 0.16715494791666666,
1170
+ "step": 45603
1171
+ },
1172
+ {
1173
+ "epoch": 28.0,
1174
+ "grad_norm": 9.487163543701172,
1175
+ "learning_rate": 3.0708446866485016e-05,
1176
+ "loss": 0.3752,
1177
+ "step": 47292
1178
+ },
1179
+ {
1180
+ "epoch": 28.0,
1181
+ "eval_bigbrother_loss": 1.200919508934021,
1182
+ "eval_bigbrother_runtime": 40.9519,
1183
+ "eval_bigbrother_samples_per_second": 33.454,
1184
+ "eval_bigbrother_steps_per_second": 1.05,
1185
+ "eval_bigbrother_wer": 0.380165955047128,
1186
+ "step": 47292
1187
+ },
1188
+ {
1189
+ "epoch": 28.0,
1190
+ "eval_BB_NB_RUND_loss": 0.7172989845275879,
1191
+ "eval_BB_NB_RUND_runtime": 127.4559,
1192
+ "eval_BB_NB_RUND_samples_per_second": 25.483,
1193
+ "eval_BB_NB_RUND_steps_per_second": 0.8,
1194
+ "eval_BB_NB_RUND_wer": 0.2256861535159499,
1195
+ "step": 47292
1196
+ },
1197
+ {
1198
+ "epoch": 28.0,
1199
+ "eval_rundkast_loss": 0.3196479082107544,
1200
+ "eval_rundkast_runtime": 32.5881,
1201
+ "eval_rundkast_samples_per_second": 41.273,
1202
+ "eval_rundkast_steps_per_second": 1.319,
1203
+ "eval_rundkast_wer": 0.13084632516703787,
1204
+ "step": 47292
1205
+ },
1206
+ {
1207
+ "epoch": 28.0,
1208
+ "eval_nb_samtale_loss": 0.4765280485153198,
1209
+ "eval_nb_samtale_runtime": 37.1947,
1210
+ "eval_nb_samtale_samples_per_second": 14.33,
1211
+ "eval_nb_samtale_steps_per_second": 0.457,
1212
+ "eval_nb_samtale_wer": 0.16731770833333334,
1213
+ "step": 47292
1214
+ },
1215
+ {
1216
+ "epoch": 29.0,
1217
+ "grad_norm": 4.333740234375,
1218
+ "learning_rate": 2.8153194066000604e-05,
1219
+ "loss": 0.3718,
1220
+ "step": 48981
1221
+ },
1222
+ {
1223
+ "epoch": 29.0,
1224
+ "eval_bigbrother_loss": 1.2218164205551147,
1225
+ "eval_bigbrother_runtime": 40.6907,
1226
+ "eval_bigbrother_samples_per_second": 33.669,
1227
+ "eval_bigbrother_steps_per_second": 1.057,
1228
+ "eval_bigbrother_wer": 0.37621848062515106,
1229
+ "step": 48981
1230
+ },
1231
+ {
1232
+ "epoch": 29.0,
1233
+ "eval_BB_NB_RUND_loss": 0.7251059412956238,
1234
+ "eval_BB_NB_RUND_runtime": 151.9233,
1235
+ "eval_BB_NB_RUND_samples_per_second": 21.379,
1236
+ "eval_BB_NB_RUND_steps_per_second": 0.671,
1237
+ "eval_BB_NB_RUND_wer": 0.22418372548493548,
1238
+ "step": 48981
1239
+ },
1240
+ {
1241
+ "epoch": 29.0,
1242
+ "eval_rundkast_loss": 0.319437175989151,
1243
+ "eval_rundkast_runtime": 32.7825,
1244
+ "eval_rundkast_samples_per_second": 41.028,
1245
+ "eval_rundkast_steps_per_second": 1.312,
1246
+ "eval_rundkast_wer": 0.13084632516703787,
1247
+ "step": 48981
1248
+ },
1249
+ {
1250
+ "epoch": 29.0,
1251
+ "eval_nb_samtale_loss": 0.4711519181728363,
1252
+ "eval_nb_samtale_runtime": 36.3015,
1253
+ "eval_nb_samtale_samples_per_second": 14.683,
1254
+ "eval_nb_samtale_steps_per_second": 0.468,
1255
+ "eval_nb_samtale_wer": 0.16609700520833334,
1256
+ "step": 48981
1257
+ },
1258
+ {
1259
+ "epoch": 30.0,
1260
+ "grad_norm": 6.403714179992676,
1261
+ "learning_rate": 2.5596427490160462e-05,
1262
+ "loss": 0.3645,
1263
+ "step": 50670
1264
+ },
1265
+ {
1266
+ "epoch": 30.0,
1267
+ "eval_bigbrother_loss": 1.183604121208191,
1268
+ "eval_bigbrother_runtime": 42.3075,
1269
+ "eval_bigbrother_samples_per_second": 32.382,
1270
+ "eval_bigbrother_steps_per_second": 1.016,
1271
+ "eval_bigbrother_wer": 0.37557399500523647,
1272
+ "step": 50670
1273
+ },
1274
+ {
1275
+ "epoch": 30.0,
1276
+ "eval_BB_NB_RUND_loss": 0.7078377604484558,
1277
+ "eval_BB_NB_RUND_runtime": 127.3976,
1278
+ "eval_BB_NB_RUND_samples_per_second": 25.495,
1279
+ "eval_BB_NB_RUND_steps_per_second": 0.801,
1280
+ "eval_BB_NB_RUND_wer": 0.22356665682934027,
1281
+ "step": 50670
1282
+ },
1283
+ {
1284
+ "epoch": 30.0,
1285
+ "eval_rundkast_loss": 0.3230808675289154,
1286
+ "eval_rundkast_runtime": 32.4456,
1287
+ "eval_rundkast_samples_per_second": 41.454,
1288
+ "eval_rundkast_steps_per_second": 1.325,
1289
+ "eval_rundkast_wer": 0.12861915367483295,
1290
+ "step": 50670
1291
+ },
1292
+ {
1293
+ "epoch": 30.0,
1294
+ "eval_nb_samtale_loss": 0.4557996094226837,
1295
+ "eval_nb_samtale_runtime": 36.3068,
1296
+ "eval_nb_samtale_samples_per_second": 14.68,
1297
+ "eval_nb_samtale_steps_per_second": 0.468,
1298
+ "eval_nb_samtale_wer": 0.16642252604166666,
1299
+ "step": 50670
1300
+ },
1301
+ {
1302
+ "epoch": 31.0,
1303
+ "grad_norm": 3.91894268989563,
1304
+ "learning_rate": 2.3041174689676053e-05,
1305
+ "loss": 0.3609,
1306
+ "step": 52359
1307
+ },
1308
+ {
1309
+ "epoch": 31.0,
1310
+ "eval_bigbrother_loss": 1.2197799682617188,
1311
+ "eval_bigbrother_runtime": 41.1407,
1312
+ "eval_bigbrother_samples_per_second": 33.3,
1313
+ "eval_bigbrother_steps_per_second": 1.045,
1314
+ "eval_bigbrother_wer": 0.37565455570772577,
1315
+ "step": 52359
1316
+ },
1317
+ {
1318
+ "epoch": 31.0,
1319
+ "eval_BB_NB_RUND_loss": 0.7260043025016785,
1320
+ "eval_BB_NB_RUND_runtime": 131.0819,
1321
+ "eval_BB_NB_RUND_samples_per_second": 24.778,
1322
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
1323
+ "eval_BB_NB_RUND_wer": 0.22383494754916428,
1324
+ "step": 52359
1325
+ },
1326
+ {
1327
+ "epoch": 31.0,
1328
+ "eval_rundkast_loss": 0.32174140214920044,
1329
+ "eval_rundkast_runtime": 32.4715,
1330
+ "eval_rundkast_samples_per_second": 41.421,
1331
+ "eval_rundkast_steps_per_second": 1.324,
1332
+ "eval_rundkast_wer": 0.12885777919185493,
1333
+ "step": 52359
1334
+ },
1335
+ {
1336
+ "epoch": 31.0,
1337
+ "eval_nb_samtale_loss": 0.47712796926498413,
1338
+ "eval_nb_samtale_runtime": 36.1596,
1339
+ "eval_nb_samtale_samples_per_second": 14.74,
1340
+ "eval_nb_samtale_steps_per_second": 0.47,
1341
+ "eval_nb_samtale_wer": 0.166748046875,
1342
+ "step": 52359
1343
+ },
1344
+ {
1345
+ "epoch": 32.0,
1346
+ "grad_norm": 2.9196996688842773,
1347
+ "learning_rate": 2.0485921889191645e-05,
1348
+ "loss": 0.36,
1349
+ "step": 54048
1350
+ },
1351
+ {
1352
+ "epoch": 32.0,
1353
+ "eval_bigbrother_loss": 1.2731306552886963,
1354
+ "eval_bigbrother_runtime": 40.9963,
1355
+ "eval_bigbrother_samples_per_second": 33.418,
1356
+ "eval_bigbrother_steps_per_second": 1.049,
1357
+ "eval_bigbrother_wer": 0.3735599774430033,
1358
+ "step": 54048
1359
+ },
1360
+ {
1361
+ "epoch": 32.0,
1362
+ "eval_BB_NB_RUND_loss": 0.7525675296783447,
1363
+ "eval_BB_NB_RUND_runtime": 128.3644,
1364
+ "eval_BB_NB_RUND_samples_per_second": 25.303,
1365
+ "eval_BB_NB_RUND_steps_per_second": 0.795,
1366
+ "eval_BB_NB_RUND_wer": 0.22262763930995627,
1367
+ "step": 54048
1368
+ },
1369
+ {
1370
+ "epoch": 32.0,
1371
+ "eval_rundkast_loss": 0.3295101523399353,
1372
+ "eval_rundkast_runtime": 33.7671,
1373
+ "eval_rundkast_samples_per_second": 39.832,
1374
+ "eval_rundkast_steps_per_second": 1.273,
1375
+ "eval_rundkast_wer": 0.12798281896277441,
1376
+ "step": 54048
1377
+ },
1378
+ {
1379
+ "epoch": 32.0,
1380
+ "eval_nb_samtale_loss": 0.48206984996795654,
1381
+ "eval_nb_samtale_runtime": 36.7176,
1382
+ "eval_nb_samtale_samples_per_second": 14.516,
1383
+ "eval_nb_samtale_steps_per_second": 0.463,
1384
+ "eval_nb_samtale_wer": 0.16691080729166666,
1385
+ "step": 54048
1386
+ },
1387
+ {
1388
+ "epoch": 33.0,
1389
+ "grad_norm": 7.844558238983154,
1390
+ "learning_rate": 1.7929155313351502e-05,
1391
+ "loss": 0.3497,
1392
+ "step": 55737
1393
+ },
1394
+ {
1395
+ "epoch": 33.0,
1396
+ "eval_bigbrother_loss": 1.2425702810287476,
1397
+ "eval_bigbrother_runtime": 40.5135,
1398
+ "eval_bigbrother_samples_per_second": 33.816,
1399
+ "eval_bigbrother_steps_per_second": 1.061,
1400
+ "eval_bigbrother_wer": 0.37219044550068475,
1401
+ "step": 55737
1402
+ },
1403
+ {
1404
+ "epoch": 33.0,
1405
+ "eval_BB_NB_RUND_loss": 0.7353043556213379,
1406
+ "eval_BB_NB_RUND_runtime": 130.7216,
1407
+ "eval_BB_NB_RUND_samples_per_second": 24.847,
1408
+ "eval_BB_NB_RUND_steps_per_second": 0.78,
1409
+ "eval_BB_NB_RUND_wer": 0.22085692055911785,
1410
+ "step": 55737
1411
+ },
1412
+ {
1413
+ "epoch": 33.0,
1414
+ "eval_rundkast_loss": 0.32282164692878723,
1415
+ "eval_rundkast_runtime": 32.5615,
1416
+ "eval_rundkast_samples_per_second": 41.306,
1417
+ "eval_rundkast_steps_per_second": 1.321,
1418
+ "eval_rundkast_wer": 0.12623289850461342,
1419
+ "step": 55737
1420
+ },
1421
+ {
1422
+ "epoch": 33.0,
1423
+ "eval_nb_samtale_loss": 0.47214123606681824,
1424
+ "eval_nb_samtale_runtime": 36.5675,
1425
+ "eval_nb_samtale_samples_per_second": 14.576,
1426
+ "eval_nb_samtale_steps_per_second": 0.465,
1427
+ "eval_nb_samtale_wer": 0.16357421875,
1428
+ "step": 55737
1429
+ },
1430
+ {
1431
+ "epoch": 34.0,
1432
+ "grad_norm": 7.324841022491455,
1433
+ "learning_rate": 1.537541628822283e-05,
1434
+ "loss": 0.352,
1435
+ "step": 57426
1436
+ },
1437
+ {
1438
+ "epoch": 34.0,
1439
+ "eval_bigbrother_loss": 1.306195616722107,
1440
+ "eval_bigbrother_runtime": 41.3854,
1441
+ "eval_bigbrother_samples_per_second": 33.103,
1442
+ "eval_bigbrother_steps_per_second": 1.039,
1443
+ "eval_bigbrother_wer": 0.3747683879803432,
1444
+ "step": 57426
1445
+ },
1446
+ {
1447
+ "epoch": 34.0,
1448
+ "eval_BB_NB_RUND_loss": 0.7695896029472351,
1449
+ "eval_BB_NB_RUND_runtime": 128.8264,
1450
+ "eval_BB_NB_RUND_samples_per_second": 25.212,
1451
+ "eval_BB_NB_RUND_steps_per_second": 0.792,
1452
+ "eval_BB_NB_RUND_wer": 0.22206422879832585,
1453
+ "step": 57426
1454
+ },
1455
+ {
1456
+ "epoch": 34.0,
1457
+ "eval_rundkast_loss": 0.33627748489379883,
1458
+ "eval_rundkast_runtime": 35.7,
1459
+ "eval_rundkast_samples_per_second": 37.675,
1460
+ "eval_rundkast_steps_per_second": 1.204,
1461
+ "eval_rundkast_wer": 0.1270283168946866,
1462
+ "step": 57426
1463
+ },
1464
+ {
1465
+ "epoch": 34.0,
1466
+ "eval_nb_samtale_loss": 0.48346221446990967,
1467
+ "eval_nb_samtale_runtime": 37.2815,
1468
+ "eval_nb_samtale_samples_per_second": 14.297,
1469
+ "eval_nb_samtale_steps_per_second": 0.456,
1470
+ "eval_nb_samtale_wer": 0.16487630208333334,
1471
+ "step": 57426
1472
+ },
1473
+ {
1474
+ "epoch": 35.0,
1475
+ "grad_norm": 8.772356986999512,
1476
+ "learning_rate": 1.2818649712382683e-05,
1477
+ "loss": 0.3475,
1478
+ "step": 59115
1479
+ },
1480
+ {
1481
+ "epoch": 35.0,
1482
+ "eval_bigbrother_loss": 1.2660571336746216,
1483
+ "eval_bigbrother_runtime": 41.6526,
1484
+ "eval_bigbrother_samples_per_second": 32.891,
1485
+ "eval_bigbrother_steps_per_second": 1.032,
1486
+ "eval_bigbrother_wer": 0.37662128413759766,
1487
+ "step": 59115
1488
+ },
1489
+ {
1490
+ "epoch": 35.0,
1491
+ "eval_BB_NB_RUND_loss": 0.7468720078468323,
1492
+ "eval_BB_NB_RUND_runtime": 168.5154,
1493
+ "eval_BB_NB_RUND_samples_per_second": 19.274,
1494
+ "eval_BB_NB_RUND_steps_per_second": 0.605,
1495
+ "eval_BB_NB_RUND_wer": 0.22329836610951628,
1496
+ "step": 59115
1497
+ },
1498
+ {
1499
+ "epoch": 35.0,
1500
+ "eval_rundkast_loss": 0.3307986259460449,
1501
+ "eval_rundkast_runtime": 32.7759,
1502
+ "eval_rundkast_samples_per_second": 41.036,
1503
+ "eval_rundkast_steps_per_second": 1.312,
1504
+ "eval_rundkast_wer": 0.12861915367483295,
1505
+ "step": 59115
1506
+ },
1507
+ {
1508
+ "epoch": 35.0,
1509
+ "eval_nb_samtale_loss": 0.4614698588848114,
1510
+ "eval_nb_samtale_runtime": 36.7886,
1511
+ "eval_nb_samtale_samples_per_second": 14.488,
1512
+ "eval_nb_samtale_steps_per_second": 0.462,
1513
+ "eval_nb_samtale_wer": 0.1650390625,
1514
+ "step": 59115
1515
+ },
1516
+ {
1517
+ "epoch": 36.0,
1518
+ "grad_norm": 2.949153184890747,
1519
+ "learning_rate": 1.0261883136542537e-05,
1520
+ "loss": 0.3436,
1521
+ "step": 60804
1522
+ },
1523
+ {
1524
+ "epoch": 36.0,
1525
+ "eval_bigbrother_loss": 1.2538405656814575,
1526
+ "eval_bigbrother_runtime": 41.1392,
1527
+ "eval_bigbrother_samples_per_second": 33.302,
1528
+ "eval_bigbrother_steps_per_second": 1.045,
1529
+ "eval_bigbrother_wer": 0.3738822202529606,
1530
+ "step": 60804
1531
+ },
1532
+ {
1533
+ "epoch": 36.0,
1534
+ "eval_BB_NB_RUND_loss": 0.7353929877281189,
1535
+ "eval_BB_NB_RUND_runtime": 128.0616,
1536
+ "eval_BB_NB_RUND_samples_per_second": 25.363,
1537
+ "eval_BB_NB_RUND_steps_per_second": 0.796,
1538
+ "eval_BB_NB_RUND_wer": 0.22300324631770987,
1539
+ "step": 60804
1540
+ },
1541
+ {
1542
+ "epoch": 36.0,
1543
+ "eval_rundkast_loss": 0.313808798789978,
1544
+ "eval_rundkast_runtime": 33.2884,
1545
+ "eval_rundkast_samples_per_second": 40.404,
1546
+ "eval_rundkast_steps_per_second": 1.292,
1547
+ "eval_rundkast_wer": 0.1297327394209354,
1548
+ "step": 60804
1549
+ },
1550
+ {
1551
+ "epoch": 36.0,
1552
+ "eval_nb_samtale_loss": 0.466793030500412,
1553
+ "eval_nb_samtale_runtime": 36.3748,
1554
+ "eval_nb_samtale_samples_per_second": 14.653,
1555
+ "eval_nb_samtale_steps_per_second": 0.467,
1556
+ "eval_nb_samtale_wer": 0.16455078125,
1557
+ "step": 60804
1558
+ },
1559
+ {
1560
+ "epoch": 37.0,
1561
+ "grad_norm": 8.754982948303223,
1562
+ "learning_rate": 7.70663033605813e-06,
1563
+ "loss": 0.3476,
1564
+ "step": 62493
1565
+ },
1566
+ {
1567
+ "epoch": 37.0,
1568
+ "eval_bigbrother_loss": 1.2831249237060547,
1569
+ "eval_bigbrother_runtime": 41.6433,
1570
+ "eval_bigbrother_samples_per_second": 32.898,
1571
+ "eval_bigbrother_steps_per_second": 1.033,
1572
+ "eval_bigbrother_wer": 0.37219044550068475,
1573
+ "step": 62493
1574
+ },
1575
+ {
1576
+ "epoch": 37.0,
1577
+ "eval_BB_NB_RUND_loss": 0.7575647234916687,
1578
+ "eval_BB_NB_RUND_runtime": 156.4835,
1579
+ "eval_BB_NB_RUND_samples_per_second": 20.756,
1580
+ "eval_BB_NB_RUND_steps_per_second": 0.652,
1581
+ "eval_BB_NB_RUND_wer": 0.22139350199876587,
1582
+ "step": 62493
1583
+ },
1584
+ {
1585
+ "epoch": 37.0,
1586
+ "eval_rundkast_loss": 0.33385977149009705,
1587
+ "eval_rundkast_runtime": 32.6665,
1588
+ "eval_rundkast_samples_per_second": 41.174,
1589
+ "eval_rundkast_steps_per_second": 1.316,
1590
+ "eval_rundkast_wer": 0.12726694241170855,
1591
+ "step": 62493
1592
+ },
1593
+ {
1594
+ "epoch": 37.0,
1595
+ "eval_nb_samtale_loss": 0.47487109899520874,
1596
+ "eval_nb_samtale_runtime": 36.6818,
1597
+ "eval_nb_samtale_samples_per_second": 14.53,
1598
+ "eval_nb_samtale_steps_per_second": 0.463,
1599
+ "eval_nb_samtale_wer": 0.16495768229166666,
1600
+ "step": 62493
1601
+ },
1602
+ {
1603
+ "epoch": 38.0,
1604
+ "grad_norm": 3.9857819080352783,
1605
+ "learning_rate": 5.151377535573721e-06,
1606
+ "loss": 0.3395,
1607
+ "step": 64182
1608
+ },
1609
+ {
1610
+ "epoch": 38.0,
1611
+ "eval_bigbrother_loss": 1.2619588375091553,
1612
+ "eval_bigbrother_runtime": 40.9934,
1613
+ "eval_bigbrother_samples_per_second": 33.42,
1614
+ "eval_bigbrother_steps_per_second": 1.049,
1615
+ "eval_bigbrother_wer": 0.3714653991782808,
1616
+ "step": 64182
1617
+ },
1618
+ {
1619
+ "epoch": 38.0,
1620
+ "eval_BB_NB_RUND_loss": 0.7496170997619629,
1621
+ "eval_BB_NB_RUND_runtime": 127.9601,
1622
+ "eval_BB_NB_RUND_samples_per_second": 25.383,
1623
+ "eval_BB_NB_RUND_steps_per_second": 0.797,
1624
+ "eval_BB_NB_RUND_wer": 0.22184959622246667,
1625
+ "step": 64182
1626
+ },
1627
+ {
1628
+ "epoch": 38.0,
1629
+ "eval_rundkast_loss": 0.3360491693019867,
1630
+ "eval_rundkast_runtime": 33.333,
1631
+ "eval_rundkast_samples_per_second": 40.35,
1632
+ "eval_rundkast_steps_per_second": 1.29,
1633
+ "eval_rundkast_wer": 0.12830098631880368,
1634
+ "step": 64182
1635
+ },
1636
+ {
1637
+ "epoch": 38.0,
1638
+ "eval_nb_samtale_loss": 0.47765567898750305,
1639
+ "eval_nb_samtale_runtime": 36.2738,
1640
+ "eval_nb_samtale_samples_per_second": 14.694,
1641
+ "eval_nb_samtale_steps_per_second": 0.469,
1642
+ "eval_nb_samtale_wer": 0.16569010416666666,
1643
+ "step": 64182
1644
+ },
1645
+ {
1646
+ "epoch": 39.0,
1647
+ "grad_norm": 3.834691286087036,
1648
+ "learning_rate": 2.5946109597335756e-06,
1649
+ "loss": 0.3415,
1650
+ "step": 65871
1651
+ },
1652
+ {
1653
+ "epoch": 39.0,
1654
+ "eval_bigbrother_loss": 1.2587852478027344,
1655
+ "eval_bigbrother_runtime": 42.0349,
1656
+ "eval_bigbrother_samples_per_second": 32.592,
1657
+ "eval_bigbrother_steps_per_second": 1.023,
1658
+ "eval_bigbrother_wer": 0.3704986707484089,
1659
+ "step": 65871
1660
+ },
1661
+ {
1662
+ "epoch": 39.0,
1663
+ "eval_BB_NB_RUND_loss": 0.747022271156311,
1664
+ "eval_BB_NB_RUND_runtime": 165.2337,
1665
+ "eval_BB_NB_RUND_samples_per_second": 19.657,
1666
+ "eval_BB_NB_RUND_steps_per_second": 0.617,
1667
+ "eval_BB_NB_RUND_wer": 0.22021302283154026,
1668
+ "step": 65871
1669
+ },
1670
+ {
1671
+ "epoch": 39.0,
1672
+ "eval_rundkast_loss": 0.3341328203678131,
1673
+ "eval_rundkast_runtime": 32.991,
1674
+ "eval_rundkast_samples_per_second": 40.769,
1675
+ "eval_rundkast_steps_per_second": 1.303,
1676
+ "eval_rundkast_wer": 0.1265510658606427,
1677
+ "step": 65871
1678
+ },
1679
+ {
1680
+ "epoch": 39.0,
1681
+ "eval_nb_samtale_loss": 0.47388482093811035,
1682
+ "eval_nb_samtale_runtime": 36.3132,
1683
+ "eval_nb_samtale_samples_per_second": 14.678,
1684
+ "eval_nb_samtale_steps_per_second": 0.468,
1685
+ "eval_nb_samtale_wer": 0.16389973958333334,
1686
+ "step": 65871
1687
+ }
1688
+ ],
1689
+ "logging_steps": 500,
1690
+ "max_steps": 67560,
1691
+ "num_input_tokens_seen": 0,
1692
+ "num_train_epochs": 40,
1693
+ "save_steps": 500,
1694
+ "total_flos": 3.6574726698214536e+20,
1695
+ "train_batch_size": 48,
1696
+ "trial_name": null,
1697
+ "trial_params": null
1698
+ }
checkpoint-65871/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:350225cd13eaea5c53facdfd0bf5c84ee772638ee245537f79787ad7224840fa
3
+ size 4984
checkpoint-67560/config.json ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
3
+ "activation_dropout": 0.055,
4
+ "adapter_attn_dim": null,
5
+ "adapter_kernel_size": 3,
6
+ "adapter_stride": 2,
7
+ "add_adapter": false,
8
+ "apply_spec_augment": true,
9
+ "architectures": [
10
+ "Wav2Vec2ForCTC"
11
+ ],
12
+ "attention_dropout": 0.094,
13
+ "bos_token_id": 1,
14
+ "classifier_proj_size": 256,
15
+ "codevector_dim": 768,
16
+ "contrastive_logits_temperature": 0.1,
17
+ "conv_bias": true,
18
+ "conv_dim": [
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512,
25
+ 512
26
+ ],
27
+ "conv_kernel": [
28
+ 10,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 3,
33
+ 2,
34
+ 2
35
+ ],
36
+ "conv_stride": [
37
+ 5,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2,
43
+ 2
44
+ ],
45
+ "ctc_loss_reduction": "mean",
46
+ "ctc_zero_infinity": true,
47
+ "diversity_loss_weight": 0.1,
48
+ "do_stable_layer_norm": true,
49
+ "eos_token_id": 2,
50
+ "feat_extract_activation": "gelu",
51
+ "feat_extract_dropout": 0.0,
52
+ "feat_extract_norm": "layer",
53
+ "feat_proj_dropout": 0.04,
54
+ "feat_quantizer_dropout": 0.0,
55
+ "final_dropout": 0.0,
56
+ "hidden_act": "gelu",
57
+ "hidden_dropout": 0.047,
58
+ "hidden_size": 1024,
59
+ "initializer_range": 0.02,
60
+ "intermediate_size": 4096,
61
+ "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.041,
63
+ "mask_channel_length": 10,
64
+ "mask_channel_min_space": 1,
65
+ "mask_channel_other": 0.0,
66
+ "mask_channel_prob": 0.0,
67
+ "mask_channel_selection": "static",
68
+ "mask_feature_length": 64,
69
+ "mask_feature_min_masks": 0,
70
+ "mask_feature_prob": 0.25,
71
+ "mask_time_length": 10,
72
+ "mask_time_min_masks": 2,
73
+ "mask_time_min_space": 1,
74
+ "mask_time_other": 0.0,
75
+ "mask_time_prob": 0.082,
76
+ "mask_time_selection": "static",
77
+ "model_type": "wav2vec2",
78
+ "num_adapter_layers": 3,
79
+ "num_attention_heads": 16,
80
+ "num_codevector_groups": 2,
81
+ "num_codevectors_per_group": 320,
82
+ "num_conv_pos_embedding_groups": 16,
83
+ "num_conv_pos_embeddings": 128,
84
+ "num_feat_extract_layers": 7,
85
+ "num_hidden_layers": 24,
86
+ "num_negatives": 100,
87
+ "output_hidden_size": 1024,
88
+ "pad_token_id": 31,
89
+ "proj_codevector_dim": 768,
90
+ "tdnn_dilation": [
91
+ 1,
92
+ 2,
93
+ 3,
94
+ 1,
95
+ 1
96
+ ],
97
+ "tdnn_dim": [
98
+ 512,
99
+ 512,
100
+ 512,
101
+ 512,
102
+ 1500
103
+ ],
104
+ "tdnn_kernel": [
105
+ 5,
106
+ 3,
107
+ 3,
108
+ 1,
109
+ 1
110
+ ],
111
+ "torch_dtype": "float32",
112
+ "transformers_version": "4.38.1",
113
+ "use_weighted_layer_sum": false,
114
+ "vocab_size": 34,
115
+ "xvector_output_dim": 512
116
+ }
checkpoint-67560/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0826be868a8f5fd759dbf2b85a4655deaea32ffa6c27479443fcf37ceb5dc5d
3
+ size 1261946880
checkpoint-67560/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9831f50feb2bd1397556671fad14557a4d8af1d856515f4a66076c7bc7d24da
3
+ size 2490438582
checkpoint-67560/preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "processor_class": "Wav2Vec2ProcessorWithLM",
8
+ "return_attention_mask": true,
9
+ "sampling_rate": 16000
10
+ }
checkpoint-67560/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2266ae49b2f43d94c6b2ae41098615cbe4e6e72766b89431b513ee4344e7e801
3
+ size 14308
checkpoint-67560/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6284df78b3056008982cbae6b46769d982b0b1ac54dc8cdd29908a6bc0316f92
3
+ size 1064
checkpoint-67560/trainer_state.json ADDED
@@ -0,0 +1,1741 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.22021302283154026,
3
+ "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/Combined/BB-NB-RUND/30.05/checkpoint-65871",
4
+ "epoch": 40.0,
5
+ "eval_steps": 500,
6
+ "global_step": 67560,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 5.23741340637207,
14
+ "learning_rate": 9.971692400847715e-05,
15
+ "loss": 0.9222,
16
+ "step": 1689
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_bigbrother_loss": 1.5889759063720703,
21
+ "eval_bigbrother_runtime": 41.228,
22
+ "eval_bigbrother_samples_per_second": 33.23,
23
+ "eval_bigbrother_steps_per_second": 1.043,
24
+ "eval_bigbrother_wer": 0.5449931523402884,
25
+ "step": 1689
26
+ },
27
+ {
28
+ "epoch": 1.0,
29
+ "eval_BB_NB_RUND_loss": 0.9018728137016296,
30
+ "eval_BB_NB_RUND_runtime": 133.4774,
31
+ "eval_BB_NB_RUND_samples_per_second": 24.334,
32
+ "eval_BB_NB_RUND_steps_per_second": 0.764,
33
+ "eval_BB_NB_RUND_wer": 0.32291471038016795,
34
+ "step": 1689
35
+ },
36
+ {
37
+ "epoch": 1.0,
38
+ "eval_rundkast_loss": 0.3399111032485962,
39
+ "eval_rundkast_runtime": 32.978,
40
+ "eval_rundkast_samples_per_second": 40.785,
41
+ "eval_rundkast_steps_per_second": 1.304,
42
+ "eval_rundkast_wer": 0.1885937002863506,
43
+ "step": 1689
44
+ },
45
+ {
46
+ "epoch": 1.0,
47
+ "eval_nb_samtale_loss": 0.5534453988075256,
48
+ "eval_nb_samtale_runtime": 38.0417,
49
+ "eval_nb_samtale_samples_per_second": 14.011,
50
+ "eval_nb_samtale_steps_per_second": 0.447,
51
+ "eval_nb_samtale_wer": 0.235595703125,
52
+ "step": 1689
53
+ },
54
+ {
55
+ "epoch": 2.0,
56
+ "grad_norm": 3.7305831909179688,
57
+ "learning_rate": 9.716167120799274e-05,
58
+ "loss": 0.7821,
59
+ "step": 3378
60
+ },
61
+ {
62
+ "epoch": 2.0,
63
+ "eval_bigbrother_loss": 1.4070501327514648,
64
+ "eval_bigbrother_runtime": 41.1443,
65
+ "eval_bigbrother_samples_per_second": 33.297,
66
+ "eval_bigbrother_steps_per_second": 1.045,
67
+ "eval_bigbrother_wer": 0.510271489567389,
68
+ "step": 3378
69
+ },
70
+ {
71
+ "epoch": 2.0,
72
+ "eval_BB_NB_RUND_loss": 0.8076683282852173,
73
+ "eval_BB_NB_RUND_runtime": 129.6259,
74
+ "eval_BB_NB_RUND_samples_per_second": 25.057,
75
+ "eval_BB_NB_RUND_steps_per_second": 0.787,
76
+ "eval_BB_NB_RUND_wer": 0.30147828186623027,
77
+ "step": 3378
78
+ },
79
+ {
80
+ "epoch": 2.0,
81
+ "eval_rundkast_loss": 0.317608118057251,
82
+ "eval_rundkast_runtime": 32.5347,
83
+ "eval_rundkast_samples_per_second": 41.34,
84
+ "eval_rundkast_steps_per_second": 1.322,
85
+ "eval_rundkast_wer": 0.16775373846643335,
86
+ "step": 3378
87
+ },
88
+ {
89
+ "epoch": 2.0,
90
+ "eval_nb_samtale_loss": 0.5036561489105225,
91
+ "eval_nb_samtale_runtime": 37.1369,
92
+ "eval_nb_samtale_samples_per_second": 14.352,
93
+ "eval_nb_samtale_steps_per_second": 0.458,
94
+ "eval_nb_samtale_wer": 0.22639973958333334,
95
+ "step": 3378
96
+ },
97
+ {
98
+ "epoch": 3.0,
99
+ "grad_norm": 4.790787696838379,
100
+ "learning_rate": 9.460490463215258e-05,
101
+ "loss": 0.7185,
102
+ "step": 5067
103
+ },
104
+ {
105
+ "epoch": 3.0,
106
+ "eval_bigbrother_loss": 1.203812837600708,
107
+ "eval_bigbrother_runtime": 41.1237,
108
+ "eval_bigbrother_samples_per_second": 33.314,
109
+ "eval_bigbrother_steps_per_second": 1.046,
110
+ "eval_bigbrother_wer": 0.49714009506162893,
111
+ "step": 5067
112
+ },
113
+ {
114
+ "epoch": 3.0,
115
+ "eval_BB_NB_RUND_loss": 0.6942233443260193,
116
+ "eval_BB_NB_RUND_runtime": 132.6472,
117
+ "eval_BB_NB_RUND_samples_per_second": 24.486,
118
+ "eval_BB_NB_RUND_steps_per_second": 0.769,
119
+ "eval_BB_NB_RUND_wer": 0.2955222278861374,
120
+ "step": 5067
121
+ },
122
+ {
123
+ "epoch": 3.0,
124
+ "eval_rundkast_loss": 0.27395445108413696,
125
+ "eval_rundkast_runtime": 32.6467,
126
+ "eval_rundkast_samples_per_second": 41.199,
127
+ "eval_rundkast_steps_per_second": 1.317,
128
+ "eval_rundkast_wer": 0.16481069042316257,
129
+ "step": 5067
130
+ },
131
+ {
132
+ "epoch": 3.0,
133
+ "eval_nb_samtale_loss": 0.44476863741874695,
134
+ "eval_nb_samtale_runtime": 37.2129,
135
+ "eval_nb_samtale_samples_per_second": 14.323,
136
+ "eval_nb_samtale_steps_per_second": 0.457,
137
+ "eval_nb_samtale_wer": 0.225830078125,
138
+ "step": 5067
139
+ },
140
+ {
141
+ "epoch": 4.0,
142
+ "grad_norm": 4.615499496459961,
143
+ "learning_rate": 9.204965183166818e-05,
144
+ "loss": 0.6788,
145
+ "step": 6756
146
+ },
147
+ {
148
+ "epoch": 4.0,
149
+ "eval_bigbrother_loss": 1.1682614088058472,
150
+ "eval_bigbrother_runtime": 41.2735,
151
+ "eval_bigbrother_samples_per_second": 33.193,
152
+ "eval_bigbrother_steps_per_second": 1.042,
153
+ "eval_bigbrother_wer": 0.46934665270281156,
154
+ "step": 6756
155
+ },
156
+ {
157
+ "epoch": 4.0,
158
+ "eval_BB_NB_RUND_loss": 0.6765461564064026,
159
+ "eval_BB_NB_RUND_runtime": 128.689,
160
+ "eval_BB_NB_RUND_samples_per_second": 25.239,
161
+ "eval_BB_NB_RUND_steps_per_second": 0.793,
162
+ "eval_BB_NB_RUND_wer": 0.27942478469669735,
163
+ "step": 6756
164
+ },
165
+ {
166
+ "epoch": 4.0,
167
+ "eval_rundkast_loss": 0.2691804766654968,
168
+ "eval_rundkast_runtime": 32.6511,
169
+ "eval_rundkast_samples_per_second": 41.193,
170
+ "eval_rundkast_steps_per_second": 1.317,
171
+ "eval_rundkast_wer": 0.15566337893732102,
172
+ "step": 6756
173
+ },
174
+ {
175
+ "epoch": 4.0,
176
+ "eval_nb_samtale_loss": 0.4400266706943512,
177
+ "eval_nb_samtale_runtime": 37.139,
178
+ "eval_nb_samtale_samples_per_second": 14.351,
179
+ "eval_nb_samtale_steps_per_second": 0.458,
180
+ "eval_nb_samtale_wer": 0.21329752604166666,
181
+ "step": 6756
182
+ },
183
+ {
184
+ "epoch": 5.0,
185
+ "grad_norm": 5.309389591217041,
186
+ "learning_rate": 8.949288525582804e-05,
187
+ "loss": 0.6442,
188
+ "step": 8445
189
+ },
190
+ {
191
+ "epoch": 5.0,
192
+ "eval_bigbrother_loss": 1.163558006286621,
193
+ "eval_bigbrother_runtime": 41.5596,
194
+ "eval_bigbrother_samples_per_second": 32.965,
195
+ "eval_bigbrother_steps_per_second": 1.035,
196
+ "eval_bigbrother_wer": 0.46080721823894305,
197
+ "step": 8445
198
+ },
199
+ {
200
+ "epoch": 5.0,
201
+ "eval_BB_NB_RUND_loss": 0.6712897419929504,
202
+ "eval_BB_NB_RUND_runtime": 199.5442,
203
+ "eval_BB_NB_RUND_samples_per_second": 16.277,
204
+ "eval_BB_NB_RUND_steps_per_second": 0.511,
205
+ "eval_BB_NB_RUND_wer": 0.2733345853566925,
206
+ "step": 8445
207
+ },
208
+ {
209
+ "epoch": 5.0,
210
+ "eval_rundkast_loss": 0.26304560899734497,
211
+ "eval_rundkast_runtime": 32.653,
212
+ "eval_rundkast_samples_per_second": 41.191,
213
+ "eval_rundkast_steps_per_second": 1.317,
214
+ "eval_rundkast_wer": 0.15224307986000638,
215
+ "step": 8445
216
+ },
217
+ {
218
+ "epoch": 5.0,
219
+ "eval_nb_samtale_loss": 0.4362596273422241,
220
+ "eval_nb_samtale_runtime": 37.3619,
221
+ "eval_nb_samtale_samples_per_second": 14.266,
222
+ "eval_nb_samtale_steps_per_second": 0.455,
223
+ "eval_nb_samtale_wer": 0.20719401041666666,
224
+ "step": 8445
225
+ },
226
+ {
227
+ "epoch": 6.0,
228
+ "grad_norm": 3.735290050506592,
229
+ "learning_rate": 8.69361186799879e-05,
230
+ "loss": 0.6167,
231
+ "step": 10134
232
+ },
233
+ {
234
+ "epoch": 6.0,
235
+ "eval_bigbrother_loss": 1.111521601676941,
236
+ "eval_bigbrother_runtime": 41.747,
237
+ "eval_bigbrother_samples_per_second": 32.817,
238
+ "eval_bigbrother_steps_per_second": 1.03,
239
+ "eval_bigbrother_wer": 0.44960928059292676,
240
+ "step": 10134
241
+ },
242
+ {
243
+ "epoch": 6.0,
244
+ "eval_BB_NB_RUND_loss": 0.6480989456176758,
245
+ "eval_BB_NB_RUND_runtime": 129.1077,
246
+ "eval_BB_NB_RUND_samples_per_second": 25.157,
247
+ "eval_BB_NB_RUND_steps_per_second": 0.79,
248
+ "eval_BB_NB_RUND_wer": 0.2680224291041773,
249
+ "step": 10134
250
+ },
251
+ {
252
+ "epoch": 6.0,
253
+ "eval_rundkast_loss": 0.260196715593338,
254
+ "eval_rundkast_runtime": 32.8953,
255
+ "eval_rundkast_samples_per_second": 40.887,
256
+ "eval_rundkast_steps_per_second": 1.307,
257
+ "eval_rundkast_wer": 0.15001590836780146,
258
+ "step": 10134
259
+ },
260
+ {
261
+ "epoch": 6.0,
262
+ "eval_nb_samtale_loss": 0.4358641803264618,
263
+ "eval_nb_samtale_runtime": 37.2416,
264
+ "eval_nb_samtale_samples_per_second": 14.312,
265
+ "eval_nb_samtale_steps_per_second": 0.456,
266
+ "eval_nb_samtale_wer": 0.20475260416666666,
267
+ "step": 10134
268
+ },
269
+ {
270
+ "epoch": 7.0,
271
+ "grad_norm": 3.0601396560668945,
272
+ "learning_rate": 8.438086587950349e-05,
273
+ "loss": 0.5897,
274
+ "step": 11823
275
+ },
276
+ {
277
+ "epoch": 7.0,
278
+ "eval_bigbrother_loss": 1.1370279788970947,
279
+ "eval_bigbrother_runtime": 40.9127,
280
+ "eval_bigbrother_samples_per_second": 33.486,
281
+ "eval_bigbrother_steps_per_second": 1.051,
282
+ "eval_bigbrother_wer": 0.4386530250543785,
283
+ "step": 11823
284
+ },
285
+ {
286
+ "epoch": 7.0,
287
+ "eval_BB_NB_RUND_loss": 0.6591894626617432,
288
+ "eval_BB_NB_RUND_runtime": 131.1395,
289
+ "eval_BB_NB_RUND_samples_per_second": 24.768,
290
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
291
+ "eval_BB_NB_RUND_wer": 0.26238832398787326,
292
+ "step": 11823
293
+ },
294
+ {
295
+ "epoch": 7.0,
296
+ "eval_rundkast_loss": 0.268062025308609,
297
+ "eval_rundkast_runtime": 33.0258,
298
+ "eval_rundkast_samples_per_second": 40.726,
299
+ "eval_rundkast_steps_per_second": 1.302,
300
+ "eval_rundkast_wer": 0.14762965319758192,
301
+ "step": 11823
302
+ },
303
+ {
304
+ "epoch": 7.0,
305
+ "eval_nb_samtale_loss": 0.4182298183441162,
306
+ "eval_nb_samtale_runtime": 37.1616,
307
+ "eval_nb_samtale_samples_per_second": 14.343,
308
+ "eval_nb_samtale_steps_per_second": 0.457,
309
+ "eval_nb_samtale_wer": 0.20149739583333334,
310
+ "step": 11823
311
+ },
312
+ {
313
+ "epoch": 8.0,
314
+ "grad_norm": 5.5860819816589355,
315
+ "learning_rate": 8.182561307901908e-05,
316
+ "loss": 0.5683,
317
+ "step": 13512
318
+ },
319
+ {
320
+ "epoch": 8.0,
321
+ "eval_bigbrother_loss": 1.1404756307601929,
322
+ "eval_bigbrother_runtime": 40.7715,
323
+ "eval_bigbrother_samples_per_second": 33.602,
324
+ "eval_bigbrother_steps_per_second": 1.055,
325
+ "eval_bigbrother_wer": 0.429388544268106,
326
+ "step": 13512
327
+ },
328
+ {
329
+ "epoch": 8.0,
330
+ "eval_BB_NB_RUND_loss": 0.6637564897537231,
331
+ "eval_BB_NB_RUND_runtime": 129.0461,
332
+ "eval_BB_NB_RUND_samples_per_second": 25.169,
333
+ "eval_BB_NB_RUND_steps_per_second": 0.79,
334
+ "eval_BB_NB_RUND_wer": 0.255466423416414,
335
+ "step": 13512
336
+ },
337
+ {
338
+ "epoch": 8.0,
339
+ "eval_rundkast_loss": 0.26927700638771057,
340
+ "eval_rundkast_runtime": 32.7194,
341
+ "eval_rundkast_samples_per_second": 41.107,
342
+ "eval_rundkast_steps_per_second": 1.314,
343
+ "eval_rundkast_wer": 0.14230034998409163,
344
+ "step": 13512
345
+ },
346
+ {
347
+ "epoch": 8.0,
348
+ "eval_nb_samtale_loss": 0.43339914083480835,
349
+ "eval_nb_samtale_runtime": 37.1014,
350
+ "eval_nb_samtale_samples_per_second": 14.366,
351
+ "eval_nb_samtale_steps_per_second": 0.458,
352
+ "eval_nb_samtale_wer": 0.19539388020833334,
353
+ "step": 13512
354
+ },
355
+ {
356
+ "epoch": 9.0,
357
+ "grad_norm": 6.843884468078613,
358
+ "learning_rate": 7.927036027853467e-05,
359
+ "loss": 0.5532,
360
+ "step": 15201
361
+ },
362
+ {
363
+ "epoch": 9.0,
364
+ "eval_bigbrother_loss": 1.1039360761642456,
365
+ "eval_bigbrother_runtime": 41.1161,
366
+ "eval_bigbrother_samples_per_second": 33.32,
367
+ "eval_bigbrother_steps_per_second": 1.046,
368
+ "eval_bigbrother_wer": 0.42600499476355436,
369
+ "step": 15201
370
+ },
371
+ {
372
+ "epoch": 9.0,
373
+ "eval_BB_NB_RUND_loss": 0.6467078924179077,
374
+ "eval_BB_NB_RUND_runtime": 131.0223,
375
+ "eval_BB_NB_RUND_samples_per_second": 24.79,
376
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
377
+ "eval_BB_NB_RUND_wer": 0.2532664395138572,
378
+ "step": 15201
379
+ },
380
+ {
381
+ "epoch": 9.0,
382
+ "eval_rundkast_loss": 0.27150803804397583,
383
+ "eval_rundkast_runtime": 32.7213,
384
+ "eval_rundkast_samples_per_second": 41.105,
385
+ "eval_rundkast_steps_per_second": 1.314,
386
+ "eval_rundkast_wer": 0.14317531021317212,
387
+ "step": 15201
388
+ },
389
+ {
390
+ "epoch": 9.0,
391
+ "eval_nb_samtale_loss": 0.4183700680732727,
392
+ "eval_nb_samtale_runtime": 37.0058,
393
+ "eval_nb_samtale_samples_per_second": 14.403,
394
+ "eval_nb_samtale_steps_per_second": 0.459,
395
+ "eval_nb_samtale_wer": 0.19173177083333334,
396
+ "step": 15201
397
+ },
398
+ {
399
+ "epoch": 10.0,
400
+ "grad_norm": 4.194594860076904,
401
+ "learning_rate": 7.671359370269452e-05,
402
+ "loss": 0.5346,
403
+ "step": 16890
404
+ },
405
+ {
406
+ "epoch": 10.0,
407
+ "eval_bigbrother_loss": 1.1744848489761353,
408
+ "eval_bigbrother_runtime": 41.0112,
409
+ "eval_bigbrother_samples_per_second": 33.405,
410
+ "eval_bigbrother_steps_per_second": 1.048,
411
+ "eval_bigbrother_wer": 0.4209296705067268,
412
+ "step": 16890
413
+ },
414
+ {
415
+ "epoch": 10.0,
416
+ "eval_BB_NB_RUND_loss": 0.6952946782112122,
417
+ "eval_BB_NB_RUND_runtime": 128.204,
418
+ "eval_BB_NB_RUND_samples_per_second": 25.335,
419
+ "eval_BB_NB_RUND_steps_per_second": 0.796,
420
+ "eval_BB_NB_RUND_wer": 0.2505298741716524,
421
+ "step": 16890
422
+ },
423
+ {
424
+ "epoch": 10.0,
425
+ "eval_rundkast_loss": 0.2990908622741699,
426
+ "eval_rundkast_runtime": 32.6803,
427
+ "eval_rundkast_samples_per_second": 41.156,
428
+ "eval_rundkast_steps_per_second": 1.316,
429
+ "eval_rundkast_wer": 0.1403118040089087,
430
+ "step": 16890
431
+ },
432
+ {
433
+ "epoch": 10.0,
434
+ "eval_nb_samtale_loss": 0.46227914094924927,
435
+ "eval_nb_samtale_runtime": 37.038,
436
+ "eval_nb_samtale_samples_per_second": 14.391,
437
+ "eval_nb_samtale_steps_per_second": 0.459,
438
+ "eval_nb_samtale_wer": 0.19010416666666666,
439
+ "step": 16890
440
+ },
441
+ {
442
+ "epoch": 11.0,
443
+ "grad_norm": 4.1977338790893555,
444
+ "learning_rate": 7.415682712685438e-05,
445
+ "loss": 0.5173,
446
+ "step": 18579
447
+ },
448
+ {
449
+ "epoch": 11.0,
450
+ "eval_bigbrother_loss": 1.2221542596817017,
451
+ "eval_bigbrother_runtime": 40.9814,
452
+ "eval_bigbrother_samples_per_second": 33.43,
453
+ "eval_bigbrother_steps_per_second": 1.049,
454
+ "eval_bigbrother_wer": 0.4190767743494723,
455
+ "step": 18579
456
+ },
457
+ {
458
+ "epoch": 11.0,
459
+ "eval_BB_NB_RUND_loss": 0.7245953679084778,
460
+ "eval_BB_NB_RUND_runtime": 131.2027,
461
+ "eval_BB_NB_RUND_samples_per_second": 24.756,
462
+ "eval_BB_NB_RUND_steps_per_second": 0.777,
463
+ "eval_BB_NB_RUND_wer": 0.2488128135647788,
464
+ "step": 18579
465
+ },
466
+ {
467
+ "epoch": 11.0,
468
+ "eval_rundkast_loss": 0.3232197165489197,
469
+ "eval_rundkast_runtime": 32.6557,
470
+ "eval_rundkast_samples_per_second": 41.187,
471
+ "eval_rundkast_steps_per_second": 1.317,
472
+ "eval_rundkast_wer": 0.14237989182309896,
473
+ "step": 18579
474
+ },
475
+ {
476
+ "epoch": 11.0,
477
+ "eval_nb_samtale_loss": 0.4594550132751465,
478
+ "eval_nb_samtale_runtime": 37.0192,
479
+ "eval_nb_samtale_samples_per_second": 14.398,
480
+ "eval_nb_samtale_steps_per_second": 0.459,
481
+ "eval_nb_samtale_wer": 0.185302734375,
482
+ "step": 18579
483
+ },
484
+ {
485
+ "epoch": 12.0,
486
+ "grad_norm": 3.211408853530884,
487
+ "learning_rate": 7.160157432636997e-05,
488
+ "loss": 0.5034,
489
+ "step": 20268
490
+ },
491
+ {
492
+ "epoch": 12.0,
493
+ "eval_bigbrother_loss": 1.1385760307312012,
494
+ "eval_bigbrother_runtime": 40.816,
495
+ "eval_bigbrother_samples_per_second": 33.565,
496
+ "eval_bigbrother_steps_per_second": 1.054,
497
+ "eval_bigbrother_wer": 0.40981229356319987,
498
+ "step": 20268
499
+ },
500
+ {
501
+ "epoch": 12.0,
502
+ "eval_BB_NB_RUND_loss": 0.6762681603431702,
503
+ "eval_BB_NB_RUND_runtime": 128.7262,
504
+ "eval_BB_NB_RUND_samples_per_second": 25.232,
505
+ "eval_BB_NB_RUND_steps_per_second": 0.792,
506
+ "eval_BB_NB_RUND_wer": 0.24229334907305555,
507
+ "step": 20268
508
+ },
509
+ {
510
+ "epoch": 12.0,
511
+ "eval_rundkast_loss": 0.2944062352180481,
512
+ "eval_rundkast_runtime": 32.5788,
513
+ "eval_rundkast_samples_per_second": 41.284,
514
+ "eval_rundkast_steps_per_second": 1.32,
515
+ "eval_rundkast_wer": 0.1358574610244989,
516
+ "step": 20268
517
+ },
518
+ {
519
+ "epoch": 12.0,
520
+ "eval_nb_samtale_loss": 0.451029509305954,
521
+ "eval_nb_samtale_runtime": 36.6243,
522
+ "eval_nb_samtale_samples_per_second": 14.553,
523
+ "eval_nb_samtale_steps_per_second": 0.464,
524
+ "eval_nb_samtale_wer": 0.18172200520833334,
525
+ "step": 20268
526
+ },
527
+ {
528
+ "epoch": 13.0,
529
+ "grad_norm": 4.915965557098389,
530
+ "learning_rate": 6.904783530124131e-05,
531
+ "loss": 0.4922,
532
+ "step": 21957
533
+ },
534
+ {
535
+ "epoch": 13.0,
536
+ "eval_bigbrother_loss": 1.070022702217102,
537
+ "eval_bigbrother_runtime": 41.6248,
538
+ "eval_bigbrother_samples_per_second": 32.913,
539
+ "eval_bigbrother_steps_per_second": 1.033,
540
+ "eval_bigbrother_wer": 0.408845565133328,
541
+ "step": 21957
542
+ },
543
+ {
544
+ "epoch": 13.0,
545
+ "eval_BB_NB_RUND_loss": 0.641231894493103,
546
+ "eval_BB_NB_RUND_runtime": 130.0831,
547
+ "eval_BB_NB_RUND_samples_per_second": 24.969,
548
+ "eval_BB_NB_RUND_steps_per_second": 0.784,
549
+ "eval_BB_NB_RUND_wer": 0.24320553752045718,
550
+ "step": 21957
551
+ },
552
+ {
553
+ "epoch": 13.0,
554
+ "eval_rundkast_loss": 0.28888097405433655,
555
+ "eval_rundkast_runtime": 32.35,
556
+ "eval_rundkast_samples_per_second": 41.577,
557
+ "eval_rundkast_steps_per_second": 1.329,
558
+ "eval_rundkast_wer": 0.14023226216990137,
559
+ "step": 21957
560
+ },
561
+ {
562
+ "epoch": 13.0,
563
+ "eval_nb_samtale_loss": 0.4279041886329651,
564
+ "eval_nb_samtale_runtime": 36.6119,
565
+ "eval_nb_samtale_samples_per_second": 14.558,
566
+ "eval_nb_samtale_steps_per_second": 0.464,
567
+ "eval_nb_samtale_wer": 0.18180338541666666,
568
+ "step": 21957
569
+ },
570
+ {
571
+ "epoch": 14.0,
572
+ "grad_norm": 7.668597221374512,
573
+ "learning_rate": 6.649106872540115e-05,
574
+ "loss": 0.4787,
575
+ "step": 23646
576
+ },
577
+ {
578
+ "epoch": 14.0,
579
+ "eval_bigbrother_loss": 1.123586893081665,
580
+ "eval_bigbrother_runtime": 40.9041,
581
+ "eval_bigbrother_samples_per_second": 33.493,
582
+ "eval_bigbrother_steps_per_second": 1.051,
583
+ "eval_bigbrother_wer": 0.4079593974059454,
584
+ "step": 23646
585
+ },
586
+ {
587
+ "epoch": 14.0,
588
+ "eval_BB_NB_RUND_loss": 0.6701177358627319,
589
+ "eval_BB_NB_RUND_runtime": 128.6687,
590
+ "eval_BB_NB_RUND_samples_per_second": 25.243,
591
+ "eval_BB_NB_RUND_steps_per_second": 0.793,
592
+ "eval_BB_NB_RUND_wer": 0.24256163979287956,
593
+ "step": 23646
594
+ },
595
+ {
596
+ "epoch": 14.0,
597
+ "eval_rundkast_loss": 0.2999539077281952,
598
+ "eval_rundkast_runtime": 33.5296,
599
+ "eval_rundkast_samples_per_second": 40.114,
600
+ "eval_rundkast_steps_per_second": 1.282,
601
+ "eval_rundkast_wer": 0.13697104677060135,
602
+ "step": 23646
603
+ },
604
+ {
605
+ "epoch": 14.0,
606
+ "eval_nb_samtale_loss": 0.43806180357933044,
607
+ "eval_nb_samtale_runtime": 36.6824,
608
+ "eval_nb_samtale_samples_per_second": 14.53,
609
+ "eval_nb_samtale_steps_per_second": 0.463,
610
+ "eval_nb_samtale_wer": 0.18375651041666666,
611
+ "step": 23646
612
+ },
613
+ {
614
+ "epoch": 15.0,
615
+ "grad_norm": 8.808441162109375,
616
+ "learning_rate": 6.393430214956101e-05,
617
+ "loss": 0.4663,
618
+ "step": 25335
619
+ },
620
+ {
621
+ "epoch": 15.0,
622
+ "eval_bigbrother_loss": 1.160325050354004,
623
+ "eval_bigbrother_runtime": 41.0537,
624
+ "eval_bigbrother_samples_per_second": 33.371,
625
+ "eval_bigbrother_steps_per_second": 1.047,
626
+ "eval_bigbrother_wer": 0.3999033271570128,
627
+ "step": 25335
628
+ },
629
+ {
630
+ "epoch": 15.0,
631
+ "eval_BB_NB_RUND_loss": 0.6799572706222534,
632
+ "eval_BB_NB_RUND_runtime": 185.9813,
633
+ "eval_BB_NB_RUND_samples_per_second": 17.464,
634
+ "eval_BB_NB_RUND_steps_per_second": 0.548,
635
+ "eval_BB_NB_RUND_wer": 0.23767874869208275,
636
+ "step": 25335
637
+ },
638
+ {
639
+ "epoch": 15.0,
640
+ "eval_rundkast_loss": 0.2853633463382721,
641
+ "eval_rundkast_runtime": 32.9208,
642
+ "eval_rundkast_samples_per_second": 40.856,
643
+ "eval_rundkast_steps_per_second": 1.306,
644
+ "eval_rundkast_wer": 0.1345847916003818,
645
+ "step": 25335
646
+ },
647
+ {
648
+ "epoch": 15.0,
649
+ "eval_nb_samtale_loss": 0.4409109652042389,
650
+ "eval_nb_samtale_runtime": 36.4232,
651
+ "eval_nb_samtale_samples_per_second": 14.634,
652
+ "eval_nb_samtale_steps_per_second": 0.467,
653
+ "eval_nb_samtale_wer": 0.178466796875,
654
+ "step": 25335
655
+ },
656
+ {
657
+ "epoch": 16.0,
658
+ "grad_norm": 4.101474761962891,
659
+ "learning_rate": 6.137753557372086e-05,
660
+ "loss": 0.4579,
661
+ "step": 27024
662
+ },
663
+ {
664
+ "epoch": 16.0,
665
+ "eval_bigbrother_loss": 1.155598759651184,
666
+ "eval_bigbrother_runtime": 42.3097,
667
+ "eval_bigbrother_samples_per_second": 32.38,
668
+ "eval_bigbrother_steps_per_second": 1.016,
669
+ "eval_bigbrother_wer": 0.3999033271570128,
670
+ "step": 27024
671
+ },
672
+ {
673
+ "epoch": 16.0,
674
+ "eval_BB_NB_RUND_loss": 0.6771286129951477,
675
+ "eval_BB_NB_RUND_runtime": 128.4569,
676
+ "eval_BB_NB_RUND_samples_per_second": 25.285,
677
+ "eval_BB_NB_RUND_steps_per_second": 0.794,
678
+ "eval_BB_NB_RUND_wer": 0.23773240683604754,
679
+ "step": 27024
680
+ },
681
+ {
682
+ "epoch": 16.0,
683
+ "eval_rundkast_loss": 0.27949705719947815,
684
+ "eval_rundkast_runtime": 32.5865,
685
+ "eval_rundkast_samples_per_second": 41.275,
686
+ "eval_rundkast_steps_per_second": 1.32,
687
+ "eval_rundkast_wer": 0.13450524976137448,
688
+ "step": 27024
689
+ },
690
+ {
691
+ "epoch": 16.0,
692
+ "eval_nb_samtale_loss": 0.4515434503555298,
693
+ "eval_nb_samtale_runtime": 37.0041,
694
+ "eval_nb_samtale_samples_per_second": 14.404,
695
+ "eval_nb_samtale_steps_per_second": 0.459,
696
+ "eval_nb_samtale_wer": 0.17936197916666666,
697
+ "step": 27024
698
+ },
699
+ {
700
+ "epoch": 17.0,
701
+ "grad_norm": 9.384012222290039,
702
+ "learning_rate": 5.882379654859219e-05,
703
+ "loss": 0.4469,
704
+ "step": 28713
705
+ },
706
+ {
707
+ "epoch": 17.0,
708
+ "eval_bigbrother_loss": 1.1895906925201416,
709
+ "eval_bigbrother_runtime": 40.9285,
710
+ "eval_bigbrother_samples_per_second": 33.473,
711
+ "eval_bigbrother_steps_per_second": 1.051,
712
+ "eval_bigbrother_wer": 0.40167566261177795,
713
+ "step": 28713
714
+ },
715
+ {
716
+ "epoch": 17.0,
717
+ "eval_BB_NB_RUND_loss": 0.6978138089179993,
718
+ "eval_BB_NB_RUND_runtime": 169.0105,
719
+ "eval_BB_NB_RUND_samples_per_second": 19.218,
720
+ "eval_BB_NB_RUND_steps_per_second": 0.604,
721
+ "eval_BB_NB_RUND_wer": 0.23837630456362516,
722
+ "step": 28713
723
+ },
724
+ {
725
+ "epoch": 17.0,
726
+ "eval_rundkast_loss": 0.29528018832206726,
727
+ "eval_rundkast_runtime": 32.6968,
728
+ "eval_rundkast_samples_per_second": 41.136,
729
+ "eval_rundkast_steps_per_second": 1.315,
730
+ "eval_rundkast_wer": 0.1377664651606745,
731
+ "step": 28713
732
+ },
733
+ {
734
+ "epoch": 17.0,
735
+ "eval_nb_samtale_loss": 0.4508727788925171,
736
+ "eval_nb_samtale_runtime": 36.4289,
737
+ "eval_nb_samtale_samples_per_second": 14.631,
738
+ "eval_nb_samtale_steps_per_second": 0.467,
739
+ "eval_nb_samtale_wer": 0.17667643229166666,
740
+ "step": 28713
741
+ },
742
+ {
743
+ "epoch": 18.0,
744
+ "grad_norm": 3.587054491043091,
745
+ "learning_rate": 5.626702997275205e-05,
746
+ "loss": 0.4399,
747
+ "step": 30402
748
+ },
749
+ {
750
+ "epoch": 18.0,
751
+ "eval_bigbrother_loss": 1.1661101579666138,
752
+ "eval_bigbrother_runtime": 41.0139,
753
+ "eval_bigbrother_samples_per_second": 33.403,
754
+ "eval_bigbrother_steps_per_second": 1.048,
755
+ "eval_bigbrother_wer": 0.3982921131072263,
756
+ "step": 30402
757
+ },
758
+ {
759
+ "epoch": 18.0,
760
+ "eval_BB_NB_RUND_loss": 0.6934623718261719,
761
+ "eval_BB_NB_RUND_runtime": 127.79,
762
+ "eval_BB_NB_RUND_samples_per_second": 25.417,
763
+ "eval_BB_NB_RUND_steps_per_second": 0.798,
764
+ "eval_BB_NB_RUND_wer": 0.23443243098221234,
765
+ "step": 30402
766
+ },
767
+ {
768
+ "epoch": 18.0,
769
+ "eval_rundkast_loss": 0.3097790777683258,
770
+ "eval_rundkast_runtime": 32.5419,
771
+ "eval_rundkast_samples_per_second": 41.331,
772
+ "eval_rundkast_steps_per_second": 1.321,
773
+ "eval_rundkast_wer": 0.13307349665924276,
774
+ "step": 30402
775
+ },
776
+ {
777
+ "epoch": 18.0,
778
+ "eval_nb_samtale_loss": 0.4466961622238159,
779
+ "eval_nb_samtale_runtime": 36.4501,
780
+ "eval_nb_samtale_samples_per_second": 14.623,
781
+ "eval_nb_samtale_steps_per_second": 0.466,
782
+ "eval_nb_samtale_wer": 0.17268880208333334,
783
+ "step": 30402
784
+ },
785
+ {
786
+ "epoch": 19.0,
787
+ "grad_norm": 4.3045973777771,
788
+ "learning_rate": 5.371177717226764e-05,
789
+ "loss": 0.4313,
790
+ "step": 32091
791
+ },
792
+ {
793
+ "epoch": 19.0,
794
+ "eval_bigbrother_loss": 1.1764683723449707,
795
+ "eval_bigbrother_runtime": 41.1081,
796
+ "eval_bigbrother_samples_per_second": 33.327,
797
+ "eval_bigbrother_steps_per_second": 1.046,
798
+ "eval_bigbrother_wer": 0.3935390316603561,
799
+ "step": 32091
800
+ },
801
+ {
802
+ "epoch": 19.0,
803
+ "eval_BB_NB_RUND_loss": 0.6927400231361389,
804
+ "eval_BB_NB_RUND_runtime": 131.0803,
805
+ "eval_BB_NB_RUND_samples_per_second": 24.779,
806
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
807
+ "eval_BB_NB_RUND_wer": 0.23349341346282831,
808
+ "step": 32091
809
+ },
810
+ {
811
+ "epoch": 19.0,
812
+ "eval_rundkast_loss": 0.296793133020401,
813
+ "eval_rundkast_runtime": 32.4376,
814
+ "eval_rundkast_samples_per_second": 41.464,
815
+ "eval_rundkast_steps_per_second": 1.326,
816
+ "eval_rundkast_wer": 0.13355074769328668,
817
+ "step": 32091
818
+ },
819
+ {
820
+ "epoch": 19.0,
821
+ "eval_nb_samtale_loss": 0.44873738288879395,
822
+ "eval_nb_samtale_runtime": 36.5729,
823
+ "eval_nb_samtale_samples_per_second": 14.574,
824
+ "eval_nb_samtale_steps_per_second": 0.465,
825
+ "eval_nb_samtale_wer": 0.17415364583333334,
826
+ "step": 32091
827
+ },
828
+ {
829
+ "epoch": 20.0,
830
+ "grad_norm": 2.650940418243408,
831
+ "learning_rate": 5.115501059642749e-05,
832
+ "loss": 0.4229,
833
+ "step": 33780
834
+ },
835
+ {
836
+ "epoch": 20.0,
837
+ "eval_bigbrother_loss": 1.1612807512283325,
838
+ "eval_bigbrother_runtime": 41.2062,
839
+ "eval_bigbrother_samples_per_second": 33.247,
840
+ "eval_bigbrother_steps_per_second": 1.044,
841
+ "eval_bigbrother_wer": 0.39402239587529203,
842
+ "step": 33780
843
+ },
844
+ {
845
+ "epoch": 20.0,
846
+ "eval_BB_NB_RUND_loss": 0.6827826499938965,
847
+ "eval_BB_NB_RUND_runtime": 326.107,
848
+ "eval_BB_NB_RUND_samples_per_second": 9.96,
849
+ "eval_BB_NB_RUND_steps_per_second": 0.313,
850
+ "eval_BB_NB_RUND_wer": 0.23164220749604272,
851
+ "step": 33780
852
+ },
853
+ {
854
+ "epoch": 20.0,
855
+ "eval_rundkast_loss": 0.29459282755851746,
856
+ "eval_rundkast_runtime": 36.3812,
857
+ "eval_rundkast_samples_per_second": 36.97,
858
+ "eval_rundkast_steps_per_second": 1.182,
859
+ "eval_rundkast_wer": 0.12957365574292076,
860
+ "step": 33780
861
+ },
862
+ {
863
+ "epoch": 20.0,
864
+ "eval_nb_samtale_loss": 0.4326167404651642,
865
+ "eval_nb_samtale_runtime": 39.3019,
866
+ "eval_nb_samtale_samples_per_second": 13.562,
867
+ "eval_nb_samtale_steps_per_second": 0.433,
868
+ "eval_nb_samtale_wer": 0.17252604166666666,
869
+ "step": 33780
870
+ },
871
+ {
872
+ "epoch": 21.0,
873
+ "grad_norm": 6.971451282501221,
874
+ "learning_rate": 4.859975779594308e-05,
875
+ "loss": 0.4173,
876
+ "step": 35469
877
+ },
878
+ {
879
+ "epoch": 21.0,
880
+ "eval_bigbrother_loss": 1.18746018409729,
881
+ "eval_bigbrother_runtime": 42.6131,
882
+ "eval_bigbrother_samples_per_second": 32.15,
883
+ "eval_bigbrother_steps_per_second": 1.009,
884
+ "eval_bigbrother_wer": 0.3920889390155482,
885
+ "step": 35469
886
+ },
887
+ {
888
+ "epoch": 21.0,
889
+ "eval_BB_NB_RUND_loss": 0.6960651874542236,
890
+ "eval_BB_NB_RUND_runtime": 153.2803,
891
+ "eval_BB_NB_RUND_samples_per_second": 21.19,
892
+ "eval_BB_NB_RUND_steps_per_second": 0.665,
893
+ "eval_BB_NB_RUND_wer": 0.23126660048828912,
894
+ "step": 35469
895
+ },
896
+ {
897
+ "epoch": 21.0,
898
+ "eval_rundkast_loss": 0.2939074635505676,
899
+ "eval_rundkast_runtime": 161.3899,
900
+ "eval_rundkast_samples_per_second": 8.334,
901
+ "eval_rundkast_steps_per_second": 0.266,
902
+ "eval_rundkast_wer": 0.13084632516703787,
903
+ "step": 35469
904
+ },
905
+ {
906
+ "epoch": 21.0,
907
+ "eval_nb_samtale_loss": 0.44757071137428284,
908
+ "eval_nb_samtale_runtime": 49.4947,
909
+ "eval_nb_samtale_samples_per_second": 10.769,
910
+ "eval_nb_samtale_steps_per_second": 0.343,
911
+ "eval_nb_samtale_wer": 0.17244466145833334,
912
+ "step": 35469
913
+ },
914
+ {
915
+ "epoch": 22.0,
916
+ "grad_norm": 7.361974716186523,
917
+ "learning_rate": 4.6042991220102936e-05,
918
+ "loss": 0.4101,
919
+ "step": 37158
920
+ },
921
+ {
922
+ "epoch": 22.0,
923
+ "eval_bigbrother_loss": 1.2487200498580933,
924
+ "eval_bigbrother_runtime": 44.9933,
925
+ "eval_bigbrother_samples_per_second": 30.449,
926
+ "eval_bigbrother_steps_per_second": 0.956,
927
+ "eval_bigbrother_wer": 0.39152501409812296,
928
+ "step": 37158
929
+ },
930
+ {
931
+ "epoch": 22.0,
932
+ "eval_BB_NB_RUND_loss": 0.7247402667999268,
933
+ "eval_BB_NB_RUND_runtime": 182.0939,
934
+ "eval_BB_NB_RUND_samples_per_second": 17.837,
935
+ "eval_BB_NB_RUND_steps_per_second": 0.56,
936
+ "eval_BB_NB_RUND_wer": 0.2308105062645883,
937
+ "step": 37158
938
+ },
939
+ {
940
+ "epoch": 22.0,
941
+ "eval_rundkast_loss": 0.2898001968860626,
942
+ "eval_rundkast_runtime": 38.6925,
943
+ "eval_rundkast_samples_per_second": 34.761,
944
+ "eval_rundkast_steps_per_second": 1.111,
945
+ "eval_rundkast_wer": 0.13084632516703787,
946
+ "step": 37158
947
+ },
948
+ {
949
+ "epoch": 22.0,
950
+ "eval_nb_samtale_loss": 0.4750688672065735,
951
+ "eval_nb_samtale_runtime": 42.0801,
952
+ "eval_nb_samtale_samples_per_second": 12.666,
953
+ "eval_nb_samtale_steps_per_second": 0.404,
954
+ "eval_nb_samtale_wer": 0.1708984375,
955
+ "step": 37158
956
+ },
957
+ {
958
+ "epoch": 23.0,
959
+ "grad_norm": 3.2216553688049316,
960
+ "learning_rate": 4.348773841961853e-05,
961
+ "loss": 0.3985,
962
+ "step": 38847
963
+ },
964
+ {
965
+ "epoch": 23.0,
966
+ "eval_bigbrother_loss": 1.1696597337722778,
967
+ "eval_bigbrother_runtime": 41.468,
968
+ "eval_bigbrother_samples_per_second": 33.038,
969
+ "eval_bigbrother_steps_per_second": 1.037,
970
+ "eval_bigbrother_wer": 0.3846773543865302,
971
+ "step": 38847
972
+ },
973
+ {
974
+ "epoch": 23.0,
975
+ "eval_BB_NB_RUND_loss": 0.6836020350456238,
976
+ "eval_BB_NB_RUND_runtime": 175.228,
977
+ "eval_BB_NB_RUND_samples_per_second": 18.536,
978
+ "eval_BB_NB_RUND_steps_per_second": 0.582,
979
+ "eval_BB_NB_RUND_wer": 0.2291739328736619,
980
+ "step": 38847
981
+ },
982
+ {
983
+ "epoch": 23.0,
984
+ "eval_rundkast_loss": 0.2838425934314728,
985
+ "eval_rundkast_runtime": 32.5363,
986
+ "eval_rundkast_samples_per_second": 41.338,
987
+ "eval_rundkast_steps_per_second": 1.322,
988
+ "eval_rundkast_wer": 0.1319599109131403,
989
+ "step": 38847
990
+ },
991
+ {
992
+ "epoch": 23.0,
993
+ "eval_nb_samtale_loss": 0.442909300327301,
994
+ "eval_nb_samtale_runtime": 36.3978,
995
+ "eval_nb_samtale_samples_per_second": 14.644,
996
+ "eval_nb_samtale_steps_per_second": 0.467,
997
+ "eval_nb_samtale_wer": 0.17203776041666666,
998
+ "step": 38847
999
+ },
1000
+ {
1001
+ "epoch": 24.0,
1002
+ "grad_norm": 8.511246681213379,
1003
+ "learning_rate": 4.0933999394489856e-05,
1004
+ "loss": 0.3943,
1005
+ "step": 40536
1006
+ },
1007
+ {
1008
+ "epoch": 24.0,
1009
+ "eval_bigbrother_loss": 1.1965091228485107,
1010
+ "eval_bigbrother_runtime": 41.19,
1011
+ "eval_bigbrother_samples_per_second": 33.26,
1012
+ "eval_bigbrother_steps_per_second": 1.044,
1013
+ "eval_bigbrother_wer": 0.38363006525416904,
1014
+ "step": 40536
1015
+ },
1016
+ {
1017
+ "epoch": 24.0,
1018
+ "eval_BB_NB_RUND_loss": 0.7099454402923584,
1019
+ "eval_BB_NB_RUND_runtime": 129.9149,
1020
+ "eval_BB_NB_RUND_samples_per_second": 25.001,
1021
+ "eval_BB_NB_RUND_steps_per_second": 0.785,
1022
+ "eval_BB_NB_RUND_wer": 0.2286910095779787,
1023
+ "step": 40536
1024
+ },
1025
+ {
1026
+ "epoch": 24.0,
1027
+ "eval_rundkast_loss": 0.31351616978645325,
1028
+ "eval_rundkast_runtime": 32.5656,
1029
+ "eval_rundkast_samples_per_second": 41.301,
1030
+ "eval_rundkast_steps_per_second": 1.32,
1031
+ "eval_rundkast_wer": 0.13108495068405981,
1032
+ "step": 40536
1033
+ },
1034
+ {
1035
+ "epoch": 24.0,
1036
+ "eval_nb_samtale_loss": 0.4599841833114624,
1037
+ "eval_nb_samtale_runtime": 36.637,
1038
+ "eval_nb_samtale_samples_per_second": 14.548,
1039
+ "eval_nb_samtale_steps_per_second": 0.464,
1040
+ "eval_nb_samtale_wer": 0.17154947916666666,
1041
+ "step": 40536
1042
+ },
1043
+ {
1044
+ "epoch": 25.0,
1045
+ "grad_norm": 3.3434505462646484,
1046
+ "learning_rate": 3.837723281864972e-05,
1047
+ "loss": 0.3902,
1048
+ "step": 42225
1049
+ },
1050
+ {
1051
+ "epoch": 25.0,
1052
+ "eval_bigbrother_loss": 1.194956660270691,
1053
+ "eval_bigbrother_runtime": 41.082,
1054
+ "eval_bigbrother_samples_per_second": 33.348,
1055
+ "eval_bigbrother_steps_per_second": 1.047,
1056
+ "eval_bigbrother_wer": 0.38193829050189315,
1057
+ "step": 42225
1058
+ },
1059
+ {
1060
+ "epoch": 25.0,
1061
+ "eval_BB_NB_RUND_loss": 0.7117018103599548,
1062
+ "eval_BB_NB_RUND_runtime": 129.0515,
1063
+ "eval_BB_NB_RUND_samples_per_second": 25.168,
1064
+ "eval_BB_NB_RUND_steps_per_second": 0.79,
1065
+ "eval_BB_NB_RUND_wer": 0.2270812652590347,
1066
+ "step": 42225
1067
+ },
1068
+ {
1069
+ "epoch": 25.0,
1070
+ "eval_rundkast_loss": 0.31047695875167847,
1071
+ "eval_rundkast_runtime": 32.4929,
1072
+ "eval_rundkast_samples_per_second": 41.394,
1073
+ "eval_rundkast_steps_per_second": 1.323,
1074
+ "eval_rundkast_wer": 0.13124403436207446,
1075
+ "step": 42225
1076
+ },
1077
+ {
1078
+ "epoch": 25.0,
1079
+ "eval_nb_samtale_loss": 0.48264163732528687,
1080
+ "eval_nb_samtale_runtime": 36.4332,
1081
+ "eval_nb_samtale_samples_per_second": 14.63,
1082
+ "eval_nb_samtale_steps_per_second": 0.467,
1083
+ "eval_nb_samtale_wer": 0.16878255208333334,
1084
+ "step": 42225
1085
+ },
1086
+ {
1087
+ "epoch": 26.0,
1088
+ "grad_norm": 3.0726335048675537,
1089
+ "learning_rate": 3.582046624280957e-05,
1090
+ "loss": 0.3836,
1091
+ "step": 43914
1092
+ },
1093
+ {
1094
+ "epoch": 26.0,
1095
+ "eval_bigbrother_loss": 1.2235493659973145,
1096
+ "eval_bigbrother_runtime": 41.1244,
1097
+ "eval_bigbrother_samples_per_second": 33.314,
1098
+ "eval_bigbrother_steps_per_second": 1.046,
1099
+ "eval_bigbrother_wer": 0.3832272617417224,
1100
+ "step": 43914
1101
+ },
1102
+ {
1103
+ "epoch": 26.0,
1104
+ "eval_BB_NB_RUND_loss": 0.7329136729240417,
1105
+ "eval_BB_NB_RUND_runtime": 153.8243,
1106
+ "eval_BB_NB_RUND_samples_per_second": 21.115,
1107
+ "eval_BB_NB_RUND_steps_per_second": 0.663,
1108
+ "eval_BB_NB_RUND_wer": 0.22842271885815468,
1109
+ "step": 43914
1110
+ },
1111
+ {
1112
+ "epoch": 26.0,
1113
+ "eval_rundkast_loss": 0.3316984474658966,
1114
+ "eval_rundkast_runtime": 32.4356,
1115
+ "eval_rundkast_samples_per_second": 41.467,
1116
+ "eval_rundkast_steps_per_second": 1.326,
1117
+ "eval_rundkast_wer": 0.13434616608335984,
1118
+ "step": 43914
1119
+ },
1120
+ {
1121
+ "epoch": 26.0,
1122
+ "eval_nb_samtale_loss": 0.48570868372917175,
1123
+ "eval_nb_samtale_runtime": 36.6552,
1124
+ "eval_nb_samtale_samples_per_second": 14.541,
1125
+ "eval_nb_samtale_steps_per_second": 0.464,
1126
+ "eval_nb_samtale_wer": 0.16731770833333334,
1127
+ "step": 43914
1128
+ },
1129
+ {
1130
+ "epoch": 27.0,
1131
+ "grad_norm": 15.335138320922852,
1132
+ "learning_rate": 3.3263699666969425e-05,
1133
+ "loss": 0.3786,
1134
+ "step": 45603
1135
+ },
1136
+ {
1137
+ "epoch": 27.0,
1138
+ "eval_bigbrother_loss": 1.205081820487976,
1139
+ "eval_bigbrother_runtime": 40.4664,
1140
+ "eval_bigbrother_samples_per_second": 33.855,
1141
+ "eval_bigbrother_steps_per_second": 1.063,
1142
+ "eval_bigbrother_wer": 0.3794409087247241,
1143
+ "step": 45603
1144
+ },
1145
+ {
1146
+ "epoch": 27.0,
1147
+ "eval_BB_NB_RUND_loss": 0.7199556231498718,
1148
+ "eval_BB_NB_RUND_runtime": 130.4204,
1149
+ "eval_BB_NB_RUND_samples_per_second": 24.904,
1150
+ "eval_BB_NB_RUND_steps_per_second": 0.782,
1151
+ "eval_BB_NB_RUND_wer": 0.22506908486035468,
1152
+ "step": 45603
1153
+ },
1154
+ {
1155
+ "epoch": 27.0,
1156
+ "eval_rundkast_loss": 0.31949692964553833,
1157
+ "eval_rundkast_runtime": 32.7387,
1158
+ "eval_rundkast_samples_per_second": 41.083,
1159
+ "eval_rundkast_steps_per_second": 1.313,
1160
+ "eval_rundkast_wer": 0.12846006999681833,
1161
+ "step": 45603
1162
+ },
1163
+ {
1164
+ "epoch": 27.0,
1165
+ "eval_nb_samtale_loss": 0.48315760493278503,
1166
+ "eval_nb_samtale_runtime": 36.3915,
1167
+ "eval_nb_samtale_samples_per_second": 14.646,
1168
+ "eval_nb_samtale_steps_per_second": 0.467,
1169
+ "eval_nb_samtale_wer": 0.16715494791666666,
1170
+ "step": 45603
1171
+ },
1172
+ {
1173
+ "epoch": 28.0,
1174
+ "grad_norm": 9.487163543701172,
1175
+ "learning_rate": 3.0708446866485016e-05,
1176
+ "loss": 0.3752,
1177
+ "step": 47292
1178
+ },
1179
+ {
1180
+ "epoch": 28.0,
1181
+ "eval_bigbrother_loss": 1.200919508934021,
1182
+ "eval_bigbrother_runtime": 40.9519,
1183
+ "eval_bigbrother_samples_per_second": 33.454,
1184
+ "eval_bigbrother_steps_per_second": 1.05,
1185
+ "eval_bigbrother_wer": 0.380165955047128,
1186
+ "step": 47292
1187
+ },
1188
+ {
1189
+ "epoch": 28.0,
1190
+ "eval_BB_NB_RUND_loss": 0.7172989845275879,
1191
+ "eval_BB_NB_RUND_runtime": 127.4559,
1192
+ "eval_BB_NB_RUND_samples_per_second": 25.483,
1193
+ "eval_BB_NB_RUND_steps_per_second": 0.8,
1194
+ "eval_BB_NB_RUND_wer": 0.2256861535159499,
1195
+ "step": 47292
1196
+ },
1197
+ {
1198
+ "epoch": 28.0,
1199
+ "eval_rundkast_loss": 0.3196479082107544,
1200
+ "eval_rundkast_runtime": 32.5881,
1201
+ "eval_rundkast_samples_per_second": 41.273,
1202
+ "eval_rundkast_steps_per_second": 1.319,
1203
+ "eval_rundkast_wer": 0.13084632516703787,
1204
+ "step": 47292
1205
+ },
1206
+ {
1207
+ "epoch": 28.0,
1208
+ "eval_nb_samtale_loss": 0.4765280485153198,
1209
+ "eval_nb_samtale_runtime": 37.1947,
1210
+ "eval_nb_samtale_samples_per_second": 14.33,
1211
+ "eval_nb_samtale_steps_per_second": 0.457,
1212
+ "eval_nb_samtale_wer": 0.16731770833333334,
1213
+ "step": 47292
1214
+ },
1215
+ {
1216
+ "epoch": 29.0,
1217
+ "grad_norm": 4.333740234375,
1218
+ "learning_rate": 2.8153194066000604e-05,
1219
+ "loss": 0.3718,
1220
+ "step": 48981
1221
+ },
1222
+ {
1223
+ "epoch": 29.0,
1224
+ "eval_bigbrother_loss": 1.2218164205551147,
1225
+ "eval_bigbrother_runtime": 40.6907,
1226
+ "eval_bigbrother_samples_per_second": 33.669,
1227
+ "eval_bigbrother_steps_per_second": 1.057,
1228
+ "eval_bigbrother_wer": 0.37621848062515106,
1229
+ "step": 48981
1230
+ },
1231
+ {
1232
+ "epoch": 29.0,
1233
+ "eval_BB_NB_RUND_loss": 0.7251059412956238,
1234
+ "eval_BB_NB_RUND_runtime": 151.9233,
1235
+ "eval_BB_NB_RUND_samples_per_second": 21.379,
1236
+ "eval_BB_NB_RUND_steps_per_second": 0.671,
1237
+ "eval_BB_NB_RUND_wer": 0.22418372548493548,
1238
+ "step": 48981
1239
+ },
1240
+ {
1241
+ "epoch": 29.0,
1242
+ "eval_rundkast_loss": 0.319437175989151,
1243
+ "eval_rundkast_runtime": 32.7825,
1244
+ "eval_rundkast_samples_per_second": 41.028,
1245
+ "eval_rundkast_steps_per_second": 1.312,
1246
+ "eval_rundkast_wer": 0.13084632516703787,
1247
+ "step": 48981
1248
+ },
1249
+ {
1250
+ "epoch": 29.0,
1251
+ "eval_nb_samtale_loss": 0.4711519181728363,
1252
+ "eval_nb_samtale_runtime": 36.3015,
1253
+ "eval_nb_samtale_samples_per_second": 14.683,
1254
+ "eval_nb_samtale_steps_per_second": 0.468,
1255
+ "eval_nb_samtale_wer": 0.16609700520833334,
1256
+ "step": 48981
1257
+ },
1258
+ {
1259
+ "epoch": 30.0,
1260
+ "grad_norm": 6.403714179992676,
1261
+ "learning_rate": 2.5596427490160462e-05,
1262
+ "loss": 0.3645,
1263
+ "step": 50670
1264
+ },
1265
+ {
1266
+ "epoch": 30.0,
1267
+ "eval_bigbrother_loss": 1.183604121208191,
1268
+ "eval_bigbrother_runtime": 42.3075,
1269
+ "eval_bigbrother_samples_per_second": 32.382,
1270
+ "eval_bigbrother_steps_per_second": 1.016,
1271
+ "eval_bigbrother_wer": 0.37557399500523647,
1272
+ "step": 50670
1273
+ },
1274
+ {
1275
+ "epoch": 30.0,
1276
+ "eval_BB_NB_RUND_loss": 0.7078377604484558,
1277
+ "eval_BB_NB_RUND_runtime": 127.3976,
1278
+ "eval_BB_NB_RUND_samples_per_second": 25.495,
1279
+ "eval_BB_NB_RUND_steps_per_second": 0.801,
1280
+ "eval_BB_NB_RUND_wer": 0.22356665682934027,
1281
+ "step": 50670
1282
+ },
1283
+ {
1284
+ "epoch": 30.0,
1285
+ "eval_rundkast_loss": 0.3230808675289154,
1286
+ "eval_rundkast_runtime": 32.4456,
1287
+ "eval_rundkast_samples_per_second": 41.454,
1288
+ "eval_rundkast_steps_per_second": 1.325,
1289
+ "eval_rundkast_wer": 0.12861915367483295,
1290
+ "step": 50670
1291
+ },
1292
+ {
1293
+ "epoch": 30.0,
1294
+ "eval_nb_samtale_loss": 0.4557996094226837,
1295
+ "eval_nb_samtale_runtime": 36.3068,
1296
+ "eval_nb_samtale_samples_per_second": 14.68,
1297
+ "eval_nb_samtale_steps_per_second": 0.468,
1298
+ "eval_nb_samtale_wer": 0.16642252604166666,
1299
+ "step": 50670
1300
+ },
1301
+ {
1302
+ "epoch": 31.0,
1303
+ "grad_norm": 3.91894268989563,
1304
+ "learning_rate": 2.3041174689676053e-05,
1305
+ "loss": 0.3609,
1306
+ "step": 52359
1307
+ },
1308
+ {
1309
+ "epoch": 31.0,
1310
+ "eval_bigbrother_loss": 1.2197799682617188,
1311
+ "eval_bigbrother_runtime": 41.1407,
1312
+ "eval_bigbrother_samples_per_second": 33.3,
1313
+ "eval_bigbrother_steps_per_second": 1.045,
1314
+ "eval_bigbrother_wer": 0.37565455570772577,
1315
+ "step": 52359
1316
+ },
1317
+ {
1318
+ "epoch": 31.0,
1319
+ "eval_BB_NB_RUND_loss": 0.7260043025016785,
1320
+ "eval_BB_NB_RUND_runtime": 131.0819,
1321
+ "eval_BB_NB_RUND_samples_per_second": 24.778,
1322
+ "eval_BB_NB_RUND_steps_per_second": 0.778,
1323
+ "eval_BB_NB_RUND_wer": 0.22383494754916428,
1324
+ "step": 52359
1325
+ },
1326
+ {
1327
+ "epoch": 31.0,
1328
+ "eval_rundkast_loss": 0.32174140214920044,
1329
+ "eval_rundkast_runtime": 32.4715,
1330
+ "eval_rundkast_samples_per_second": 41.421,
1331
+ "eval_rundkast_steps_per_second": 1.324,
1332
+ "eval_rundkast_wer": 0.12885777919185493,
1333
+ "step": 52359
1334
+ },
1335
+ {
1336
+ "epoch": 31.0,
1337
+ "eval_nb_samtale_loss": 0.47712796926498413,
1338
+ "eval_nb_samtale_runtime": 36.1596,
1339
+ "eval_nb_samtale_samples_per_second": 14.74,
1340
+ "eval_nb_samtale_steps_per_second": 0.47,
1341
+ "eval_nb_samtale_wer": 0.166748046875,
1342
+ "step": 52359
1343
+ },
1344
+ {
1345
+ "epoch": 32.0,
1346
+ "grad_norm": 2.9196996688842773,
1347
+ "learning_rate": 2.0485921889191645e-05,
1348
+ "loss": 0.36,
1349
+ "step": 54048
1350
+ },
1351
+ {
1352
+ "epoch": 32.0,
1353
+ "eval_bigbrother_loss": 1.2731306552886963,
1354
+ "eval_bigbrother_runtime": 40.9963,
1355
+ "eval_bigbrother_samples_per_second": 33.418,
1356
+ "eval_bigbrother_steps_per_second": 1.049,
1357
+ "eval_bigbrother_wer": 0.3735599774430033,
1358
+ "step": 54048
1359
+ },
1360
+ {
1361
+ "epoch": 32.0,
1362
+ "eval_BB_NB_RUND_loss": 0.7525675296783447,
1363
+ "eval_BB_NB_RUND_runtime": 128.3644,
1364
+ "eval_BB_NB_RUND_samples_per_second": 25.303,
1365
+ "eval_BB_NB_RUND_steps_per_second": 0.795,
1366
+ "eval_BB_NB_RUND_wer": 0.22262763930995627,
1367
+ "step": 54048
1368
+ },
1369
+ {
1370
+ "epoch": 32.0,
1371
+ "eval_rundkast_loss": 0.3295101523399353,
1372
+ "eval_rundkast_runtime": 33.7671,
1373
+ "eval_rundkast_samples_per_second": 39.832,
1374
+ "eval_rundkast_steps_per_second": 1.273,
1375
+ "eval_rundkast_wer": 0.12798281896277441,
1376
+ "step": 54048
1377
+ },
1378
+ {
1379
+ "epoch": 32.0,
1380
+ "eval_nb_samtale_loss": 0.48206984996795654,
1381
+ "eval_nb_samtale_runtime": 36.7176,
1382
+ "eval_nb_samtale_samples_per_second": 14.516,
1383
+ "eval_nb_samtale_steps_per_second": 0.463,
1384
+ "eval_nb_samtale_wer": 0.16691080729166666,
1385
+ "step": 54048
1386
+ },
1387
+ {
1388
+ "epoch": 33.0,
1389
+ "grad_norm": 7.844558238983154,
1390
+ "learning_rate": 1.7929155313351502e-05,
1391
+ "loss": 0.3497,
1392
+ "step": 55737
1393
+ },
1394
+ {
1395
+ "epoch": 33.0,
1396
+ "eval_bigbrother_loss": 1.2425702810287476,
1397
+ "eval_bigbrother_runtime": 40.5135,
1398
+ "eval_bigbrother_samples_per_second": 33.816,
1399
+ "eval_bigbrother_steps_per_second": 1.061,
1400
+ "eval_bigbrother_wer": 0.37219044550068475,
1401
+ "step": 55737
1402
+ },
1403
+ {
1404
+ "epoch": 33.0,
1405
+ "eval_BB_NB_RUND_loss": 0.7353043556213379,
1406
+ "eval_BB_NB_RUND_runtime": 130.7216,
1407
+ "eval_BB_NB_RUND_samples_per_second": 24.847,
1408
+ "eval_BB_NB_RUND_steps_per_second": 0.78,
1409
+ "eval_BB_NB_RUND_wer": 0.22085692055911785,
1410
+ "step": 55737
1411
+ },
1412
+ {
1413
+ "epoch": 33.0,
1414
+ "eval_rundkast_loss": 0.32282164692878723,
1415
+ "eval_rundkast_runtime": 32.5615,
1416
+ "eval_rundkast_samples_per_second": 41.306,
1417
+ "eval_rundkast_steps_per_second": 1.321,
1418
+ "eval_rundkast_wer": 0.12623289850461342,
1419
+ "step": 55737
1420
+ },
1421
+ {
1422
+ "epoch": 33.0,
1423
+ "eval_nb_samtale_loss": 0.47214123606681824,
1424
+ "eval_nb_samtale_runtime": 36.5675,
1425
+ "eval_nb_samtale_samples_per_second": 14.576,
1426
+ "eval_nb_samtale_steps_per_second": 0.465,
1427
+ "eval_nb_samtale_wer": 0.16357421875,
1428
+ "step": 55737
1429
+ },
1430
+ {
1431
+ "epoch": 34.0,
1432
+ "grad_norm": 7.324841022491455,
1433
+ "learning_rate": 1.537541628822283e-05,
1434
+ "loss": 0.352,
1435
+ "step": 57426
1436
+ },
1437
+ {
1438
+ "epoch": 34.0,
1439
+ "eval_bigbrother_loss": 1.306195616722107,
1440
+ "eval_bigbrother_runtime": 41.3854,
1441
+ "eval_bigbrother_samples_per_second": 33.103,
1442
+ "eval_bigbrother_steps_per_second": 1.039,
1443
+ "eval_bigbrother_wer": 0.3747683879803432,
1444
+ "step": 57426
1445
+ },
1446
+ {
1447
+ "epoch": 34.0,
1448
+ "eval_BB_NB_RUND_loss": 0.7695896029472351,
1449
+ "eval_BB_NB_RUND_runtime": 128.8264,
1450
+ "eval_BB_NB_RUND_samples_per_second": 25.212,
1451
+ "eval_BB_NB_RUND_steps_per_second": 0.792,
1452
+ "eval_BB_NB_RUND_wer": 0.22206422879832585,
1453
+ "step": 57426
1454
+ },
1455
+ {
1456
+ "epoch": 34.0,
1457
+ "eval_rundkast_loss": 0.33627748489379883,
1458
+ "eval_rundkast_runtime": 35.7,
1459
+ "eval_rundkast_samples_per_second": 37.675,
1460
+ "eval_rundkast_steps_per_second": 1.204,
1461
+ "eval_rundkast_wer": 0.1270283168946866,
1462
+ "step": 57426
1463
+ },
1464
+ {
1465
+ "epoch": 34.0,
1466
+ "eval_nb_samtale_loss": 0.48346221446990967,
1467
+ "eval_nb_samtale_runtime": 37.2815,
1468
+ "eval_nb_samtale_samples_per_second": 14.297,
1469
+ "eval_nb_samtale_steps_per_second": 0.456,
1470
+ "eval_nb_samtale_wer": 0.16487630208333334,
1471
+ "step": 57426
1472
+ },
1473
+ {
1474
+ "epoch": 35.0,
1475
+ "grad_norm": 8.772356986999512,
1476
+ "learning_rate": 1.2818649712382683e-05,
1477
+ "loss": 0.3475,
1478
+ "step": 59115
1479
+ },
1480
+ {
1481
+ "epoch": 35.0,
1482
+ "eval_bigbrother_loss": 1.2660571336746216,
1483
+ "eval_bigbrother_runtime": 41.6526,
1484
+ "eval_bigbrother_samples_per_second": 32.891,
1485
+ "eval_bigbrother_steps_per_second": 1.032,
1486
+ "eval_bigbrother_wer": 0.37662128413759766,
1487
+ "step": 59115
1488
+ },
1489
+ {
1490
+ "epoch": 35.0,
1491
+ "eval_BB_NB_RUND_loss": 0.7468720078468323,
1492
+ "eval_BB_NB_RUND_runtime": 168.5154,
1493
+ "eval_BB_NB_RUND_samples_per_second": 19.274,
1494
+ "eval_BB_NB_RUND_steps_per_second": 0.605,
1495
+ "eval_BB_NB_RUND_wer": 0.22329836610951628,
1496
+ "step": 59115
1497
+ },
1498
+ {
1499
+ "epoch": 35.0,
1500
+ "eval_rundkast_loss": 0.3307986259460449,
1501
+ "eval_rundkast_runtime": 32.7759,
1502
+ "eval_rundkast_samples_per_second": 41.036,
1503
+ "eval_rundkast_steps_per_second": 1.312,
1504
+ "eval_rundkast_wer": 0.12861915367483295,
1505
+ "step": 59115
1506
+ },
1507
+ {
1508
+ "epoch": 35.0,
1509
+ "eval_nb_samtale_loss": 0.4614698588848114,
1510
+ "eval_nb_samtale_runtime": 36.7886,
1511
+ "eval_nb_samtale_samples_per_second": 14.488,
1512
+ "eval_nb_samtale_steps_per_second": 0.462,
1513
+ "eval_nb_samtale_wer": 0.1650390625,
1514
+ "step": 59115
1515
+ },
1516
+ {
1517
+ "epoch": 36.0,
1518
+ "grad_norm": 2.949153184890747,
1519
+ "learning_rate": 1.0261883136542537e-05,
1520
+ "loss": 0.3436,
1521
+ "step": 60804
1522
+ },
1523
+ {
1524
+ "epoch": 36.0,
1525
+ "eval_bigbrother_loss": 1.2538405656814575,
1526
+ "eval_bigbrother_runtime": 41.1392,
1527
+ "eval_bigbrother_samples_per_second": 33.302,
1528
+ "eval_bigbrother_steps_per_second": 1.045,
1529
+ "eval_bigbrother_wer": 0.3738822202529606,
1530
+ "step": 60804
1531
+ },
1532
+ {
1533
+ "epoch": 36.0,
1534
+ "eval_BB_NB_RUND_loss": 0.7353929877281189,
1535
+ "eval_BB_NB_RUND_runtime": 128.0616,
1536
+ "eval_BB_NB_RUND_samples_per_second": 25.363,
1537
+ "eval_BB_NB_RUND_steps_per_second": 0.796,
1538
+ "eval_BB_NB_RUND_wer": 0.22300324631770987,
1539
+ "step": 60804
1540
+ },
1541
+ {
1542
+ "epoch": 36.0,
1543
+ "eval_rundkast_loss": 0.313808798789978,
1544
+ "eval_rundkast_runtime": 33.2884,
1545
+ "eval_rundkast_samples_per_second": 40.404,
1546
+ "eval_rundkast_steps_per_second": 1.292,
1547
+ "eval_rundkast_wer": 0.1297327394209354,
1548
+ "step": 60804
1549
+ },
1550
+ {
1551
+ "epoch": 36.0,
1552
+ "eval_nb_samtale_loss": 0.466793030500412,
1553
+ "eval_nb_samtale_runtime": 36.3748,
1554
+ "eval_nb_samtale_samples_per_second": 14.653,
1555
+ "eval_nb_samtale_steps_per_second": 0.467,
1556
+ "eval_nb_samtale_wer": 0.16455078125,
1557
+ "step": 60804
1558
+ },
1559
+ {
1560
+ "epoch": 37.0,
1561
+ "grad_norm": 8.754982948303223,
1562
+ "learning_rate": 7.70663033605813e-06,
1563
+ "loss": 0.3476,
1564
+ "step": 62493
1565
+ },
1566
+ {
1567
+ "epoch": 37.0,
1568
+ "eval_bigbrother_loss": 1.2831249237060547,
1569
+ "eval_bigbrother_runtime": 41.6433,
1570
+ "eval_bigbrother_samples_per_second": 32.898,
1571
+ "eval_bigbrother_steps_per_second": 1.033,
1572
+ "eval_bigbrother_wer": 0.37219044550068475,
1573
+ "step": 62493
1574
+ },
1575
+ {
1576
+ "epoch": 37.0,
1577
+ "eval_BB_NB_RUND_loss": 0.7575647234916687,
1578
+ "eval_BB_NB_RUND_runtime": 156.4835,
1579
+ "eval_BB_NB_RUND_samples_per_second": 20.756,
1580
+ "eval_BB_NB_RUND_steps_per_second": 0.652,
1581
+ "eval_BB_NB_RUND_wer": 0.22139350199876587,
1582
+ "step": 62493
1583
+ },
1584
+ {
1585
+ "epoch": 37.0,
1586
+ "eval_rundkast_loss": 0.33385977149009705,
1587
+ "eval_rundkast_runtime": 32.6665,
1588
+ "eval_rundkast_samples_per_second": 41.174,
1589
+ "eval_rundkast_steps_per_second": 1.316,
1590
+ "eval_rundkast_wer": 0.12726694241170855,
1591
+ "step": 62493
1592
+ },
1593
+ {
1594
+ "epoch": 37.0,
1595
+ "eval_nb_samtale_loss": 0.47487109899520874,
1596
+ "eval_nb_samtale_runtime": 36.6818,
1597
+ "eval_nb_samtale_samples_per_second": 14.53,
1598
+ "eval_nb_samtale_steps_per_second": 0.463,
1599
+ "eval_nb_samtale_wer": 0.16495768229166666,
1600
+ "step": 62493
1601
+ },
1602
+ {
1603
+ "epoch": 38.0,
1604
+ "grad_norm": 3.9857819080352783,
1605
+ "learning_rate": 5.151377535573721e-06,
1606
+ "loss": 0.3395,
1607
+ "step": 64182
1608
+ },
1609
+ {
1610
+ "epoch": 38.0,
1611
+ "eval_bigbrother_loss": 1.2619588375091553,
1612
+ "eval_bigbrother_runtime": 40.9934,
1613
+ "eval_bigbrother_samples_per_second": 33.42,
1614
+ "eval_bigbrother_steps_per_second": 1.049,
1615
+ "eval_bigbrother_wer": 0.3714653991782808,
1616
+ "step": 64182
1617
+ },
1618
+ {
1619
+ "epoch": 38.0,
1620
+ "eval_BB_NB_RUND_loss": 0.7496170997619629,
1621
+ "eval_BB_NB_RUND_runtime": 127.9601,
1622
+ "eval_BB_NB_RUND_samples_per_second": 25.383,
1623
+ "eval_BB_NB_RUND_steps_per_second": 0.797,
1624
+ "eval_BB_NB_RUND_wer": 0.22184959622246667,
1625
+ "step": 64182
1626
+ },
1627
+ {
1628
+ "epoch": 38.0,
1629
+ "eval_rundkast_loss": 0.3360491693019867,
1630
+ "eval_rundkast_runtime": 33.333,
1631
+ "eval_rundkast_samples_per_second": 40.35,
1632
+ "eval_rundkast_steps_per_second": 1.29,
1633
+ "eval_rundkast_wer": 0.12830098631880368,
1634
+ "step": 64182
1635
+ },
1636
+ {
1637
+ "epoch": 38.0,
1638
+ "eval_nb_samtale_loss": 0.47765567898750305,
1639
+ "eval_nb_samtale_runtime": 36.2738,
1640
+ "eval_nb_samtale_samples_per_second": 14.694,
1641
+ "eval_nb_samtale_steps_per_second": 0.469,
1642
+ "eval_nb_samtale_wer": 0.16569010416666666,
1643
+ "step": 64182
1644
+ },
1645
+ {
1646
+ "epoch": 39.0,
1647
+ "grad_norm": 3.834691286087036,
1648
+ "learning_rate": 2.5946109597335756e-06,
1649
+ "loss": 0.3415,
1650
+ "step": 65871
1651
+ },
1652
+ {
1653
+ "epoch": 39.0,
1654
+ "eval_bigbrother_loss": 1.2587852478027344,
1655
+ "eval_bigbrother_runtime": 42.0349,
1656
+ "eval_bigbrother_samples_per_second": 32.592,
1657
+ "eval_bigbrother_steps_per_second": 1.023,
1658
+ "eval_bigbrother_wer": 0.3704986707484089,
1659
+ "step": 65871
1660
+ },
1661
+ {
1662
+ "epoch": 39.0,
1663
+ "eval_BB_NB_RUND_loss": 0.747022271156311,
1664
+ "eval_BB_NB_RUND_runtime": 165.2337,
1665
+ "eval_BB_NB_RUND_samples_per_second": 19.657,
1666
+ "eval_BB_NB_RUND_steps_per_second": 0.617,
1667
+ "eval_BB_NB_RUND_wer": 0.22021302283154026,
1668
+ "step": 65871
1669
+ },
1670
+ {
1671
+ "epoch": 39.0,
1672
+ "eval_rundkast_loss": 0.3341328203678131,
1673
+ "eval_rundkast_runtime": 32.991,
1674
+ "eval_rundkast_samples_per_second": 40.769,
1675
+ "eval_rundkast_steps_per_second": 1.303,
1676
+ "eval_rundkast_wer": 0.1265510658606427,
1677
+ "step": 65871
1678
+ },
1679
+ {
1680
+ "epoch": 39.0,
1681
+ "eval_nb_samtale_loss": 0.47388482093811035,
1682
+ "eval_nb_samtale_runtime": 36.3132,
1683
+ "eval_nb_samtale_samples_per_second": 14.678,
1684
+ "eval_nb_samtale_steps_per_second": 0.468,
1685
+ "eval_nb_samtale_wer": 0.16389973958333334,
1686
+ "step": 65871
1687
+ },
1688
+ {
1689
+ "epoch": 40.0,
1690
+ "grad_norm": 44.58503723144531,
1691
+ "learning_rate": 3.7844383893430213e-08,
1692
+ "loss": 0.3428,
1693
+ "step": 67560
1694
+ },
1695
+ {
1696
+ "epoch": 40.0,
1697
+ "eval_bigbrother_loss": 1.2595266103744507,
1698
+ "eval_bigbrother_runtime": 40.7024,
1699
+ "eval_bigbrother_samples_per_second": 33.659,
1700
+ "eval_bigbrother_steps_per_second": 1.056,
1701
+ "eval_bigbrother_wer": 0.3710625956658342,
1702
+ "step": 67560
1703
+ },
1704
+ {
1705
+ "epoch": 40.0,
1706
+ "eval_BB_NB_RUND_loss": 0.7480508089065552,
1707
+ "eval_BB_NB_RUND_runtime": 127.9218,
1708
+ "eval_BB_NB_RUND_samples_per_second": 25.391,
1709
+ "eval_BB_NB_RUND_steps_per_second": 0.797,
1710
+ "eval_BB_NB_RUND_wer": 0.22099106591902987,
1711
+ "step": 67560
1712
+ },
1713
+ {
1714
+ "epoch": 40.0,
1715
+ "eval_rundkast_loss": 0.33537447452545166,
1716
+ "eval_rundkast_runtime": 33.3316,
1717
+ "eval_rundkast_samples_per_second": 40.352,
1718
+ "eval_rundkast_steps_per_second": 1.29,
1719
+ "eval_rundkast_wer": 0.12726694241170855,
1720
+ "step": 67560
1721
+ },
1722
+ {
1723
+ "epoch": 40.0,
1724
+ "eval_nb_samtale_loss": 0.4731021523475647,
1725
+ "eval_nb_samtale_runtime": 36.64,
1726
+ "eval_nb_samtale_samples_per_second": 14.547,
1727
+ "eval_nb_samtale_steps_per_second": 0.464,
1728
+ "eval_nb_samtale_wer": 0.16471354166666666,
1729
+ "step": 67560
1730
+ }
1731
+ ],
1732
+ "logging_steps": 500,
1733
+ "max_steps": 67560,
1734
+ "num_input_tokens_seen": 0,
1735
+ "num_train_epochs": 40,
1736
+ "save_steps": 500,
1737
+ "total_flos": 3.75124860202745e+20,
1738
+ "train_batch_size": 48,
1739
+ "trial_name": null,
1740
+ "trial_params": null
1741
+ }
checkpoint-67560/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:350225cd13eaea5c53facdfd0bf5c84ee772638ee245537f79787ad7224840fa
3
+ size 4984
config.json ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "NbAiLab/nb-wav2vec2-300m-bokmaal",
3
+ "activation_dropout": 0.055,
4
+ "adapter_attn_dim": null,
5
+ "adapter_kernel_size": 3,
6
+ "adapter_stride": 2,
7
+ "add_adapter": false,
8
+ "apply_spec_augment": true,
9
+ "architectures": [
10
+ "Wav2Vec2ForCTC"
11
+ ],
12
+ "attention_dropout": 0.094,
13
+ "bos_token_id": 1,
14
+ "classifier_proj_size": 256,
15
+ "codevector_dim": 768,
16
+ "contrastive_logits_temperature": 0.1,
17
+ "conv_bias": true,
18
+ "conv_dim": [
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512,
25
+ 512
26
+ ],
27
+ "conv_kernel": [
28
+ 10,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 3,
33
+ 2,
34
+ 2
35
+ ],
36
+ "conv_stride": [
37
+ 5,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2,
43
+ 2
44
+ ],
45
+ "ctc_loss_reduction": "mean",
46
+ "ctc_zero_infinity": true,
47
+ "diversity_loss_weight": 0.1,
48
+ "do_stable_layer_norm": true,
49
+ "eos_token_id": 2,
50
+ "feat_extract_activation": "gelu",
51
+ "feat_extract_dropout": 0.0,
52
+ "feat_extract_norm": "layer",
53
+ "feat_proj_dropout": 0.04,
54
+ "feat_quantizer_dropout": 0.0,
55
+ "final_dropout": 0.0,
56
+ "hidden_act": "gelu",
57
+ "hidden_dropout": 0.047,
58
+ "hidden_size": 1024,
59
+ "initializer_range": 0.02,
60
+ "intermediate_size": 4096,
61
+ "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.041,
63
+ "mask_channel_length": 10,
64
+ "mask_channel_min_space": 1,
65
+ "mask_channel_other": 0.0,
66
+ "mask_channel_prob": 0.0,
67
+ "mask_channel_selection": "static",
68
+ "mask_feature_length": 64,
69
+ "mask_feature_min_masks": 0,
70
+ "mask_feature_prob": 0.25,
71
+ "mask_time_length": 10,
72
+ "mask_time_min_masks": 2,
73
+ "mask_time_min_space": 1,
74
+ "mask_time_other": 0.0,
75
+ "mask_time_prob": 0.082,
76
+ "mask_time_selection": "static",
77
+ "model_type": "wav2vec2",
78
+ "num_adapter_layers": 3,
79
+ "num_attention_heads": 16,
80
+ "num_codevector_groups": 2,
81
+ "num_codevectors_per_group": 320,
82
+ "num_conv_pos_embedding_groups": 16,
83
+ "num_conv_pos_embeddings": 128,
84
+ "num_feat_extract_layers": 7,
85
+ "num_hidden_layers": 24,
86
+ "num_negatives": 100,
87
+ "output_hidden_size": 1024,
88
+ "pad_token_id": 31,
89
+ "proj_codevector_dim": 768,
90
+ "tdnn_dilation": [
91
+ 1,
92
+ 2,
93
+ 3,
94
+ 1,
95
+ 1
96
+ ],
97
+ "tdnn_dim": [
98
+ 512,
99
+ 512,
100
+ 512,
101
+ 512,
102
+ 1500
103
+ ],
104
+ "tdnn_kernel": [
105
+ 5,
106
+ 3,
107
+ 3,
108
+ 1,
109
+ 1
110
+ ],
111
+ "torch_dtype": "float32",
112
+ "transformers_version": "4.38.1",
113
+ "use_weighted_layer_sum": false,
114
+ "vocab_size": 34,
115
+ "xvector_output_dim": 512
116
+ }
language_model/5gram.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b41c24c63f2f0585bea83666369593f3b3e6d047f327a90f36ebca2c35ef0ff
3
+ size 4243671427
language_model/attrs.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"alpha": 0.5, "beta": 0.1, "unk_score_offset": -10.0, "score_boundary": true}
language_model/unigrams.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac3e71ca49838ca355df6fdcb8d89344a5a9bf9e1a76587cdf5df1367c19b9a9
3
+ size 16759269
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6f2cb9759090ff3e4f9ed9a8800e2008d2c3ca13063af3457dea658c88a0b1a
3
+ size 1261946880
preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "processor_class": "Wav2Vec2ProcessorWithLM",
8
+ "return_attention_mask": true,
9
+ "sampling_rate": 16000
10
+ }
runs/May30_23-24-24_idun-04-09/events.out.tfevents.1717105991.idun-04-09.1310150.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cae4692eb12ce2fbd667289bc0540c92aef553e30292144ef9422b9238307e6
3
+ size 75361
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "eos_token": "</s>",
4
+ "pad_token": "[PAD]",
5
+ "unk_token": "[UNK]"
6
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "30": {
4
+ "content": "[UNK]",
5
+ "lstrip": true,
6
+ "normalized": false,
7
+ "rstrip": true,
8
+ "single_word": false,
9
+ "special": false
10
+ },
11
+ "31": {
12
+ "content": "[PAD]",
13
+ "lstrip": true,
14
+ "normalized": false,
15
+ "rstrip": true,
16
+ "single_word": false,
17
+ "special": false
18
+ },
19
+ "32": {
20
+ "content": "<s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "33": {
28
+ "content": "</s>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ }
35
+ },
36
+ "bos_token": "<s>",
37
+ "clean_up_tokenization_spaces": true,
38
+ "do_lower_case": false,
39
+ "eos_token": "</s>",
40
+ "model_max_length": 1000000000000000019884624838656,
41
+ "pad_token": "[PAD]",
42
+ "replace_word_delimiter_char": " ",
43
+ "target_lang": null,
44
+ "tokenizer_class": "Wav2Vec2CTCTokenizer",
45
+ "unk_token": "[UNK]",
46
+ "word_delimiter_token": "|"
47
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:350225cd13eaea5c53facdfd0bf5c84ee772638ee245537f79787ad7224840fa
3
+ size 4984
vocab.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "[PAD]": 31,
3
+ "[UNK]": 30,
4
+ "a": 1,
5
+ "b": 2,
6
+ "c": 3,
7
+ "d": 4,
8
+ "e": 5,
9
+ "f": 6,
10
+ "g": 7,
11
+ "h": 8,
12
+ "i": 9,
13
+ "j": 10,
14
+ "k": 11,
15
+ "l": 12,
16
+ "m": 13,
17
+ "n": 14,
18
+ "o": 15,
19
+ "p": 16,
20
+ "q": 17,
21
+ "r": 18,
22
+ "s": 19,
23
+ "t": 20,
24
+ "u": 21,
25
+ "v": 22,
26
+ "w": 23,
27
+ "x": 24,
28
+ "y": 25,
29
+ "z": 26,
30
+ "|": 0,
31
+ "å": 27,
32
+ "æ": 28,
33
+ "ø": 29
34
+ }