shpotes commited on
Commit
879f203
1 Parent(s): 2a437db

Training in progress, step 500

Browse files
.gitignore CHANGED
@@ -1,2 +1,3 @@
1
  checkpoint-*/
2
- .venv
 
 
1
  checkpoint-*/
2
+ .venv
3
+ 1B/
README.md DELETED
@@ -1,61 +0,0 @@
1
- ---
2
- language:
3
- - et
4
- license: apache-2.0
5
- tags:
6
- - automatic-speech-recognition
7
- - mozilla-foundation/common_voice_7_0
8
- - generated_from_trainer
9
- datasets:
10
- - common_voice
11
- model-index:
12
- - name: ''
13
- results: []
14
- ---
15
-
16
- <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
- should probably proofread and complete it, then remove this comment. -->
18
-
19
- #
20
-
21
- This model is a fine-tuned version of [facebook/wav2vec2-xls-r-300m](https://huggingface.co/facebook/wav2vec2-xls-r-300m) on the MOZILLA-FOUNDATION/COMMON_VOICE_7_0 - ET dataset.
22
- It achieves the following results on the evaluation set:
23
- - Loss: 4.8300
24
- - Wer: 1.0
25
-
26
- ## Model description
27
-
28
- More information needed
29
-
30
- ## Intended uses & limitations
31
-
32
- More information needed
33
-
34
- ## Training and evaluation data
35
-
36
- More information needed
37
-
38
- ## Training procedure
39
-
40
- ### Training hyperparameters
41
-
42
- The following hyperparameters were used during training:
43
- - learning_rate: 0.0003
44
- - train_batch_size: 8
45
- - eval_batch_size: 16
46
- - seed: 42
47
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
48
- - lr_scheduler_type: linear
49
- - training_steps: 10
50
- - mixed_precision_training: Native AMP
51
-
52
- ### Training results
53
-
54
-
55
-
56
- ### Framework versions
57
-
58
- - Transformers 4.16.0.dev0
59
- - Pytorch 1.10.1+cu102
60
- - Datasets 1.18.1.dev0
61
- - Tokenizers 0.11.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
added_tokens.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"<s>": 37, "</s>": 38}
config.json ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/wav2vec2-xls-r-300m",
3
+ "activation_dropout": 0.0,
4
+ "adapter_kernel_size": 3,
5
+ "adapter_stride": 2,
6
+ "add_adapter": false,
7
+ "apply_spec_augment": true,
8
+ "architectures": [
9
+ "Wav2Vec2ForCTC"
10
+ ],
11
+ "attention_dropout": 0.0,
12
+ "bos_token_id": 1,
13
+ "classifier_proj_size": 256,
14
+ "codevector_dim": 768,
15
+ "contrastive_logits_temperature": 0.1,
16
+ "conv_bias": true,
17
+ "conv_dim": [
18
+ 512,
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512
25
+ ],
26
+ "conv_kernel": [
27
+ 10,
28
+ 3,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 2,
33
+ 2
34
+ ],
35
+ "conv_stride": [
36
+ 5,
37
+ 2,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2
43
+ ],
44
+ "ctc_loss_reduction": "mean",
45
+ "ctc_zero_infinity": false,
46
+ "diversity_loss_weight": 0.1,
47
+ "do_stable_layer_norm": true,
48
+ "eos_token_id": 2,
49
+ "feat_extract_activation": "gelu",
50
+ "feat_extract_dropout": 0.0,
51
+ "feat_extract_norm": "layer",
52
+ "feat_proj_dropout": 0.1,
53
+ "feat_quantizer_dropout": 0.0,
54
+ "final_dropout": 0.0,
55
+ "hidden_act": "gelu",
56
+ "hidden_dropout": 0.0,
57
+ "hidden_size": 1024,
58
+ "initializer_range": 0.02,
59
+ "intermediate_size": 4096,
60
+ "layer_norm_eps": 1e-05,
61
+ "layerdrop": 0.0,
62
+ "mask_feature_length": 10,
63
+ "mask_feature_min_masks": 0,
64
+ "mask_feature_prob": 0.0,
65
+ "mask_time_length": 10,
66
+ "mask_time_min_masks": 2,
67
+ "mask_time_prob": 0.1,
68
+ "model_type": "wav2vec2",
69
+ "num_adapter_layers": 3,
70
+ "num_attention_heads": 16,
71
+ "num_codevector_groups": 2,
72
+ "num_codevectors_per_group": 320,
73
+ "num_conv_pos_embedding_groups": 16,
74
+ "num_conv_pos_embeddings": 128,
75
+ "num_feat_extract_layers": 7,
76
+ "num_hidden_layers": 24,
77
+ "num_negatives": 100,
78
+ "output_hidden_size": 1024,
79
+ "pad_token_id": 36,
80
+ "proj_codevector_dim": 768,
81
+ "tdnn_dilation": [
82
+ 1,
83
+ 2,
84
+ 3,
85
+ 1,
86
+ 1
87
+ ],
88
+ "tdnn_dim": [
89
+ 512,
90
+ 512,
91
+ 512,
92
+ 512,
93
+ 1500
94
+ ],
95
+ "tdnn_kernel": [
96
+ 5,
97
+ 3,
98
+ 3,
99
+ 1,
100
+ 1
101
+ ],
102
+ "torch_dtype": "float32",
103
+ "transformers_version": "4.16.0.dev0",
104
+ "use_weighted_layer_sum": false,
105
+ "vocab_size": 39,
106
+ "xvector_output_dim": 512
107
+ }
errs ADDED
@@ -0,0 +1,456 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/1 [00:00<?, ?ba/s]
 
1
  0%| | 0/1 [00:00<?, ?ba/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  0%| | 0/6 [00:00<?, ?ba/s]
 
3
  0%| | 0/3 [00:00<?, ?ba/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  0% 0/18000 [00:00<?, ?it/s]
5
  0% 1/18000 [00:17<86:26:02, 17.29s/it]
6
  0% 2/18000 [00:30<75:01:49, 15.01s/it]
7
  0% 3/18000 [00:41<65:24:50, 13.08s/it]
8
  0% 4/18000 [00:50<58:10:48, 11.64s/it]
9
  0% 5/18000 [00:59<52:10:20, 10.44s/it]
10
  0% 6/18000 [01:06<46:21:37, 9.28s/it]
11
  0% 7/18000 [01:12<40:36:25, 8.12s/it]
12
  0% 8/18000 [01:16<34:47:36, 6.96s/it]
13
  0% 9/18000 [01:33<50:28:39, 10.10s/it]
14
  0% 10/18000 [01:46<54:51:39, 10.98s/it]
15
  0% 11/18000 [01:57<54:52:13, 10.98s/it]
16
  0% 12/18000 [02:07<52:52:40, 10.58s/it]
17
  0% 13/18000 [02:15<49:41:21, 9.95s/it]
18
  0% 14/18000 [02:22<45:26:54, 9.10s/it]
19
  0% 15/18000 [02:28<40:51:40, 8.18s/it]
20
  0% 16/18000 [02:33<35:21:44, 7.08s/it]
21
  0% 17/18000 [02:49<49:42:15, 9.95s/it]
22
  0% 18/18000 [03:03<55:21:19, 11.08s/it]
23
  0% 19/18000 [03:14<55:04:47, 11.03s/it]
24
  0% 20/18000 [03:23<52:40:52, 10.55s/it]
25
  0% 21/18000 [03:32<49:32:32, 9.92s/it]
26
  0% 22/18000 [03:39<45:11:01, 9.05s/it]
27
  0% 23/18000 [03:45<40:31:29, 8.12s/it]
28
  0% 24/18000 [03:50<35:20:48, 7.08s/it]
29
  0% 25/18000 [04:06<49:22:23, 9.89s/it]
30
  0% 26/18000 [04:19<54:38:50, 10.95s/it]
31
  0% 27/18000 [04:30<54:41:00, 10.95s/it]
32
  0% 28/18000 [04:40<52:18:06, 10.48s/it]
33
  0% 29/18000 [04:48<49:00:52, 9.82s/it]
34
  0% 30/18000 [04:55<45:04:29, 9.03s/it]
35
  0% 31/18000 [05:01<40:27:51, 8.11s/it]
36
  0% 32/18000 [05:06<35:02:45, 7.02s/it]
37
  0% 33/18000 [05:20<46:37:19, 9.34s/it]
38
  0% 34/18000 [05:30<47:26:00, 9.50s/it]
39
  0% 35/18000 [05:37<43:56:15, 8.80s/it]
40
  0% 36/18000 [05:41<35:44:20, 7.16s/it]
41
  0% 37/18000 [05:57<49:56:45, 10.01s/it]
42
  0% 38/18000 [06:10<54:30:48, 10.93s/it]
43
  0% 39/18000 [06:21<54:14:33, 10.87s/it]
44
  0% 40/18000 [06:31<52:09:33, 10.46s/it]
45
  0% 41/18000 [06:39<49:11:45, 9.86s/it]
46
  0% 42/18000 [06:46<45:07:06, 9.04s/it]
47
  0% 43/18000 [06:52<40:22:51, 8.10s/it]
48
  0% 44/18000 [06:57<35:07:39, 7.04s/it]
49
  0% 45/18000 [07:13<48:38:37, 9.75s/it]
50
  0% 46/18000 [07:26<53:56:40, 10.82s/it]
51
  0% 47/18000 [07:37<53:51:56, 10.80s/it]
52
  0% 48/18000 [07:46<51:52:52, 10.40s/it]
53
  0% 49/18000 [07:55<48:44:50, 9.78s/it]
54
  0% 50/18000 [08:02<44:52:04, 9.00s/it]
55
  0% 51/18000 [08:08<40:35:01, 8.14s/it]
56
  0% 52/18000 [08:13<35:13:14, 7.06s/it]
57
  0% 53/18000 [08:29<49:34:56, 9.95s/it]
58
  0% 54/18000 [08:43<54:54:51, 11.02s/it]
59
  0% 55/18000 [08:54<54:39:48, 10.97s/it]
60
  0% 56/18000 [09:03<51:47:45, 10.39s/it]
61
  0% 57/18000 [09:11<48:30:24, 9.73s/it]
62
  0% 58/18000 [09:18<44:04:17, 8.84s/it]
63
  0% 59/18000 [09:23<39:07:38, 7.85s/it]
64
  0% 60/18000 [09:28<33:56:38, 6.81s/it]
65
  0% 61/18000 [09:44<48:31:20, 9.74s/it]
66
  0% 62/18000 [09:58<54:20:24, 10.91s/it]
67
  0% 63/18000 [10:09<54:07:29, 10.86s/it]
68
  0% 64/18000 [10:18<52:41:53, 10.58s/it]
69
  0% 65/18000 [10:27<49:44:17, 9.98s/it]
70
  0% 66/18000 [10:34<45:08:18, 9.06s/it]
71
  0% 67/18000 [10:40<40:27:18, 8.12s/it]
72
  0% 68/18000 [10:44<35:05:04, 7.04s/it]
73
  0% 69/18000 [11:00<47:40:09, 9.57s/it]
74
  0% 70/18000 [11:10<48:34:46, 9.75s/it]
75
  0% 71/18000 [11:17<44:54:05, 9.02s/it]
76
  0% 72/18000 [11:21<36:10:47, 7.27s/it]
77
  0% 73/18000 [11:37<50:11:00, 10.08s/it]
78
  0% 74/18000 [11:50<54:44:05, 10.99s/it]
79
  0% 75/18000 [12:01<54:03:33, 10.86s/it]
80
  0% 76/18000 [12:10<51:30:17, 10.34s/it]
81
  0% 77/18000 [12:18<48:16:12, 9.70s/it]
82
  0% 78/18000 [12:25<44:02:08, 8.85s/it]
83
  0% 79/18000 [12:31<39:24:36, 7.92s/it]
84
  0% 80/18000 [12:35<34:06:06, 6.85s/it]
85
  0% 81/18000 [12:52<48:23:03, 9.72s/it]
86
  0% 82/18000 [13:05<54:09:04, 10.88s/it]
87
  0% 83/18000 [13:16<54:31:03, 10.95s/it]
88
  0% 84/18000 [13:26<52:35:45, 10.57s/it]
89
  0% 85/18000 [13:34<49:34:08, 9.96s/it]
90
  0% 86/18000 [13:42<45:29:05, 9.14s/it]
91
  0% 87/18000 [13:48<40:44:29, 8.19s/it]
92
  0% 88/18000 [13:52<35:22:46, 7.11s/it]
93
  0% 89/18000 [14:09<49:08:37, 9.88s/it]
94
  0% 90/18000 [14:22<53:55:22, 10.84s/it]
95
  1% 91/18000 [14:33<53:54:12, 10.84s/it]
96
  1% 92/18000 [14:42<51:57:31, 10.45s/it]
97
  1% 93/18000 [14:50<48:11:46, 9.69s/it]
98
  1% 94/18000 [14:57<44:05:28, 8.86s/it]
99
  1% 95/18000 [15:02<39:02:47, 7.85s/it]
100
  1% 96/18000 [15:07<33:46:57, 6.79s/it]
101
  1% 97/18000 [15:23<48:11:08, 9.69s/it]
102
  1% 98/18000 [15:36<53:29:06, 10.76s/it]
103
  1% 99/18000 [15:47<53:25:40, 10.74s/it]
104
  1% 100/18000 [15:57<51:48:37, 10.42s/it]
105
 
106
  1% 100/18000 [15:57<51:48:37, 10.42s/it]
107
  1% 101/18000 [16:05<48:40:04, 9.79s/it]
108
  1% 102/18000 [16:12<44:23:01, 8.93s/it]
109
  1% 103/18000 [16:18<39:26:24, 7.93s/it]
110
  1% 104/18000 [16:22<34:15:20, 6.89s/it]
111
  1% 105/18000 [16:37<46:43:13, 9.40s/it]
112
  1% 106/18000 [16:47<47:23:12, 9.53s/it]
113
  1% 107/18000 [16:54<43:44:40, 8.80s/it]
114
  1% 108/18000 [16:58<35:46:46, 7.20s/it]
115
  1% 109/18000 [17:14<48:43:15, 9.80s/it]
116
  1% 110/18000 [17:27<54:09:47, 10.90s/it]
117
  1% 111/18000 [17:38<54:15:19, 10.92s/it]
118
  1% 112/18000 [17:48<52:17:25, 10.52s/it]
119
  1% 113/18000 [17:56<49:14:31, 9.91s/it]
120
  1% 114/18000 [18:03<45:07:53, 9.08s/it]
121
  1% 115/18000 [18:09<40:13:03, 8.10s/it]
122
  1% 116/18000 [18:13<34:43:29, 6.99s/it]
123
  1% 117/18000 [18:30<48:46:18, 9.82s/it]
124
  1% 118/18000 [18:43<53:31:11, 10.77s/it]
125
  1% 119/18000 [18:53<53:11:36, 10.71s/it]
126
  1% 120/18000 [19:03<50:56:21, 10.26s/it]
127
  1% 121/18000 [19:11<47:23:37, 9.54s/it]
128
  1% 122/18000 [19:17<43:07:59, 8.69s/it]
129
  1% 123/18000 [19:23<38:34:05, 7.77s/it]
130
  1% 124/18000 [19:27<33:23:03, 6.72s/it]
131
  1% 125/18000 [19:43<47:43:04, 9.61s/it]
132
  1% 126/18000 [19:57<53:09:48, 10.71s/it]
133
  1% 127/18000 [20:08<53:19:09, 10.74s/it]
134
  1% 128/18000 [20:17<51:20:03, 10.34s/it]
135
  1% 129/18000 [20:25<48:12:21, 9.71s/it]
136
  1% 130/18000 [20:32<43:58:10, 8.86s/it]
137
  1% 131/18000 [20:38<39:28:05, 7.95s/it]
138
  1% 132/18000 [20:42<34:15:06, 6.90s/it]
139
  1% 133/18000 [20:59<48:28:40, 9.77s/it]
140
  1% 134/18000 [21:12<53:33:44, 10.79s/it]
141
  1% 135/18000 [21:23<53:23:03, 10.76s/it]
142
  1% 136/18000 [21:32<51:19:46, 10.34s/it]
143
  1% 137/18000 [21:40<48:04:44, 9.69s/it]
144
  1% 138/18000 [21:47<43:54:30, 8.85s/it]
145
  1% 139/18000 [21:53<39:05:17, 7.88s/it]
146
  1% 140/18000 [21:57<34:00:50, 6.86s/it]
147
  1% 141/18000 [22:13<46:40:32, 9.41s/it]
148
  1% 142/18000 [22:23<47:51:15, 9.65s/it]
149
  1% 143/18000 [22:30<44:22:27, 8.95s/it]
150
  1% 144/18000 [22:34<36:18:44, 7.32s/it]
151
  1% 145/18000 [22:50<49:56:40, 10.07s/it]
152
  1% 146/18000 [23:03<54:50:33, 11.06s/it]
153
  1% 147/18000 [23:14<54:23:30, 10.97s/it]
154
  1% 148/18000 [23:24<51:53:58, 10.47s/it]
155
  1% 149/18000 [23:32<48:32:27, 9.79s/it]
156
  1% 150/18000 [23:39<44:37:06, 9.00s/it]
157
  1% 151/18000 [23:45<39:56:07, 8.05s/it]
158
  1% 152/18000 [23:49<34:30:40, 6.96s/it]
159
  1% 153/18000 [24:06<48:51:50, 9.86s/it]
160
  1% 154/18000 [24:19<54:08:29, 10.92s/it]
161
  1% 155/18000 [24:30<54:07:19, 10.92s/it]
162
  1% 156/18000 [24:39<51:49:42, 10.46s/it]
163
  1% 157/18000 [24:48<48:49:19, 9.85s/it]
164
  1% 158/18000 [24:55<44:54:15, 9.06s/it]
165
  1% 159/18000 [25:01<40:01:43, 8.08s/it]
166
  1% 160/18000 [25:05<34:36:26, 6.98s/it]
167
  1% 161/18000 [25:22<48:39:48, 9.82s/it]
168
  1% 162/18000 [25:35<53:20:53, 10.77s/it]
169
  1% 163/18000 [25:45<53:02:40, 10.71s/it]
170
  1% 164/18000 [25:55<51:11:53, 10.33s/it]
171
  1% 165/18000 [26:03<48:01:45, 9.69s/it]
172
  1% 166/18000 [26:10<43:51:38, 8.85s/it]
173
  1% 167/18000 [26:16<39:20:09, 7.94s/it]
174
  1% 168/18000 [26:20<34:07:20, 6.89s/it]
175
  1% 169/18000 [26:37<48:26:45, 9.78s/it]
176
  1% 170/18000 [26:50<54:05:34, 10.92s/it]
177
  1% 171/18000 [27:01<54:10:19, 10.94s/it]
178
  1% 172/18000 [27:11<51:47:16, 10.46s/it]
179
  1% 173/18000 [27:19<48:35:45, 9.81s/it]
180
  1% 174/18000 [27:26<44:17:21, 8.94s/it]
181
  1% 175/18000 [27:32<39:40:01, 8.01s/it]
182
  1% 176/18000 [27:36<34:26:47, 6.96s/it]
183
  1% 177/18000 [27:51<46:22:02, 9.37s/it]
184
  1% 178/18000 [28:01<46:54:42, 9.48s/it]
185
  1% 179/18000 [28:08<43:12:54, 8.73s/it]
186
  1% 180/18000 [28:11<34:51:46, 7.04s/it]
187
  1% 181/18000 [28:27<48:41:49, 9.84s/it]
188
  1% 182/18000 [28:41<53:47:06, 10.87s/it]
189
  1% 183/18000 [28:51<53:26:11, 10.80s/it]
190
  1% 184/18000 [29:00<51:13:34, 10.35s/it]
191
  1% 185/18000 [29:08<47:40:37, 9.63s/it]
192
  1% 186/18000 [29:15<43:41:55, 8.83s/it]
193
  1% 187/18000 [29:21<39:02:36, 7.89s/it]
194
  1% 188/18000 [29:25<33:33:56, 6.78s/it]
195
  1% 189/18000 [29:41<46:58:38, 9.50s/it]
196
  1% 190/18000 [29:55<52:50:48, 10.68s/it]
197
  1% 191/18000 [30:05<53:13:50, 10.76s/it]
198
  1% 192/18000 [30:15<51:19:04, 10.37s/it]
199
  1% 193/18000 [30:23<47:46:28, 9.66s/it]
200
  1% 194/18000 [30:30<43:50:18, 8.86s/it]
201
  1% 195/18000 [30:36<39:23:19, 7.96s/it]
202
  1% 196/18000 [30:40<34:17:27, 6.93s/it]
203
  1% 197/18000 [30:57<48:42:25, 9.85s/it]
204
  1% 198/18000 [31:11<54:34:28, 11.04s/it]
205
  1% 199/18000 [31:22<54:40:44, 11.06s/it]
206
  1% 200/18000 [31:32<53:10:28, 10.75s/it]
207
 
208
  1% 200/18000 [31:32<53:10:28, 10.75s/it]
209
  1% 201/18000 [31:40<49:47:14, 10.07s/it]
210
  1% 202/18000 [31:47<45:18:07, 9.16s/it]
211
  1% 203/18000 [31:53<40:20:20, 8.16s/it]
212
  1% 204/18000 [31:58<34:46:55, 7.04s/it]
213
  1% 205/18000 [32:14<48:45:25, 9.86s/it]
214
  1% 206/18000 [32:27<53:32:26, 10.83s/it]
215
  1% 207/18000 [32:38<53:17:02, 10.78s/it]
216
  1% 208/18000 [32:47<51:12:19, 10.36s/it]
217
  1% 209/18000 [32:56<48:09:33, 9.75s/it]
218
  1% 210/18000 [33:03<44:08:23, 8.93s/it]
219
  1% 211/18000 [33:09<39:35:55, 8.01s/it]
220
  1% 212/18000 [33:13<34:23:10, 6.96s/it]
221
  1% 213/18000 [33:28<46:28:43, 9.41s/it]
222
  1% 214/18000 [33:38<46:56:12, 9.50s/it]
223
  1% 215/18000 [33:45<43:27:58, 8.80s/it]
224
  1% 216/18000 [33:48<35:04:07, 7.10s/it]
225
  1% 217/18000 [34:04<48:42:58, 9.86s/it]
226
  1% 218/18000 [34:18<53:32:18, 10.84s/it]
227
  1% 219/18000 [34:28<53:14:19, 10.78s/it]
228
  1% 220/18000 [34:38<51:06:07, 10.35s/it]
229
  1% 221/18000 [34:46<47:42:29, 9.66s/it]
230
  1% 222/18000 [34:52<43:16:38, 8.76s/it]
231
  1% 223/18000 [34:58<38:47:18, 7.85s/it]
232
  1% 224/18000 [35:02<33:35:15, 6.80s/it]
233
  1% 225/18000 [35:18<46:55:15, 9.50s/it]
234
  1% 226/18000 [35:32<52:36:24, 10.66s/it]
235
  1% 227/18000 [35:42<52:47:45, 10.69s/it]
236
  1% 228/18000 [35:52<50:52:21, 10.31s/it]
237
  1% 229/18000 [36:00<48:08:38, 9.75s/it]
238
  1% 230/18000 [36:07<44:14:44, 8.96s/it]
239
  1% 231/18000 [36:13<39:37:28, 8.03s/it]
240
  1% 232/18000 [36:18<34:13:31, 6.93s/it]
241
  1% 233/18000 [36:34<48:28:27, 9.82s/it]
242
  1% 234/18000 [36:48<53:55:28, 10.93s/it]
243
  1% 235/18000 [36:59<54:07:48, 10.97s/it]
244
  1% 236/18000 [37:08<52:09:20, 10.57s/it]
245
  1% 237/18000 [37:17<48:42:27, 9.87s/it]
246
  1% 238/18000 [37:23<44:21:14, 8.99s/it]
247
  1% 239/18000 [37:29<39:44:51, 8.06s/it]
248
  1% 240/18000 [37:34<34:23:30, 6.97s/it]
249
  1% 241/18000 [37:50<48:42:06, 9.87s/it]
250
  1% 242/18000 [38:03<53:25:27, 10.83s/it]
251
  1% 243/18000 [38:14<52:55:48, 10.73s/it]
252
  1% 244/18000 [38:23<50:37:01, 10.26s/it]
253
  1% 245/18000 [38:31<47:27:12, 9.62s/it]
254
  1% 246/18000 [38:38<43:25:26, 8.81s/it]
255
  1% 247/18000 [38:44<39:01:44, 7.91s/it]
256
  1% 248/18000 [38:48<33:54:20, 6.88s/it]
257
  1% 249/18000 [39:04<46:20:55, 9.40s/it]
258
  1% 250/18000 [39:14<47:17:59, 9.59s/it]
259
  1% 251/18000 [39:21<43:48:05, 8.88s/it]
260
  1% 252/18000 [39:24<35:17:51, 7.16s/it]
261
  1% 253/18000 [39:41<49:42:54, 10.08s/it]
262
  1% 254/18000 [39:55<54:40:20, 11.09s/it]
263
  1% 255/18000 [40:05<54:05:56, 10.98s/it]
264
  1% 256/18000 [40:15<51:41:45, 10.49s/it]
265
  1% 257/18000 [40:23<48:34:31, 9.86s/it]
266
  1% 258/18000 [40:30<44:23:42, 9.01s/it]
267
  1% 259/18000 [40:36<39:40:19, 8.05s/it]
268
  1% 260/18000 [40:40<34:13:42, 6.95s/it]
269
  1% 261/18000 [40:57<48:18:11, 9.80s/it]
270
  1% 262/18000 [41:10<53:34:01, 10.87s/it]
271
  1% 263/18000 [41:21<53:19:57, 10.82s/it]
272
  1% 264/18000 [41:30<50:44:07, 10.30s/it]
273
  1% 265/18000 [41:38<47:15:09, 9.59s/it]
274
  1% 266/18000 [41:44<43:02:02, 8.74s/it]
275
  1% 267/18000 [41:50<38:41:55, 7.86s/it]
276
  1% 268/18000 [41:55<33:41:12, 6.84s/it]
277
  1% 269/18000 [42:11<47:53:19, 9.72s/it]
278
  2% 270/18000 [42:24<53:01:13, 10.77s/it]
279
  2% 271/18000 [42:35<53:02:40, 10.77s/it]
280
  2% 272/18000 [42:45<51:00:00, 10.36s/it]
281
  2% 273/18000 [42:53<48:01:13, 9.75s/it]
282
  2% 274/18000 [43:00<44:05:26, 8.95s/it]
283
  2% 275/18000 [43:06<39:29:31, 8.02s/it]
284
  2% 276/18000 [43:10<34:20:22, 6.97s/it]
285
  2% 277/18000 [43:27<48:36:20, 9.87s/it]
286
  2% 278/18000 [43:41<54:13:56, 11.02s/it]
287
  2% 279/18000 [43:52<54:12:18, 11.01s/it]
288
  2% 280/18000 [44:01<51:45:06, 10.51s/it]
289
  2% 281/18000 [44:10<48:47:06, 9.91s/it]
290
  2% 282/18000 [44:16<44:16:39, 9.00s/it]
291
  2% 283/18000 [44:22<39:08:42, 7.95s/it]
292
  2% 284/18000 [44:26<33:59:45, 6.91s/it]
293
  2% 285/18000 [44:42<46:30:46, 9.45s/it]
294
  2% 286/18000 [44:52<47:30:24, 9.65s/it]
295
  2% 287/18000 [44:59<43:54:19, 8.92s/it]
296
  2% 288/18000 [45:03<35:52:00, 7.29s/it]
297
  2% 289/18000 [45:19<49:57:55, 10.16s/it]
298
  2% 290/18000 [45:33<54:54:58, 11.16s/it]
299
  2% 291/18000 [45:44<54:40:30, 11.11s/it]
300
  2% 292/18000 [45:54<52:24:02, 10.65s/it]
301
  2% 293/18000 [46:02<48:53:00, 9.94s/it]
302
  2% 294/18000 [46:09<44:31:18, 9.05s/it]
303
  2% 295/18000 [46:15<39:58:45, 8.13s/it]
304
  2% 296/18000 [46:19<34:41:14, 7.05s/it]
305
  2% 297/18000 [46:36<48:25:58, 9.85s/it]
306
  2% 298/18000 [46:49<53:21:33, 10.85s/it]
307
  2% 299/18000 [47:00<53:00:52, 10.78s/it]
308
  2% 300/18000 [47:09<51:02:08, 10.38s/it]
309
 
310
  2% 300/18000 [47:09<51:02:08, 10.38s/it]
311
  2% 301/18000 [47:17<47:51:13, 9.73s/it]
312
  2% 302/18000 [47:24<43:43:29, 8.89s/it]
313
  2% 303/18000 [47:30<39:03:22, 7.94s/it]
314
  2% 304/18000 [47:34<33:47:15, 6.87s/it]
315
  2% 305/18000 [47:51<47:55:18, 9.75s/it]
316
  2% 306/18000 [48:04<52:59:15, 10.78s/it]
317
  2% 307/18000 [48:15<52:51:07, 10.75s/it]
318
  2% 308/18000 [48:24<50:25:56, 10.26s/it]
319
  2% 309/18000 [48:32<47:33:47, 9.68s/it]
320
  2% 310/18000 [48:39<43:29:15, 8.85s/it]
321
  2% 311/18000 [48:45<38:43:45, 7.88s/it]
322
  2% 312/18000 [48:49<33:28:13, 6.81s/it]
323
  2% 313/18000 [49:05<47:37:14, 9.69s/it]
324
  2% 314/18000 [49:19<53:06:18, 10.81s/it]
325
  2% 315/18000 [49:29<52:32:02, 10.69s/it]
326
  2% 316/18000 [49:39<50:37:01, 10.30s/it]
327
  2% 317/18000 [49:47<47:35:40, 9.69s/it]
328
  2% 318/18000 [49:54<43:33:20, 8.87s/it]
329
  2% 319/18000 [50:00<39:14:50, 7.99s/it]
330
  2% 320/18000 [50:04<34:09:36, 6.96s/it]
331
  2% 321/18000 [50:19<46:07:44, 9.39s/it]
332
  2% 322/18000 [50:29<47:04:05, 9.59s/it]
333
  2% 323/18000 [50:37<43:38:37, 8.89s/it]
334
  2% 324/18000 [50:40<35:28:44, 7.23s/it]
335
  2% 325/18000 [50:56<49:06:27, 10.00s/it]
336
  2% 326/18000 [51:10<53:47:16, 10.96s/it]
337
  2% 327/18000 [51:20<53:23:03, 10.87s/it]
338
  2% 328/18000 [51:30<51:14:24, 10.44s/it]
339
  2% 329/18000 [51:38<48:08:52, 9.81s/it]
340
  2% 330/18000 [51:45<44:04:02, 8.98s/it]
341
  2% 331/18000 [51:51<39:27:52, 8.04s/it]
342
  2% 332/18000 [51:55<34:01:15, 6.93s/it]
343
  2% 333/18000 [52:12<47:55:08, 9.76s/it]
344
  2% 334/18000 [52:25<52:58:37, 10.80s/it]
345
  2% 335/18000 [52:36<53:03:41, 10.81s/it]
346
  2% 336/18000 [52:45<51:22:12, 10.47s/it]
347
  2% 337/18000 [52:54<48:17:41, 9.84s/it]
348
  2% 338/18000 [53:01<44:04:01, 8.98s/it]
349
  2% 339/18000 [53:06<39:19:19, 8.02s/it]
350
  2% 340/18000 [53:11<33:59:49, 6.93s/it]
351
  2% 341/18000 [53:28<48:17:19, 9.84s/it]
352
  2% 342/18000 [53:40<52:48:55, 10.77s/it]
353
  2% 343/18000 [53:51<52:45:57, 10.76s/it]
354
  2% 344/18000 [54:00<50:32:06, 10.30s/it]
355
  2% 345/18000 [54:09<47:20:31, 9.65s/it]
356
  2% 346/18000 [54:15<43:17:34, 8.83s/it]
357
  2% 347/18000 [54:21<38:41:00, 7.89s/it]
358
  2% 348/18000 [54:25<33:24:17, 6.81s/it]
359
  2% 349/18000 [54:42<47:36:12, 9.71s/it]
360
  2% 350/18000 [54:55<52:56:31, 10.80s/it]
361
  2% 351/18000 [55:05<52:05:17, 10.62s/it]
362
  2% 352/18000 [55:15<49:57:37, 10.19s/it]
363
  2% 353/18000 [55:23<46:53:40, 9.57s/it]
364
  2% 354/18000 [55:30<42:56:28, 8.76s/it]
365
  2% 355/18000 [55:35<38:35:32, 7.87s/it]
366
  2% 356/18000 [55:40<33:34:24, 6.85s/it]
367
  2% 357/18000 [55:55<46:02:43, 9.40s/it]
368
  2% 358/18000 [56:05<47:14:04, 9.64s/it]
369
  2% 359/18000 [56:13<43:54:21, 8.96s/it]
370
  2% 360/18000 [56:16<35:44:58, 7.30s/it]
371
  2% 361/18000 [56:33<49:37:45, 10.13s/it]
372
  2% 362/18000 [56:46<54:18:29, 11.08s/it]
373
  2% 363/18000 [56:57<53:18:49, 10.88s/it]
374
  2% 364/18000 [57:06<50:43:27, 10.35s/it]
375
  2% 365/18000 [57:14<47:50:00, 9.76s/it]
376
  2% 366/18000 [57:21<43:42:30, 8.92s/it]
377
  2% 367/18000 [57:27<38:47:25, 7.92s/it]
378
  2% 368/18000 [57:31<33:26:40, 6.83s/it]
379
  2% 369/18000 [57:47<47:20:50, 9.67s/it]
380
  2% 370/18000 [58:01<52:33:21, 10.73s/it]
381
  2% 371/18000 [58:11<52:40:27, 10.76s/it]
382
  2% 372/18000 [58:21<50:37:46, 10.34s/it]
383
  2% 373/18000 [58:29<47:13:33, 9.65s/it]
384
  2% 374/18000 [58:36<43:15:43, 8.84s/it]
385
  2% 375/18000 [58:41<38:46:26, 7.92s/it]
386
  2% 376/18000 [58:46<33:49:26, 6.91s/it]
387
  2% 377/18000 [59:03<47:58:02, 9.80s/it]
388
  2% 378/18000 [59:16<53:14:23, 10.88s/it]
389
  2% 379/18000 [59:27<53:21:26, 10.90s/it]
390
  2% 380/18000 [59:37<51:32:24, 10.53s/it]
391
  2% 381/18000 [59:45<48:23:16, 9.89s/it]
392
  2% 382/18000 [59:52<44:25:48, 9.08s/it]
393
  2% 383/18000 [59:58<39:54:39, 8.16s/it]
394
  2% 384/18000 [1:00:03<34:22:55, 7.03s/it]
395
  2% 385/18000 [1:00:19<48:14:08, 9.86s/it]
396
  2% 386/18000 [1:00:32<53:13:30, 10.88s/it]
397
  2% 387/18000 [1:00:43<52:53:09, 10.81s/it]
398
  2% 388/18000 [1:00:52<50:27:17, 10.31s/it]
399
  2% 389/18000 [1:01:00<47:11:15, 9.65s/it]
400
  2% 390/18000 [1:01:07<43:01:58, 8.80s/it]
401
  2% 391/18000 [1:01:13<38:27:51, 7.86s/it]
402
  2% 392/18000 [1:01:17<33:21:31, 6.82s/it]
403
  2% 393/18000 [1:01:32<44:31:41, 9.10s/it]
404
  2% 394/18000 [1:01:41<45:48:47, 9.37s/it]
405
  2% 395/18000 [1:01:49<42:48:03, 8.75s/it]
406
  2% 396/18000 [1:01:52<34:58:38, 7.15s/it]
407
  2% 397/18000 [1:02:09<48:50:53, 9.99s/it]
408
  2% 398/18000 [1:02:22<53:43:53, 10.99s/it]
409
  2% 399/18000 [1:02:33<53:20:56, 10.91s/it]
410
  2% 400/18000 [1:02:42<51:16:29, 10.49s/it]
411
 
412
  2% 400/18000 [1:02:42<51:16:29, 10.49s/it]
413
  2% 401/18000 [1:02:51<48:04:04, 9.83s/it]
414
  2% 402/18000 [1:02:58<43:47:40, 8.96s/it]
415
  2% 403/18000 [1:03:03<39:11:36, 8.02s/it]
416
  2% 404/18000 [1:03:08<33:59:02, 6.95s/it]
417
  2% 405/18000 [1:03:24<47:36:15, 9.74s/it]
418
  2% 406/18000 [1:03:37<52:47:43, 10.80s/it]
419
  2% 407/18000 [1:03:48<52:48:26, 10.81s/it]
420
  2% 408/18000 [1:03:58<50:44:50, 10.38s/it]
421
  2% 409/18000 [1:04:06<47:49:35, 9.79s/it]
422
  2% 410/18000 [1:04:13<43:57:02, 9.00s/it]
423
  2% 411/18000 [1:04:19<39:21:08, 8.05s/it]
424
  2% 412/18000 [1:04:23<33:57:31, 6.95s/it]
425
  2% 413/18000 [1:04:40<47:43:17, 9.77s/it]
426
  2% 414/18000 [1:04:53<53:05:33, 10.87s/it]
427
  2% 415/18000 [1:05:04<53:03:39, 10.86s/it]
428
  2% 416/18000 [1:05:14<51:10:13, 10.48s/it]
429
  2% 417/18000 [1:05:22<47:58:19, 9.82s/it]
430
  2% 418/18000 [1:05:29<43:46:49, 8.96s/it]
431
  2% 419/18000 [1:05:35<39:10:03, 8.02s/it]
432
  2% 420/18000 [1:05:39<33:58:45, 6.96s/it]
433
  2% 421/18000 [1:05:56<48:16:48, 9.89s/it]
434
  2% 422/18000 [1:06:09<53:30:55, 10.96s/it]
435
  2% 423/18000 [1:06:20<53:13:22, 10.90s/it]
436
  2% 424/18000 [1:06:29<50:26:10, 10.33s/it]
437
  2% 425/18000 [1:06:37<47:08:56, 9.66s/it]
438
  2% 426/18000 [1:06:44<43:19:15, 8.87s/it]
439
  2% 427/18000 [1:06:50<38:33:18, 7.90s/it]
440
  2% 428/18000 [1:06:54<33:33:27, 6.88s/it]
441
  2% 429/18000 [1:07:09<44:43:15, 9.16s/it]
442
  2% 430/18000 [1:07:19<46:00:07, 9.43s/it]
443
  2% 431/18000 [1:07:26<43:11:33, 8.85s/it]
444
  2% 432/18000 [1:07:30<34:56:30, 7.16s/it]
445
  2% 433/18000 [1:07:46<48:49:24, 10.01s/it]
446
  2% 434/18000 [1:08:00<53:38:05, 10.99s/it]
447
  2% 435/18000 [1:08:10<53:09:03, 10.89s/it]
448
  2% 436/18000 [1:08:19<50:38:26, 10.38s/it]
449
  2% 437/18000 [1:08:27<47:14:39, 9.68s/it]
450
  2% 438/18000 [1:08:34<42:52:00, 8.79s/it]
451
  2% 439/18000 [1:08:40<38:20:18, 7.86s/it]
452
  2% 440/18000 [1:08:44<33:10:31, 6.80s/it]
453
  2% 441/18000 [1:09:01<47:29:55, 9.74s/it]
454
  2% 442/18000 [1:09:14<52:47:34, 10.82s/it]
455
  2% 443/18000 [1:09:25<52:43:24, 10.81s/it]
456
  2% 444/18000 [1:09:34<50:46:19, 10.41s/it]
457
  2% 445/18000 [1:09:43<47:42:44, 9.78s/it]
458
  2% 446/18000 [1:09:50<43:40:10, 8.96s/it]
459
  2% 447/18000 [1:09:56<39:20:53, 8.07s/it]
460
  2% 448/18000 [1:10:00<34:14:21, 7.02s/it]
461
  2% 449/18000 [1:10:17<48:02:46, 9.86s/it]
462
  2% 450/18000 [1:10:30<53:38:52, 11.00s/it]
463
  3% 451/18000 [1:10:41<53:33:23, 10.99s/it]
464
  3% 452/18000 [1:10:51<51:28:10, 10.56s/it]
465
  3% 453/18000 [1:10:59<47:59:20, 9.85s/it]
466
  3% 454/18000 [1:11:06<43:39:42, 8.96s/it]
467
  3% 455/18000 [1:11:12<39:03:03, 8.01s/it]
468
  3% 456/18000 [1:11:16<33:48:03, 6.94s/it]
469
  3% 457/18000 [1:11:33<47:28:06, 9.74s/it]
470
  3% 458/18000 [1:11:46<52:13:26, 10.72s/it]
471
  3% 459/18000 [1:11:56<52:11:58, 10.71s/it]
472
  3% 460/18000 [1:12:06<50:26:50, 10.35s/it]
473
  3% 461/18000 [1:12:14<47:11:11, 9.69s/it]
474
  3% 462/18000 [1:12:21<43:22:01, 8.90s/it]
475
  3% 463/18000 [1:12:27<38:48:08, 7.97s/it]
476
  3% 464/18000 [1:12:31<33:40:40, 6.91s/it]
477
  3% 465/18000 [1:12:46<45:41:28, 9.38s/it]
478
  3% 466/18000 [1:12:56<46:32:41, 9.56s/it]
479
  3% 467/18000 [1:13:03<43:03:28, 8.84s/it]
480
  3% 468/18000 [1:13:07<34:43:53, 7.13s/it]
481
  3% 469/18000 [1:13:23<48:48:43, 10.02s/it]
482
  3% 470/18000 [1:13:37<54:05:41, 11.11s/it]
483
  3% 471/18000 [1:13:48<53:57:52, 11.08s/it]
484
  3% 472/18000 [1:13:58<51:57:14, 10.67s/it]
485
  3% 473/18000 [1:14:06<48:17:17, 9.92s/it]
486
  3% 474/18000 [1:14:13<44:14:22, 9.09s/it]
487
  3% 475/18000 [1:14:19<39:36:15, 8.14s/it]
488
  3% 476/18000 [1:14:24<34:21:02, 7.06s/it]
489
  3% 477/18000 [1:14:40<47:52:39, 9.84s/it]
490
  3% 478/18000 [1:14:53<52:38:58, 10.82s/it]
491
  3% 479/18000 [1:15:04<52:32:09, 10.79s/it]
492
  3% 480/18000 [1:15:13<50:33:14, 10.39s/it]
493
  3% 481/18000 [1:15:22<47:38:56, 9.79s/it]
494
  3% 482/18000 [1:15:28<43:19:51, 8.90s/it]
495
  3% 483/18000 [1:15:34<38:46:14, 7.97s/it]
496
  3% 484/18000 [1:15:39<33:35:21, 6.90s/it]
497
  3% 485/18000 [1:15:55<47:26:03, 9.75s/it]
498
  3% 486/18000 [1:16:08<52:32:49, 10.80s/it]
499
  3% 487/18000 [1:16:19<52:38:09, 10.82s/it]
500
  3% 488/18000 [1:16:28<50:31:07, 10.39s/it]
501
  3% 489/18000 [1:16:37<47:24:15, 9.75s/it]
502
  3% 490/18000 [1:16:44<43:32:47, 8.95s/it]
503
  3% 491/18000 [1:16:50<39:21:30, 8.09s/it]
504
  3% 492/18000 [1:16:54<34:02:14, 7.00s/it]
505
  3% 493/18000 [1:17:11<48:38:09, 10.00s/it]
506
  3% 494/18000 [1:17:25<53:24:35, 10.98s/it]
507
  3% 495/18000 [1:17:35<52:53:14, 10.88s/it]
508
  3% 496/18000 [1:17:45<50:41:49, 10.43s/it]
509
  3% 497/18000 [1:17:53<47:21:35, 9.74s/it]
510
  3% 498/18000 [1:18:00<43:18:58, 8.91s/it]
511
  3% 499/18000 [1:18:05<38:28:50, 7.92s/it]
512
  3% 500/18000 [1:18:10<33:36:35, 6.91s/it]
513
 
514
  3% 500/18000 [1:18:10<33:36:35, 6.91s/it]The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
 
 
 
 
 
515
  0% 0/33 [00:00<?, ?it/s]
 
516
  6% 2/33 [00:04<01:10, 2.26s/it]
 
517
  9% 3/33 [00:08<01:33, 3.13s/it]
 
518
  12% 4/33 [00:12<01:39, 3.44s/it]
 
519
  15% 5/33 [00:16<01:42, 3.64s/it]
 
520
  18% 6/33 [00:20<01:42, 3.79s/it]
 
521
  21% 7/33 [00:24<01:38, 3.80s/it]
 
522
  24% 8/33 [00:28<01:36, 3.85s/it]
 
523
  27% 9/33 [00:32<01:33, 3.88s/it]
 
524
  30% 10/33 [00:37<01:33, 4.07s/it]
 
525
  33% 11/33 [00:41<01:29, 4.06s/it]
 
526
  36% 12/33 [00:45<01:24, 4.04s/it]
 
527
  39% 13/33 [00:49<01:19, 3.98s/it]
 
528
  42% 14/33 [00:53<01:16, 4.03s/it]
 
529
  45% 15/33 [00:57<01:12, 4.04s/it]
 
530
  48% 16/33 [01:01<01:10, 4.17s/it]
 
531
  52% 17/33 [01:06<01:09, 4.32s/it]
 
532
  55% 18/33 [01:10<01:03, 4.24s/it]
 
533
  58% 19/33 [01:14<00:59, 4.24s/it]
 
534
  61% 20/33 [01:19<00:55, 4.31s/it]
 
535
  64% 21/33 [01:23<00:52, 4.34s/it]
 
536
  67% 22/33 [01:27<00:47, 4.33s/it]
 
537
  70% 23/33 [01:32<00:43, 4.38s/it]
 
538
  73% 24/33 [01:36<00:39, 4.39s/it]
 
539
  76% 25/33 [01:41<00:35, 4.42s/it]
 
540
  79% 26/33 [01:45<00:30, 4.37s/it]
 
541
  82% 27/33 [01:49<00:25, 4.31s/it]
 
542
  85% 28/33 [01:54<00:21, 4.34s/it]
 
543
  88% 29/33 [01:57<00:16, 4.09s/it]
 
544
  91% 30/33 [02:00<00:11, 3.70s/it]
 
545
  94% 31/33 [02:03<00:06, 3.40s/it]
 
546
  97% 32/33 [02:05<00:03, 3.18s/it]
 
 
547
 
548
 
 
549
  3% 500/18000 [1:20:23<33:36:35, 6.91s/it]
 
550
  Saving model checkpoint to ./checkpoint-500
 
 
 
 
 
1
+
2
+
3
+
4
+ loading configuration file https://huggingface.co/facebook/wav2vec2-xls-r-300m/resolve/main/config.json from cache at /home/sagrilaft/.cache/huggingface/transformers/dabc27df63e37bd2a7a221c7774e35f36a280fbdf917cf54cadfc7df8c786f6f.a3e4c3c967d9985881e0ae550a5f6f668f897db5ab2e0802f9b97973b15970e6
5
+ Model config Wav2Vec2Config {
6
+ "_name_or_path": "facebook/wav2vec2-xls-r-300m",
7
+ "activation_dropout": 0.0,
8
+ "adapter_kernel_size": 3,
9
+ "adapter_stride": 2,
10
+ "add_adapter": false,
11
+ "apply_spec_augment": true,
12
+ "architectures": [
13
+ "Wav2Vec2ForPreTraining"
14
+ ],
15
+ "attention_dropout": 0.1,
16
+ "bos_token_id": 1,
17
+ "classifier_proj_size": 256,
18
+ "codevector_dim": 768,
19
+ "contrastive_logits_temperature": 0.1,
20
+ "conv_bias": true,
21
+ "conv_dim": [
22
+ 512,
23
+ 512,
24
+ 512,
25
+ 512,
26
+ 512,
27
+ 512,
28
+ 512
29
+ ],
30
+ "conv_kernel": [
31
+ 10,
32
+ 3,
33
+ 3,
34
+ 3,
35
+ 3,
36
+ 2,
37
+ 2
38
+ ],
39
+ "conv_stride": [
40
+ 5,
41
+ 2,
42
+ 2,
43
+ 2,
44
+ 2,
45
+ 2,
46
+ 2
47
+ ],
48
+ "ctc_loss_reduction": "sum",
49
+ "ctc_zero_infinity": false,
50
+ "diversity_loss_weight": 0.1,
51
+ "do_stable_layer_norm": true,
52
+ "eos_token_id": 2,
53
+ "feat_extract_activation": "gelu",
54
+ "feat_extract_dropout": 0.0,
55
+ "feat_extract_norm": "layer",
56
+ "feat_proj_dropout": 0.1,
57
+ "feat_quantizer_dropout": 0.0,
58
+ "final_dropout": 0.0,
59
+ "gradient_checkpointing": false,
60
+ "hidden_act": "gelu",
61
+ "hidden_dropout": 0.1,
62
+ "hidden_size": 1024,
63
+ "initializer_range": 0.02,
64
+ "intermediate_size": 4096,
65
+ "layer_norm_eps": 1e-05,
66
+ "layerdrop": 0.1,
67
+ "mask_feature_length": 10,
68
+ "mask_feature_min_masks": 0,
69
+ "mask_feature_prob": 0.0,
70
+ "mask_time_length": 10,
71
+ "mask_time_min_masks": 2,
72
+ "mask_time_prob": 0.075,
73
+ "model_type": "wav2vec2",
74
+ "num_adapter_layers": 3,
75
+ "num_attention_heads": 16,
76
+ "num_codevector_groups": 2,
77
+ "num_codevectors_per_group": 320,
78
+ "num_conv_pos_embedding_groups": 16,
79
+ "num_conv_pos_embeddings": 128,
80
+ "num_feat_extract_layers": 7,
81
+ "num_hidden_layers": 24,
82
+ "num_negatives": 100,
83
+ "output_hidden_size": 1024,
84
+ "pad_token_id": 0,
85
+ "proj_codevector_dim": 768,
86
+ "tdnn_dilation": [
87
+ 1,
88
+ 2,
89
+ 3,
90
+ 1,
91
+ 1
92
+ ],
93
+ "tdnn_dim": [
94
+ 512,
95
+ 512,
96
+ 512,
97
+ 512,
98
+ 1500
99
+ ],
100
+ "tdnn_kernel": [
101
+ 5,
102
+ 3,
103
+ 3,
104
+ 1,
105
+ 1
106
+ ],
107
+ "torch_dtype": "float32",
108
+ "transformers_version": "4.16.0.dev0",
109
+ "use_weighted_layer_sum": false,
110
+ "vocab_size": 32,
111
+ "xvector_output_dim": 512
112
+ }
113
+
114
+
115
  0%| | 0/1 [00:00<?, ?ba/s]
116
+
117
  0%| | 0/1 [00:00<?, ?ba/s]
118
+ Didn't find file ./tokenizer_config.json. We won't load it.
119
+ Didn't find file ./added_tokens.json. We won't load it.
120
+ Didn't find file ./special_tokens_map.json. We won't load it.
121
+ Didn't find file ./tokenizer.json. We won't load it.
122
+ loading file ./vocab.json
123
+ loading file None
124
+ loading file None
125
+ loading file None
126
+ loading file None
127
+ file ./config.json not found
128
+ Adding <s> to the vocabulary
129
+ Adding </s> to the vocabulary
130
+ Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.
131
+ loading configuration file https://huggingface.co/facebook/wav2vec2-xls-r-300m/resolve/main/config.json from cache at /home/sagrilaft/.cache/huggingface/transformers/dabc27df63e37bd2a7a221c7774e35f36a280fbdf917cf54cadfc7df8c786f6f.a3e4c3c967d9985881e0ae550a5f6f668f897db5ab2e0802f9b97973b15970e6
132
+ Model config Wav2Vec2Config {
133
+ "_name_or_path": "facebook/wav2vec2-xls-r-300m",
134
+ "activation_dropout": 0.0,
135
+ "adapter_kernel_size": 3,
136
+ "adapter_stride": 2,
137
+ "add_adapter": false,
138
+ "apply_spec_augment": true,
139
+ "architectures": [
140
+ "Wav2Vec2ForPreTraining"
141
+ ],
142
+ "attention_dropout": 0.1,
143
+ "bos_token_id": 1,
144
+ "classifier_proj_size": 256,
145
+ "codevector_dim": 768,
146
+ "contrastive_logits_temperature": 0.1,
147
+ "conv_bias": true,
148
+ "conv_dim": [
149
+ 512,
150
+ 512,
151
+ 512,
152
+ 512,
153
+ 512,
154
+ 512,
155
+ 512
156
+ ],
157
+ "conv_kernel": [
158
+ 10,
159
+ 3,
160
+ 3,
161
+ 3,
162
+ 3,
163
+ 2,
164
+ 2
165
+ ],
166
+ "conv_stride": [
167
+ 5,
168
+ 2,
169
+ 2,
170
+ 2,
171
+ 2,
172
+ 2,
173
+ 2
174
+ ],
175
+ "ctc_loss_reduction": "sum",
176
+ "ctc_zero_infinity": false,
177
+ "diversity_loss_weight": 0.1,
178
+ "do_stable_layer_norm": true,
179
+ "eos_token_id": 2,
180
+ "feat_extract_activation": "gelu",
181
+ "feat_extract_dropout": 0.0,
182
+ "feat_extract_norm": "layer",
183
+ "feat_proj_dropout": 0.1,
184
+ "feat_quantizer_dropout": 0.0,
185
+ "final_dropout": 0.0,
186
+ "gradient_checkpointing": false,
187
+ "hidden_act": "gelu",
188
+ "hidden_dropout": 0.1,
189
+ "hidden_size": 1024,
190
+ "initializer_range": 0.02,
191
+ "intermediate_size": 4096,
192
+ "layer_norm_eps": 1e-05,
193
+ "layerdrop": 0.1,
194
+ "mask_feature_length": 10,
195
+ "mask_feature_min_masks": 0,
196
+ "mask_feature_prob": 0.0,
197
+ "mask_time_length": 10,
198
+ "mask_time_min_masks": 2,
199
+ "mask_time_prob": 0.075,
200
+ "model_type": "wav2vec2",
201
+ "num_adapter_layers": 3,
202
+ "num_attention_heads": 16,
203
+ "num_codevector_groups": 2,
204
+ "num_codevectors_per_group": 320,
205
+ "num_conv_pos_embedding_groups": 16,
206
+ "num_conv_pos_embeddings": 128,
207
+ "num_feat_extract_layers": 7,
208
+ "num_hidden_layers": 24,
209
+ "num_negatives": 100,
210
+ "output_hidden_size": 1024,
211
+ "pad_token_id": 0,
212
+ "proj_codevector_dim": 768,
213
+ "tdnn_dilation": [
214
+ 1,
215
+ 2,
216
+ 3,
217
+ 1,
218
+ 1
219
+ ],
220
+ "tdnn_dim": [
221
+ 512,
222
+ 512,
223
+ 512,
224
+ 512,
225
+ 1500
226
+ ],
227
+ "tdnn_kernel": [
228
+ 5,
229
+ 3,
230
+ 3,
231
+ 1,
232
+ 1
233
+ ],
234
+ "torch_dtype": "float32",
235
+ "transformers_version": "4.16.0.dev0",
236
+ "use_weighted_layer_sum": false,
237
+ "vocab_size": 32,
238
+ "xvector_output_dim": 512
239
+ }
240
+
241
+ loading feature extractor configuration file https://huggingface.co/facebook/wav2vec2-xls-r-300m/resolve/main/preprocessor_config.json from cache at /home/sagrilaft/.cache/huggingface/transformers/6fb028b95b394059e7d3b367bbca2382b576c66aebe896f04d2cd34e1b575f5b.d4484dc1c81456a2461485e7168b04347a7b9a4e3b1ef3aba723323b33e12326
242
+ Feature extractor Wav2Vec2FeatureExtractor {
243
+ "do_normalize": true,
244
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
245
+ "feature_size": 1,
246
+ "padding_side": "right",
247
+ "padding_value": 0,
248
+ "return_attention_mask": true,
249
+ "sampling_rate": 16000
250
+ }
251
+
252
+ loading weights file https://huggingface.co/facebook/wav2vec2-xls-r-300m/resolve/main/pytorch_model.bin from cache at /home/sagrilaft/.cache/huggingface/transformers/1e6a6507f3b689035cd4b247e2a37c154e27f39143f31357a49b4e38baeccc36.1edb32803799e27ed554eb7dd935f6745b1a0b17b0ea256442fe24db6eb546cd
253
+ Some weights of the model checkpoint at facebook/wav2vec2-xls-r-300m were not used when initializing Wav2Vec2ForCTC: ['project_q.bias', 'project_q.weight', 'quantizer.weight_proj.weight', 'project_hid.bias', 'project_hid.weight', 'quantizer.codevectors', 'quantizer.weight_proj.bias']
254
+ - This IS expected if you are initializing Wav2Vec2ForCTC from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
255
+ - This IS NOT expected if you are initializing Wav2Vec2ForCTC from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
256
+ Some weights of Wav2Vec2ForCTC were not initialized from the model checkpoint at facebook/wav2vec2-xls-r-300m and are newly initialized: ['lm_head.bias', 'lm_head.weight']
257
+ You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
258
+
259
+
260
+
261
  0%| | 0/6 [00:00<?, ?ba/s]
262
+
263
  0%| | 0/3 [00:00<?, ?ba/s]
264
+ Configuration saved in ./preprocessor_config.json
265
+ tokenizer config file saved in ./tokenizer_config.json
266
+ Special tokens file saved in ./special_tokens_map.json
267
+ added tokens file saved in ./added_tokens.json
268
+ Configuration saved in ./config.json
269
+ loading feature extractor configuration file ./preprocessor_config.json
270
+ loading configuration file ./config.json
271
+ Model config Wav2Vec2Config {
272
+ "_name_or_path": "./",
273
+ "activation_dropout": 0.0,
274
+ "adapter_kernel_size": 3,
275
+ "adapter_stride": 2,
276
+ "add_adapter": false,
277
+ "apply_spec_augment": true,
278
+ "architectures": [
279
+ "Wav2Vec2ForPreTraining"
280
+ ],
281
+ "attention_dropout": 0.0,
282
+ "bos_token_id": 1,
283
+ "classifier_proj_size": 256,
284
+ "codevector_dim": 768,
285
+ "contrastive_logits_temperature": 0.1,
286
+ "conv_bias": true,
287
+ "conv_dim": [
288
+ 512,
289
+ 512,
290
+ 512,
291
+ 512,
292
+ 512,
293
+ 512,
294
+ 512
295
+ ],
296
+ "conv_kernel": [
297
+ 10,
298
+ 3,
299
+ 3,
300
+ 3,
301
+ 3,
302
+ 2,
303
+ 2
304
+ ],
305
+ "conv_stride": [
306
+ 5,
307
+ 2,
308
+ 2,
309
+ 2,
310
+ 2,
311
+ 2,
312
+ 2
313
+ ],
314
+ "ctc_loss_reduction": "mean",
315
+ "ctc_zero_infinity": false,
316
+ "diversity_loss_weight": 0.1,
317
+ "do_stable_layer_norm": true,
318
+ "eos_token_id": 2,
319
+ "feat_extract_activation": "gelu",
320
+ "feat_extract_dropout": 0.0,
321
+ "feat_extract_norm": "layer",
322
+ "feat_proj_dropout": 0.1,
323
+ "feat_quantizer_dropout": 0.0,
324
+ "final_dropout": 0.0,
325
+ "hidden_act": "gelu",
326
+ "hidden_dropout": 0.0,
327
+ "hidden_size": 1024,
328
+ "initializer_range": 0.02,
329
+ "intermediate_size": 4096,
330
+ "layer_norm_eps": 1e-05,
331
+ "layerdrop": 0.0,
332
+ "mask_feature_length": 10,
333
+ "mask_feature_min_masks": 0,
334
+ "mask_feature_prob": 0.0,
335
+ "mask_time_length": 10,
336
+ "mask_time_min_masks": 2,
337
+ "mask_time_prob": 0.1,
338
+ "model_type": "wav2vec2",
339
+ "num_adapter_layers": 3,
340
+ "num_attention_heads": 16,
341
+ "num_codevector_groups": 2,
342
+ "num_codevectors_per_group": 320,
343
+ "num_conv_pos_embedding_groups": 16,
344
+ "num_conv_pos_embeddings": 128,
345
+ "num_feat_extract_layers": 7,
346
+ "num_hidden_layers": 24,
347
+ "num_negatives": 100,
348
+ "output_hidden_size": 1024,
349
+ "pad_token_id": 36,
350
+ "proj_codevector_dim": 768,
351
+ "tdnn_dilation": [
352
+ 1,
353
+ 2,
354
+ 3,
355
+ 1,
356
+ 1
357
+ ],
358
+ "tdnn_dim": [
359
+ 512,
360
+ 512,
361
+ 512,
362
+ 512,
363
+ 1500
364
+ ],
365
+ "tdnn_kernel": [
366
+ 5,
367
+ 3,
368
+ 3,
369
+ 1,
370
+ 1
371
+ ],
372
+ "torch_dtype": "float32",
373
+ "transformers_version": "4.16.0.dev0",
374
+ "use_weighted_layer_sum": false,
375
+ "vocab_size": 39,
376
+ "xvector_output_dim": 512
377
+ }
378
+
379
+ loading feature extractor configuration file ./preprocessor_config.json
380
+ Feature extractor Wav2Vec2FeatureExtractor {
381
+ "do_normalize": true,
382
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
383
+ "feature_size": 1,
384
+ "padding_side": "right",
385
+ "padding_value": 0,
386
+ "return_attention_mask": true,
387
+ "sampling_rate": 16000
388
+ }
389
+
390
+ Didn't find file ./tokenizer.json. We won't load it.
391
+ loading file ./vocab.json
392
+ loading file ./tokenizer_config.json
393
+ loading file ./added_tokens.json
394
+ loading file ./special_tokens_map.json
395
+ loading file None
396
+ Adding <s> to the vocabulary
397
+ Adding </s> to the vocabulary
398
+ /home/sagrilaft/Project/audio/xls-r-et/./ is already a clone of https://huggingface.co/shpotes/xls-r-et. Make sure you pull the latest changes with `repo.git_pull()`.
399
+ Using amp half precision backend
400
+ The following columns in the training set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
401
+ ***** Running training *****
402
+ Num examples = 5705
403
+ Num Epochs = 500
404
+ Instantaneous batch size per device = 80
405
+ Total train batch size (w. parallel, distributed & accumulation) = 160
406
+ Gradient Accumulation steps = 2
407
+ Total optimization steps = 18000
408
+ Automatic Weights & Biases logging enabled, to disable set os.environ["WANDB_DISABLED"] = "true"
409
+ wandb: Currently logged in as: shpotes (use `wandb login --relogin` to force relogin)
410
+ wandb: Tracking run with wandb version 0.12.9
411
+ wandb: Syncing run cosine+drop_proj+low_specaugment-300M
412
+ wandb: View project at https://wandb.ai/shpotes/xls-r-estonian
413
+ wandb: View run at https://wandb.ai/shpotes/xls-r-estonian/runs/1xdiy2kf
414
+ wandb: Run data is saved locally in /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf
415
+ wandb: Run `wandb offline` to turn off syncing.
416
+
417
  0% 0/18000 [00:00<?, ?it/s]
418
  0% 1/18000 [00:17<86:26:02, 17.29s/it]
419
  0% 2/18000 [00:30<75:01:49, 15.01s/it]
420
  0% 3/18000 [00:41<65:24:50, 13.08s/it]
421
  0% 4/18000 [00:50<58:10:48, 11.64s/it]
422
  0% 5/18000 [00:59<52:10:20, 10.44s/it]
423
  0% 6/18000 [01:06<46:21:37, 9.28s/it]
424
  0% 7/18000 [01:12<40:36:25, 8.12s/it]
425
  0% 8/18000 [01:16<34:47:36, 6.96s/it]
426
  0% 9/18000 [01:33<50:28:39, 10.10s/it]
427
  0% 10/18000 [01:46<54:51:39, 10.98s/it]
428
  0% 11/18000 [01:57<54:52:13, 10.98s/it]
429
  0% 12/18000 [02:07<52:52:40, 10.58s/it]
430
  0% 13/18000 [02:15<49:41:21, 9.95s/it]
431
  0% 14/18000 [02:22<45:26:54, 9.10s/it]
432
  0% 15/18000 [02:28<40:51:40, 8.18s/it]
433
  0% 16/18000 [02:33<35:21:44, 7.08s/it]
434
  0% 17/18000 [02:49<49:42:15, 9.95s/it]
435
  0% 18/18000 [03:03<55:21:19, 11.08s/it]
436
  0% 19/18000 [03:14<55:04:47, 11.03s/it]
437
  0% 20/18000 [03:23<52:40:52, 10.55s/it]
438
  0% 21/18000 [03:32<49:32:32, 9.92s/it]
439
  0% 22/18000 [03:39<45:11:01, 9.05s/it]
440
  0% 23/18000 [03:45<40:31:29, 8.12s/it]
441
  0% 24/18000 [03:50<35:20:48, 7.08s/it]
442
  0% 25/18000 [04:06<49:22:23, 9.89s/it]
443
  0% 26/18000 [04:19<54:38:50, 10.95s/it]
444
  0% 27/18000 [04:30<54:41:00, 10.95s/it]
445
  0% 28/18000 [04:40<52:18:06, 10.48s/it]
446
  0% 29/18000 [04:48<49:00:52, 9.82s/it]
447
  0% 30/18000 [04:55<45:04:29, 9.03s/it]
448
  0% 31/18000 [05:01<40:27:51, 8.11s/it]
449
  0% 32/18000 [05:06<35:02:45, 7.02s/it]
450
  0% 33/18000 [05:20<46:37:19, 9.34s/it]
451
  0% 34/18000 [05:30<47:26:00, 9.50s/it]
452
  0% 35/18000 [05:37<43:56:15, 8.80s/it]
453
  0% 36/18000 [05:41<35:44:20, 7.16s/it]
454
  0% 37/18000 [05:57<49:56:45, 10.01s/it]
455
  0% 38/18000 [06:10<54:30:48, 10.93s/it]
456
  0% 39/18000 [06:21<54:14:33, 10.87s/it]
457
  0% 40/18000 [06:31<52:09:33, 10.46s/it]
458
  0% 41/18000 [06:39<49:11:45, 9.86s/it]
459
  0% 42/18000 [06:46<45:07:06, 9.04s/it]
460
  0% 43/18000 [06:52<40:22:51, 8.10s/it]
461
  0% 44/18000 [06:57<35:07:39, 7.04s/it]
462
  0% 45/18000 [07:13<48:38:37, 9.75s/it]
463
  0% 46/18000 [07:26<53:56:40, 10.82s/it]
464
  0% 47/18000 [07:37<53:51:56, 10.80s/it]
465
  0% 48/18000 [07:46<51:52:52, 10.40s/it]
466
  0% 49/18000 [07:55<48:44:50, 9.78s/it]
467
  0% 50/18000 [08:02<44:52:04, 9.00s/it]
468
  0% 51/18000 [08:08<40:35:01, 8.14s/it]
469
  0% 52/18000 [08:13<35:13:14, 7.06s/it]
470
  0% 53/18000 [08:29<49:34:56, 9.95s/it]
471
  0% 54/18000 [08:43<54:54:51, 11.02s/it]
472
  0% 55/18000 [08:54<54:39:48, 10.97s/it]
473
  0% 56/18000 [09:03<51:47:45, 10.39s/it]
474
  0% 57/18000 [09:11<48:30:24, 9.73s/it]
475
  0% 58/18000 [09:18<44:04:17, 8.84s/it]
476
  0% 59/18000 [09:23<39:07:38, 7.85s/it]
477
  0% 60/18000 [09:28<33:56:38, 6.81s/it]
478
  0% 61/18000 [09:44<48:31:20, 9.74s/it]
479
  0% 62/18000 [09:58<54:20:24, 10.91s/it]
480
  0% 63/18000 [10:09<54:07:29, 10.86s/it]
481
  0% 64/18000 [10:18<52:41:53, 10.58s/it]
482
  0% 65/18000 [10:27<49:44:17, 9.98s/it]
483
  0% 66/18000 [10:34<45:08:18, 9.06s/it]
484
  0% 67/18000 [10:40<40:27:18, 8.12s/it]
485
  0% 68/18000 [10:44<35:05:04, 7.04s/it]
486
  0% 69/18000 [11:00<47:40:09, 9.57s/it]
487
  0% 70/18000 [11:10<48:34:46, 9.75s/it]
488
  0% 71/18000 [11:17<44:54:05, 9.02s/it]
489
  0% 72/18000 [11:21<36:10:47, 7.27s/it]
490
  0% 73/18000 [11:37<50:11:00, 10.08s/it]
491
  0% 74/18000 [11:50<54:44:05, 10.99s/it]
492
  0% 75/18000 [12:01<54:03:33, 10.86s/it]
493
  0% 76/18000 [12:10<51:30:17, 10.34s/it]
494
  0% 77/18000 [12:18<48:16:12, 9.70s/it]
495
  0% 78/18000 [12:25<44:02:08, 8.85s/it]
496
  0% 79/18000 [12:31<39:24:36, 7.92s/it]
497
  0% 80/18000 [12:35<34:06:06, 6.85s/it]
498
  0% 81/18000 [12:52<48:23:03, 9.72s/it]
499
  0% 82/18000 [13:05<54:09:04, 10.88s/it]
500
  0% 83/18000 [13:16<54:31:03, 10.95s/it]
501
  0% 84/18000 [13:26<52:35:45, 10.57s/it]
502
  0% 85/18000 [13:34<49:34:08, 9.96s/it]
503
  0% 86/18000 [13:42<45:29:05, 9.14s/it]
504
  0% 87/18000 [13:48<40:44:29, 8.19s/it]
505
  0% 88/18000 [13:52<35:22:46, 7.11s/it]
506
  0% 89/18000 [14:09<49:08:37, 9.88s/it]
507
  0% 90/18000 [14:22<53:55:22, 10.84s/it]
508
  1% 91/18000 [14:33<53:54:12, 10.84s/it]
509
  1% 92/18000 [14:42<51:57:31, 10.45s/it]
510
  1% 93/18000 [14:50<48:11:46, 9.69s/it]
511
  1% 94/18000 [14:57<44:05:28, 8.86s/it]
512
  1% 95/18000 [15:02<39:02:47, 7.85s/it]
513
  1% 96/18000 [15:07<33:46:57, 6.79s/it]
514
  1% 97/18000 [15:23<48:11:08, 9.69s/it]
515
  1% 98/18000 [15:36<53:29:06, 10.76s/it]
516
  1% 99/18000 [15:47<53:25:40, 10.74s/it]
517
  1% 100/18000 [15:57<51:48:37, 10.42s/it]
518
 
519
  1% 100/18000 [15:57<51:48:37, 10.42s/it]
520
  1% 101/18000 [16:05<48:40:04, 9.79s/it]
521
  1% 102/18000 [16:12<44:23:01, 8.93s/it]
522
  1% 103/18000 [16:18<39:26:24, 7.93s/it]
523
  1% 104/18000 [16:22<34:15:20, 6.89s/it]
524
  1% 105/18000 [16:37<46:43:13, 9.40s/it]
525
  1% 106/18000 [16:47<47:23:12, 9.53s/it]
526
  1% 107/18000 [16:54<43:44:40, 8.80s/it]
527
  1% 108/18000 [16:58<35:46:46, 7.20s/it]
528
  1% 109/18000 [17:14<48:43:15, 9.80s/it]
529
  1% 110/18000 [17:27<54:09:47, 10.90s/it]
530
  1% 111/18000 [17:38<54:15:19, 10.92s/it]
531
  1% 112/18000 [17:48<52:17:25, 10.52s/it]
532
  1% 113/18000 [17:56<49:14:31, 9.91s/it]
533
  1% 114/18000 [18:03<45:07:53, 9.08s/it]
534
  1% 115/18000 [18:09<40:13:03, 8.10s/it]
535
  1% 116/18000 [18:13<34:43:29, 6.99s/it]
536
  1% 117/18000 [18:30<48:46:18, 9.82s/it]
537
  1% 118/18000 [18:43<53:31:11, 10.77s/it]
538
  1% 119/18000 [18:53<53:11:36, 10.71s/it]
539
  1% 120/18000 [19:03<50:56:21, 10.26s/it]
540
  1% 121/18000 [19:11<47:23:37, 9.54s/it]
541
  1% 122/18000 [19:17<43:07:59, 8.69s/it]
542
  1% 123/18000 [19:23<38:34:05, 7.77s/it]
543
  1% 124/18000 [19:27<33:23:03, 6.72s/it]
544
  1% 125/18000 [19:43<47:43:04, 9.61s/it]
545
  1% 126/18000 [19:57<53:09:48, 10.71s/it]
546
  1% 127/18000 [20:08<53:19:09, 10.74s/it]
547
  1% 128/18000 [20:17<51:20:03, 10.34s/it]
548
  1% 129/18000 [20:25<48:12:21, 9.71s/it]
549
  1% 130/18000 [20:32<43:58:10, 8.86s/it]
550
  1% 131/18000 [20:38<39:28:05, 7.95s/it]
551
  1% 132/18000 [20:42<34:15:06, 6.90s/it]
552
  1% 133/18000 [20:59<48:28:40, 9.77s/it]
553
  1% 134/18000 [21:12<53:33:44, 10.79s/it]
554
  1% 135/18000 [21:23<53:23:03, 10.76s/it]
555
  1% 136/18000 [21:32<51:19:46, 10.34s/it]
556
  1% 137/18000 [21:40<48:04:44, 9.69s/it]
557
  1% 138/18000 [21:47<43:54:30, 8.85s/it]
558
  1% 139/18000 [21:53<39:05:17, 7.88s/it]
559
  1% 140/18000 [21:57<34:00:50, 6.86s/it]
560
  1% 141/18000 [22:13<46:40:32, 9.41s/it]
561
  1% 142/18000 [22:23<47:51:15, 9.65s/it]
562
  1% 143/18000 [22:30<44:22:27, 8.95s/it]
563
  1% 144/18000 [22:34<36:18:44, 7.32s/it]
564
  1% 145/18000 [22:50<49:56:40, 10.07s/it]
565
  1% 146/18000 [23:03<54:50:33, 11.06s/it]
566
  1% 147/18000 [23:14<54:23:30, 10.97s/it]
567
  1% 148/18000 [23:24<51:53:58, 10.47s/it]
568
  1% 149/18000 [23:32<48:32:27, 9.79s/it]
569
  1% 150/18000 [23:39<44:37:06, 9.00s/it]
570
  1% 151/18000 [23:45<39:56:07, 8.05s/it]
571
  1% 152/18000 [23:49<34:30:40, 6.96s/it]
572
  1% 153/18000 [24:06<48:51:50, 9.86s/it]
573
  1% 154/18000 [24:19<54:08:29, 10.92s/it]
574
  1% 155/18000 [24:30<54:07:19, 10.92s/it]
575
  1% 156/18000 [24:39<51:49:42, 10.46s/it]
576
  1% 157/18000 [24:48<48:49:19, 9.85s/it]
577
  1% 158/18000 [24:55<44:54:15, 9.06s/it]
578
  1% 159/18000 [25:01<40:01:43, 8.08s/it]
579
  1% 160/18000 [25:05<34:36:26, 6.98s/it]
580
  1% 161/18000 [25:22<48:39:48, 9.82s/it]
581
  1% 162/18000 [25:35<53:20:53, 10.77s/it]
582
  1% 163/18000 [25:45<53:02:40, 10.71s/it]
583
  1% 164/18000 [25:55<51:11:53, 10.33s/it]
584
  1% 165/18000 [26:03<48:01:45, 9.69s/it]
585
  1% 166/18000 [26:10<43:51:38, 8.85s/it]
586
  1% 167/18000 [26:16<39:20:09, 7.94s/it]
587
  1% 168/18000 [26:20<34:07:20, 6.89s/it]
588
  1% 169/18000 [26:37<48:26:45, 9.78s/it]
589
  1% 170/18000 [26:50<54:05:34, 10.92s/it]
590
  1% 171/18000 [27:01<54:10:19, 10.94s/it]
591
  1% 172/18000 [27:11<51:47:16, 10.46s/it]
592
  1% 173/18000 [27:19<48:35:45, 9.81s/it]
593
  1% 174/18000 [27:26<44:17:21, 8.94s/it]
594
  1% 175/18000 [27:32<39:40:01, 8.01s/it]
595
  1% 176/18000 [27:36<34:26:47, 6.96s/it]
596
  1% 177/18000 [27:51<46:22:02, 9.37s/it]
597
  1% 178/18000 [28:01<46:54:42, 9.48s/it]
598
  1% 179/18000 [28:08<43:12:54, 8.73s/it]
599
  1% 180/18000 [28:11<34:51:46, 7.04s/it]
600
  1% 181/18000 [28:27<48:41:49, 9.84s/it]
601
  1% 182/18000 [28:41<53:47:06, 10.87s/it]
602
  1% 183/18000 [28:51<53:26:11, 10.80s/it]
603
  1% 184/18000 [29:00<51:13:34, 10.35s/it]
604
  1% 185/18000 [29:08<47:40:37, 9.63s/it]
605
  1% 186/18000 [29:15<43:41:55, 8.83s/it]
606
  1% 187/18000 [29:21<39:02:36, 7.89s/it]
607
  1% 188/18000 [29:25<33:33:56, 6.78s/it]
608
  1% 189/18000 [29:41<46:58:38, 9.50s/it]
609
  1% 190/18000 [29:55<52:50:48, 10.68s/it]
610
  1% 191/18000 [30:05<53:13:50, 10.76s/it]
611
  1% 192/18000 [30:15<51:19:04, 10.37s/it]
612
  1% 193/18000 [30:23<47:46:28, 9.66s/it]
613
  1% 194/18000 [30:30<43:50:18, 8.86s/it]
614
  1% 195/18000 [30:36<39:23:19, 7.96s/it]
615
  1% 196/18000 [30:40<34:17:27, 6.93s/it]
616
  1% 197/18000 [30:57<48:42:25, 9.85s/it]
617
  1% 198/18000 [31:11<54:34:28, 11.04s/it]
618
  1% 199/18000 [31:22<54:40:44, 11.06s/it]
619
  1% 200/18000 [31:32<53:10:28, 10.75s/it]
620
 
621
  1% 200/18000 [31:32<53:10:28, 10.75s/it]
622
  1% 201/18000 [31:40<49:47:14, 10.07s/it]
623
  1% 202/18000 [31:47<45:18:07, 9.16s/it]
624
  1% 203/18000 [31:53<40:20:20, 8.16s/it]
625
  1% 204/18000 [31:58<34:46:55, 7.04s/it]
626
  1% 205/18000 [32:14<48:45:25, 9.86s/it]
627
  1% 206/18000 [32:27<53:32:26, 10.83s/it]
628
  1% 207/18000 [32:38<53:17:02, 10.78s/it]
629
  1% 208/18000 [32:47<51:12:19, 10.36s/it]
630
  1% 209/18000 [32:56<48:09:33, 9.75s/it]
631
  1% 210/18000 [33:03<44:08:23, 8.93s/it]
632
  1% 211/18000 [33:09<39:35:55, 8.01s/it]
633
  1% 212/18000 [33:13<34:23:10, 6.96s/it]
634
  1% 213/18000 [33:28<46:28:43, 9.41s/it]
635
  1% 214/18000 [33:38<46:56:12, 9.50s/it]
636
  1% 215/18000 [33:45<43:27:58, 8.80s/it]
637
  1% 216/18000 [33:48<35:04:07, 7.10s/it]
638
  1% 217/18000 [34:04<48:42:58, 9.86s/it]
639
  1% 218/18000 [34:18<53:32:18, 10.84s/it]
640
  1% 219/18000 [34:28<53:14:19, 10.78s/it]
641
  1% 220/18000 [34:38<51:06:07, 10.35s/it]
642
  1% 221/18000 [34:46<47:42:29, 9.66s/it]
643
  1% 222/18000 [34:52<43:16:38, 8.76s/it]
644
  1% 223/18000 [34:58<38:47:18, 7.85s/it]
645
  1% 224/18000 [35:02<33:35:15, 6.80s/it]
646
  1% 225/18000 [35:18<46:55:15, 9.50s/it]
647
  1% 226/18000 [35:32<52:36:24, 10.66s/it]
648
  1% 227/18000 [35:42<52:47:45, 10.69s/it]
649
  1% 228/18000 [35:52<50:52:21, 10.31s/it]
650
  1% 229/18000 [36:00<48:08:38, 9.75s/it]
651
  1% 230/18000 [36:07<44:14:44, 8.96s/it]
652
  1% 231/18000 [36:13<39:37:28, 8.03s/it]
653
  1% 232/18000 [36:18<34:13:31, 6.93s/it]
654
  1% 233/18000 [36:34<48:28:27, 9.82s/it]
655
  1% 234/18000 [36:48<53:55:28, 10.93s/it]
656
  1% 235/18000 [36:59<54:07:48, 10.97s/it]
657
  1% 236/18000 [37:08<52:09:20, 10.57s/it]
658
  1% 237/18000 [37:17<48:42:27, 9.87s/it]
659
  1% 238/18000 [37:23<44:21:14, 8.99s/it]
660
  1% 239/18000 [37:29<39:44:51, 8.06s/it]
661
  1% 240/18000 [37:34<34:23:30, 6.97s/it]
662
  1% 241/18000 [37:50<48:42:06, 9.87s/it]
663
  1% 242/18000 [38:03<53:25:27, 10.83s/it]
664
  1% 243/18000 [38:14<52:55:48, 10.73s/it]
665
  1% 244/18000 [38:23<50:37:01, 10.26s/it]
666
  1% 245/18000 [38:31<47:27:12, 9.62s/it]
667
  1% 246/18000 [38:38<43:25:26, 8.81s/it]
668
  1% 247/18000 [38:44<39:01:44, 7.91s/it]
669
  1% 248/18000 [38:48<33:54:20, 6.88s/it]
670
  1% 249/18000 [39:04<46:20:55, 9.40s/it]
671
  1% 250/18000 [39:14<47:17:59, 9.59s/it]
672
  1% 251/18000 [39:21<43:48:05, 8.88s/it]
673
  1% 252/18000 [39:24<35:17:51, 7.16s/it]
674
  1% 253/18000 [39:41<49:42:54, 10.08s/it]
675
  1% 254/18000 [39:55<54:40:20, 11.09s/it]
676
  1% 255/18000 [40:05<54:05:56, 10.98s/it]
677
  1% 256/18000 [40:15<51:41:45, 10.49s/it]
678
  1% 257/18000 [40:23<48:34:31, 9.86s/it]
679
  1% 258/18000 [40:30<44:23:42, 9.01s/it]
680
  1% 259/18000 [40:36<39:40:19, 8.05s/it]
681
  1% 260/18000 [40:40<34:13:42, 6.95s/it]
682
  1% 261/18000 [40:57<48:18:11, 9.80s/it]
683
  1% 262/18000 [41:10<53:34:01, 10.87s/it]
684
  1% 263/18000 [41:21<53:19:57, 10.82s/it]
685
  1% 264/18000 [41:30<50:44:07, 10.30s/it]
686
  1% 265/18000 [41:38<47:15:09, 9.59s/it]
687
  1% 266/18000 [41:44<43:02:02, 8.74s/it]
688
  1% 267/18000 [41:50<38:41:55, 7.86s/it]
689
  1% 268/18000 [41:55<33:41:12, 6.84s/it]
690
  1% 269/18000 [42:11<47:53:19, 9.72s/it]
691
  2% 270/18000 [42:24<53:01:13, 10.77s/it]
692
  2% 271/18000 [42:35<53:02:40, 10.77s/it]
693
  2% 272/18000 [42:45<51:00:00, 10.36s/it]
694
  2% 273/18000 [42:53<48:01:13, 9.75s/it]
695
  2% 274/18000 [43:00<44:05:26, 8.95s/it]
696
  2% 275/18000 [43:06<39:29:31, 8.02s/it]
697
  2% 276/18000 [43:10<34:20:22, 6.97s/it]
698
  2% 277/18000 [43:27<48:36:20, 9.87s/it]
699
  2% 278/18000 [43:41<54:13:56, 11.02s/it]
700
  2% 279/18000 [43:52<54:12:18, 11.01s/it]
701
  2% 280/18000 [44:01<51:45:06, 10.51s/it]
702
  2% 281/18000 [44:10<48:47:06, 9.91s/it]
703
  2% 282/18000 [44:16<44:16:39, 9.00s/it]
704
  2% 283/18000 [44:22<39:08:42, 7.95s/it]
705
  2% 284/18000 [44:26<33:59:45, 6.91s/it]
706
  2% 285/18000 [44:42<46:30:46, 9.45s/it]
707
  2% 286/18000 [44:52<47:30:24, 9.65s/it]
708
  2% 287/18000 [44:59<43:54:19, 8.92s/it]
709
  2% 288/18000 [45:03<35:52:00, 7.29s/it]
710
  2% 289/18000 [45:19<49:57:55, 10.16s/it]
711
  2% 290/18000 [45:33<54:54:58, 11.16s/it]
712
  2% 291/18000 [45:44<54:40:30, 11.11s/it]
713
  2% 292/18000 [45:54<52:24:02, 10.65s/it]
714
  2% 293/18000 [46:02<48:53:00, 9.94s/it]
715
  2% 294/18000 [46:09<44:31:18, 9.05s/it]
716
  2% 295/18000 [46:15<39:58:45, 8.13s/it]
717
  2% 296/18000 [46:19<34:41:14, 7.05s/it]
718
  2% 297/18000 [46:36<48:25:58, 9.85s/it]
719
  2% 298/18000 [46:49<53:21:33, 10.85s/it]
720
  2% 299/18000 [47:00<53:00:52, 10.78s/it]
721
  2% 300/18000 [47:09<51:02:08, 10.38s/it]
722
 
723
  2% 300/18000 [47:09<51:02:08, 10.38s/it]
724
  2% 301/18000 [47:17<47:51:13, 9.73s/it]
725
  2% 302/18000 [47:24<43:43:29, 8.89s/it]
726
  2% 303/18000 [47:30<39:03:22, 7.94s/it]
727
  2% 304/18000 [47:34<33:47:15, 6.87s/it]
728
  2% 305/18000 [47:51<47:55:18, 9.75s/it]
729
  2% 306/18000 [48:04<52:59:15, 10.78s/it]
730
  2% 307/18000 [48:15<52:51:07, 10.75s/it]
731
  2% 308/18000 [48:24<50:25:56, 10.26s/it]
732
  2% 309/18000 [48:32<47:33:47, 9.68s/it]
733
  2% 310/18000 [48:39<43:29:15, 8.85s/it]
734
  2% 311/18000 [48:45<38:43:45, 7.88s/it]
735
  2% 312/18000 [48:49<33:28:13, 6.81s/it]
736
  2% 313/18000 [49:05<47:37:14, 9.69s/it]
737
  2% 314/18000 [49:19<53:06:18, 10.81s/it]
738
  2% 315/18000 [49:29<52:32:02, 10.69s/it]
739
  2% 316/18000 [49:39<50:37:01, 10.30s/it]
740
  2% 317/18000 [49:47<47:35:40, 9.69s/it]
741
  2% 318/18000 [49:54<43:33:20, 8.87s/it]
742
  2% 319/18000 [50:00<39:14:50, 7.99s/it]
743
  2% 320/18000 [50:04<34:09:36, 6.96s/it]
744
  2% 321/18000 [50:19<46:07:44, 9.39s/it]
745
  2% 322/18000 [50:29<47:04:05, 9.59s/it]
746
  2% 323/18000 [50:37<43:38:37, 8.89s/it]
747
  2% 324/18000 [50:40<35:28:44, 7.23s/it]
748
  2% 325/18000 [50:56<49:06:27, 10.00s/it]
749
  2% 326/18000 [51:10<53:47:16, 10.96s/it]
750
  2% 327/18000 [51:20<53:23:03, 10.87s/it]
751
  2% 328/18000 [51:30<51:14:24, 10.44s/it]
752
  2% 329/18000 [51:38<48:08:52, 9.81s/it]
753
  2% 330/18000 [51:45<44:04:02, 8.98s/it]
754
  2% 331/18000 [51:51<39:27:52, 8.04s/it]
755
  2% 332/18000 [51:55<34:01:15, 6.93s/it]
756
  2% 333/18000 [52:12<47:55:08, 9.76s/it]
757
  2% 334/18000 [52:25<52:58:37, 10.80s/it]
758
  2% 335/18000 [52:36<53:03:41, 10.81s/it]
759
  2% 336/18000 [52:45<51:22:12, 10.47s/it]
760
  2% 337/18000 [52:54<48:17:41, 9.84s/it]
761
  2% 338/18000 [53:01<44:04:01, 8.98s/it]
762
  2% 339/18000 [53:06<39:19:19, 8.02s/it]
763
  2% 340/18000 [53:11<33:59:49, 6.93s/it]
764
  2% 341/18000 [53:28<48:17:19, 9.84s/it]
765
  2% 342/18000 [53:40<52:48:55, 10.77s/it]
766
  2% 343/18000 [53:51<52:45:57, 10.76s/it]
767
  2% 344/18000 [54:00<50:32:06, 10.30s/it]
768
  2% 345/18000 [54:09<47:20:31, 9.65s/it]
769
  2% 346/18000 [54:15<43:17:34, 8.83s/it]
770
  2% 347/18000 [54:21<38:41:00, 7.89s/it]
771
  2% 348/18000 [54:25<33:24:17, 6.81s/it]
772
  2% 349/18000 [54:42<47:36:12, 9.71s/it]
773
  2% 350/18000 [54:55<52:56:31, 10.80s/it]
774
  2% 351/18000 [55:05<52:05:17, 10.62s/it]
775
  2% 352/18000 [55:15<49:57:37, 10.19s/it]
776
  2% 353/18000 [55:23<46:53:40, 9.57s/it]
777
  2% 354/18000 [55:30<42:56:28, 8.76s/it]
778
  2% 355/18000 [55:35<38:35:32, 7.87s/it]
779
  2% 356/18000 [55:40<33:34:24, 6.85s/it]
780
  2% 357/18000 [55:55<46:02:43, 9.40s/it]
781
  2% 358/18000 [56:05<47:14:04, 9.64s/it]
782
  2% 359/18000 [56:13<43:54:21, 8.96s/it]
783
  2% 360/18000 [56:16<35:44:58, 7.30s/it]
784
  2% 361/18000 [56:33<49:37:45, 10.13s/it]
785
  2% 362/18000 [56:46<54:18:29, 11.08s/it]
786
  2% 363/18000 [56:57<53:18:49, 10.88s/it]
787
  2% 364/18000 [57:06<50:43:27, 10.35s/it]
788
  2% 365/18000 [57:14<47:50:00, 9.76s/it]
789
  2% 366/18000 [57:21<43:42:30, 8.92s/it]
790
  2% 367/18000 [57:27<38:47:25, 7.92s/it]
791
  2% 368/18000 [57:31<33:26:40, 6.83s/it]
792
  2% 369/18000 [57:47<47:20:50, 9.67s/it]
793
  2% 370/18000 [58:01<52:33:21, 10.73s/it]
794
  2% 371/18000 [58:11<52:40:27, 10.76s/it]
795
  2% 372/18000 [58:21<50:37:46, 10.34s/it]
796
  2% 373/18000 [58:29<47:13:33, 9.65s/it]
797
  2% 374/18000 [58:36<43:15:43, 8.84s/it]
798
  2% 375/18000 [58:41<38:46:26, 7.92s/it]
799
  2% 376/18000 [58:46<33:49:26, 6.91s/it]
800
  2% 377/18000 [59:03<47:58:02, 9.80s/it]
801
  2% 378/18000 [59:16<53:14:23, 10.88s/it]
802
  2% 379/18000 [59:27<53:21:26, 10.90s/it]
803
  2% 380/18000 [59:37<51:32:24, 10.53s/it]
804
  2% 381/18000 [59:45<48:23:16, 9.89s/it]
805
  2% 382/18000 [59:52<44:25:48, 9.08s/it]
806
  2% 383/18000 [59:58<39:54:39, 8.16s/it]
807
  2% 384/18000 [1:00:03<34:22:55, 7.03s/it]
808
  2% 385/18000 [1:00:19<48:14:08, 9.86s/it]
809
  2% 386/18000 [1:00:32<53:13:30, 10.88s/it]
810
  2% 387/18000 [1:00:43<52:53:09, 10.81s/it]
811
  2% 388/18000 [1:00:52<50:27:17, 10.31s/it]
812
  2% 389/18000 [1:01:00<47:11:15, 9.65s/it]
813
  2% 390/18000 [1:01:07<43:01:58, 8.80s/it]
814
  2% 391/18000 [1:01:13<38:27:51, 7.86s/it]
815
  2% 392/18000 [1:01:17<33:21:31, 6.82s/it]
816
  2% 393/18000 [1:01:32<44:31:41, 9.10s/it]
817
  2% 394/18000 [1:01:41<45:48:47, 9.37s/it]
818
  2% 395/18000 [1:01:49<42:48:03, 8.75s/it]
819
  2% 396/18000 [1:01:52<34:58:38, 7.15s/it]
820
  2% 397/18000 [1:02:09<48:50:53, 9.99s/it]
821
  2% 398/18000 [1:02:22<53:43:53, 10.99s/it]
822
  2% 399/18000 [1:02:33<53:20:56, 10.91s/it]
823
  2% 400/18000 [1:02:42<51:16:29, 10.49s/it]
824
 
825
  2% 400/18000 [1:02:42<51:16:29, 10.49s/it]
826
  2% 401/18000 [1:02:51<48:04:04, 9.83s/it]
827
  2% 402/18000 [1:02:58<43:47:40, 8.96s/it]
828
  2% 403/18000 [1:03:03<39:11:36, 8.02s/it]
829
  2% 404/18000 [1:03:08<33:59:02, 6.95s/it]
830
  2% 405/18000 [1:03:24<47:36:15, 9.74s/it]
831
  2% 406/18000 [1:03:37<52:47:43, 10.80s/it]
832
  2% 407/18000 [1:03:48<52:48:26, 10.81s/it]
833
  2% 408/18000 [1:03:58<50:44:50, 10.38s/it]
834
  2% 409/18000 [1:04:06<47:49:35, 9.79s/it]
835
  2% 410/18000 [1:04:13<43:57:02, 9.00s/it]
836
  2% 411/18000 [1:04:19<39:21:08, 8.05s/it]
837
  2% 412/18000 [1:04:23<33:57:31, 6.95s/it]
838
  2% 413/18000 [1:04:40<47:43:17, 9.77s/it]
839
  2% 414/18000 [1:04:53<53:05:33, 10.87s/it]
840
  2% 415/18000 [1:05:04<53:03:39, 10.86s/it]
841
  2% 416/18000 [1:05:14<51:10:13, 10.48s/it]
842
  2% 417/18000 [1:05:22<47:58:19, 9.82s/it]
843
  2% 418/18000 [1:05:29<43:46:49, 8.96s/it]
844
  2% 419/18000 [1:05:35<39:10:03, 8.02s/it]
845
  2% 420/18000 [1:05:39<33:58:45, 6.96s/it]
846
  2% 421/18000 [1:05:56<48:16:48, 9.89s/it]
847
  2% 422/18000 [1:06:09<53:30:55, 10.96s/it]
848
  2% 423/18000 [1:06:20<53:13:22, 10.90s/it]
849
  2% 424/18000 [1:06:29<50:26:10, 10.33s/it]
850
  2% 425/18000 [1:06:37<47:08:56, 9.66s/it]
851
  2% 426/18000 [1:06:44<43:19:15, 8.87s/it]
852
  2% 427/18000 [1:06:50<38:33:18, 7.90s/it]
853
  2% 428/18000 [1:06:54<33:33:27, 6.88s/it]
854
  2% 429/18000 [1:07:09<44:43:15, 9.16s/it]
855
  2% 430/18000 [1:07:19<46:00:07, 9.43s/it]
856
  2% 431/18000 [1:07:26<43:11:33, 8.85s/it]
857
  2% 432/18000 [1:07:30<34:56:30, 7.16s/it]
858
  2% 433/18000 [1:07:46<48:49:24, 10.01s/it]
859
  2% 434/18000 [1:08:00<53:38:05, 10.99s/it]
860
  2% 435/18000 [1:08:10<53:09:03, 10.89s/it]
861
  2% 436/18000 [1:08:19<50:38:26, 10.38s/it]
862
  2% 437/18000 [1:08:27<47:14:39, 9.68s/it]
863
  2% 438/18000 [1:08:34<42:52:00, 8.79s/it]
864
  2% 439/18000 [1:08:40<38:20:18, 7.86s/it]
865
  2% 440/18000 [1:08:44<33:10:31, 6.80s/it]
866
  2% 441/18000 [1:09:01<47:29:55, 9.74s/it]
867
  2% 442/18000 [1:09:14<52:47:34, 10.82s/it]
868
  2% 443/18000 [1:09:25<52:43:24, 10.81s/it]
869
  2% 444/18000 [1:09:34<50:46:19, 10.41s/it]
870
  2% 445/18000 [1:09:43<47:42:44, 9.78s/it]
871
  2% 446/18000 [1:09:50<43:40:10, 8.96s/it]
872
  2% 447/18000 [1:09:56<39:20:53, 8.07s/it]
873
  2% 448/18000 [1:10:00<34:14:21, 7.02s/it]
874
  2% 449/18000 [1:10:17<48:02:46, 9.86s/it]
875
  2% 450/18000 [1:10:30<53:38:52, 11.00s/it]
876
  3% 451/18000 [1:10:41<53:33:23, 10.99s/it]
877
  3% 452/18000 [1:10:51<51:28:10, 10.56s/it]
878
  3% 453/18000 [1:10:59<47:59:20, 9.85s/it]
879
  3% 454/18000 [1:11:06<43:39:42, 8.96s/it]
880
  3% 455/18000 [1:11:12<39:03:03, 8.01s/it]
881
  3% 456/18000 [1:11:16<33:48:03, 6.94s/it]
882
  3% 457/18000 [1:11:33<47:28:06, 9.74s/it]
883
  3% 458/18000 [1:11:46<52:13:26, 10.72s/it]
884
  3% 459/18000 [1:11:56<52:11:58, 10.71s/it]
885
  3% 460/18000 [1:12:06<50:26:50, 10.35s/it]
886
  3% 461/18000 [1:12:14<47:11:11, 9.69s/it]
887
  3% 462/18000 [1:12:21<43:22:01, 8.90s/it]
888
  3% 463/18000 [1:12:27<38:48:08, 7.97s/it]
889
  3% 464/18000 [1:12:31<33:40:40, 6.91s/it]
890
  3% 465/18000 [1:12:46<45:41:28, 9.38s/it]
891
  3% 466/18000 [1:12:56<46:32:41, 9.56s/it]
892
  3% 467/18000 [1:13:03<43:03:28, 8.84s/it]
893
  3% 468/18000 [1:13:07<34:43:53, 7.13s/it]
894
  3% 469/18000 [1:13:23<48:48:43, 10.02s/it]
895
  3% 470/18000 [1:13:37<54:05:41, 11.11s/it]
896
  3% 471/18000 [1:13:48<53:57:52, 11.08s/it]
897
  3% 472/18000 [1:13:58<51:57:14, 10.67s/it]
898
  3% 473/18000 [1:14:06<48:17:17, 9.92s/it]
899
  3% 474/18000 [1:14:13<44:14:22, 9.09s/it]
900
  3% 475/18000 [1:14:19<39:36:15, 8.14s/it]
901
  3% 476/18000 [1:14:24<34:21:02, 7.06s/it]
902
  3% 477/18000 [1:14:40<47:52:39, 9.84s/it]
903
  3% 478/18000 [1:14:53<52:38:58, 10.82s/it]
904
  3% 479/18000 [1:15:04<52:32:09, 10.79s/it]
905
  3% 480/18000 [1:15:13<50:33:14, 10.39s/it]
906
  3% 481/18000 [1:15:22<47:38:56, 9.79s/it]
907
  3% 482/18000 [1:15:28<43:19:51, 8.90s/it]
908
  3% 483/18000 [1:15:34<38:46:14, 7.97s/it]
909
  3% 484/18000 [1:15:39<33:35:21, 6.90s/it]
910
  3% 485/18000 [1:15:55<47:26:03, 9.75s/it]
911
  3% 486/18000 [1:16:08<52:32:49, 10.80s/it]
912
  3% 487/18000 [1:16:19<52:38:09, 10.82s/it]
913
  3% 488/18000 [1:16:28<50:31:07, 10.39s/it]
914
  3% 489/18000 [1:16:37<47:24:15, 9.75s/it]
915
  3% 490/18000 [1:16:44<43:32:47, 8.95s/it]
916
  3% 491/18000 [1:16:50<39:21:30, 8.09s/it]
917
  3% 492/18000 [1:16:54<34:02:14, 7.00s/it]
918
  3% 493/18000 [1:17:11<48:38:09, 10.00s/it]
919
  3% 494/18000 [1:17:25<53:24:35, 10.98s/it]
920
  3% 495/18000 [1:17:35<52:53:14, 10.88s/it]
921
  3% 496/18000 [1:17:45<50:41:49, 10.43s/it]
922
  3% 497/18000 [1:17:53<47:21:35, 9.74s/it]
923
  3% 498/18000 [1:18:00<43:18:58, 8.91s/it]
924
  3% 499/18000 [1:18:05<38:28:50, 7.92s/it]
925
  3% 500/18000 [1:18:10<33:36:35, 6.91s/it]
926
 
927
  3% 500/18000 [1:18:10<33:36:35, 6.91s/it]The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
928
+ ***** Running Evaluation *****
929
+ Num examples = 2609
930
+ Batch size = 80
931
+
932
+
933
  0% 0/33 [00:00<?, ?it/s]
934
+
935
  6% 2/33 [00:04<01:10, 2.26s/it]
936
+
937
  9% 3/33 [00:08<01:33, 3.13s/it]
938
+
939
  12% 4/33 [00:12<01:39, 3.44s/it]
940
+
941
  15% 5/33 [00:16<01:42, 3.64s/it]
942
+
943
  18% 6/33 [00:20<01:42, 3.79s/it]
944
+
945
  21% 7/33 [00:24<01:38, 3.80s/it]
946
+
947
  24% 8/33 [00:28<01:36, 3.85s/it]
948
+
949
  27% 9/33 [00:32<01:33, 3.88s/it]
950
+
951
  30% 10/33 [00:37<01:33, 4.07s/it]
952
+
953
  33% 11/33 [00:41<01:29, 4.06s/it]
954
+
955
  36% 12/33 [00:45<01:24, 4.04s/it]
956
+
957
  39% 13/33 [00:49<01:19, 3.98s/it]
958
+
959
  42% 14/33 [00:53<01:16, 4.03s/it]
960
+
961
  45% 15/33 [00:57<01:12, 4.04s/it]
962
+
963
  48% 16/33 [01:01<01:10, 4.17s/it]
964
+
965
  52% 17/33 [01:06<01:09, 4.32s/it]
966
+
967
  55% 18/33 [01:10<01:03, 4.24s/it]
968
+
969
  58% 19/33 [01:14<00:59, 4.24s/it]
970
+
971
  61% 20/33 [01:19<00:55, 4.31s/it]
972
+
973
  64% 21/33 [01:23<00:52, 4.34s/it]
974
+
975
  67% 22/33 [01:27<00:47, 4.33s/it]
976
+
977
  70% 23/33 [01:32<00:43, 4.38s/it]
978
+
979
  73% 24/33 [01:36<00:39, 4.39s/it]
980
+
981
  76% 25/33 [01:41<00:35, 4.42s/it]
982
+
983
  79% 26/33 [01:45<00:30, 4.37s/it]
984
+
985
  82% 27/33 [01:49<00:25, 4.31s/it]
986
+
987
  85% 28/33 [01:54<00:21, 4.34s/it]
988
+
989
  88% 29/33 [01:57<00:16, 4.09s/it]
990
+
991
  91% 30/33 [02:00<00:11, 3.70s/it]
992
+
993
  94% 31/33 [02:03<00:06, 3.40s/it]
994
+
995
  97% 32/33 [02:05<00:03, 3.18s/it]
996
+
997
+
998
 
999
 
1000
+
1001
  3% 500/18000 [1:20:23<33:36:35, 6.91s/it]
1002
+
1003
  Saving model checkpoint to ./checkpoint-500
1004
+ Configuration saved in ./checkpoint-500/config.json
1005
+ Model weights saved in ./checkpoint-500/pytorch_model.bin
1006
+ Configuration saved in ./checkpoint-500/preprocessor_config.json
1007
+ Configuration saved in ./preprocessor_config.json
logs ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 01/26/2022 10:56:56 - WARNING - __main__ - Process rank: -1, device: cuda:0, n_gpu: 1distributed training: False, 16-bits training: True
2
+ 01/26/2022 10:56:56 - INFO - __main__ - Training/evaluation parameters TrainingArguments(
3
+ _n_gpu=1,
4
+ adafactor=False,
5
+ adam_beta1=0.9,
6
+ adam_beta2=0.999,
7
+ adam_epsilon=1e-08,
8
+ bf16=False,
9
+ bf16_full_eval=False,
10
+ dataloader_drop_last=False,
11
+ dataloader_num_workers=0,
12
+ dataloader_pin_memory=True,
13
+ ddp_bucket_cap_mb=None,
14
+ ddp_find_unused_parameters=None,
15
+ debug=[],
16
+ deepspeed=None,
17
+ disable_tqdm=False,
18
+ do_eval=True,
19
+ do_predict=False,
20
+ do_train=True,
21
+ eval_accumulation_steps=None,
22
+ eval_steps=500,
23
+ evaluation_strategy=IntervalStrategy.STEPS,
24
+ fp16=True,
25
+ fp16_backend=auto,
26
+ fp16_full_eval=False,
27
+ fp16_opt_level=O1,
28
+ gradient_accumulation_steps=2,
29
+ gradient_checkpointing=True,
30
+ greater_is_better=None,
31
+ group_by_length=True,
32
+ half_precision_backend=auto,
33
+ hub_model_id=None,
34
+ hub_strategy=HubStrategy.EVERY_SAVE,
35
+ hub_token=<HUB_TOKEN>,
36
+ ignore_data_skip=False,
37
+ label_names=None,
38
+ label_smoothing_factor=0.0,
39
+ learning_rate=0.0003,
40
+ length_column_name=input_length,
41
+ load_best_model_at_end=False,
42
+ local_rank=-1,
43
+ log_level=-1,
44
+ log_level_replica=-1,
45
+ log_on_each_node=True,
46
+ logging_dir=./runs/Jan26_10-56-56_ganymede.eafit.edu.co,
47
+ logging_first_step=False,
48
+ logging_nan_inf_filter=True,
49
+ logging_steps=100,
50
+ logging_strategy=IntervalStrategy.STEPS,
51
+ lr_scheduler_type=SchedulerType.COSINE,
52
+ max_grad_norm=1.0,
53
+ max_steps=-1,
54
+ metric_for_best_model=None,
55
+ mp_parameters=,
56
+ no_cuda=False,
57
+ num_train_epochs=500.0,
58
+ optim=OptimizerNames.ADAMW_HF,
59
+ output_dir=./,
60
+ overwrite_output_dir=True,
61
+ past_index=-1,
62
+ per_device_eval_batch_size=80,
63
+ per_device_train_batch_size=80,
64
+ prediction_loss_only=False,
65
+ push_to_hub=True,
66
+ push_to_hub_model_id=None,
67
+ push_to_hub_organization=None,
68
+ push_to_hub_token=<PUSH_TO_HUB_TOKEN>,
69
+ remove_unused_columns=True,
70
+ report_to=['wandb'],
71
+ resume_from_checkpoint=None,
72
+ run_name=cosine+drop_proj+low_specaugment-300M,
73
+ save_on_each_node=False,
74
+ save_steps=500,
75
+ save_strategy=IntervalStrategy.STEPS,
76
+ save_total_limit=1,
77
+ seed=42,
78
+ sharded_ddp=[],
79
+ skip_memory_metrics=True,
80
+ tf32=None,
81
+ tpu_metrics_debug=False,
82
+ tpu_num_cores=None,
83
+ use_legacy_prediction_loop=False,
84
+ warmup_ratio=0.0,
85
+ warmup_steps=500,
86
+ weight_decay=0.0,
87
+ xpu_backend=None,
88
+ )
89
+ 01/26/2022 10:57:00 - WARNING - datasets.builder - Reusing dataset common_voice (/home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba)
90
+ 01/26/2022 10:57:02 - WARNING - datasets.builder - Reusing dataset common_voice (/home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba)
91
+ 01/26/2022 10:57:02 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba/cache-f4479ce33e07f5c7.arrow
92
+ 01/26/2022 10:57:02 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/sagrilaft/.cache/huggingface/datasets/mozilla-foundation___common_voice/et/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba/cache-105cefde64f772a9.arrow
93
+ 01/26/2022 10:58:44 - WARNING - huggingface_hub.repository - /home/sagrilaft/Project/audio/xls-r-et/./ is already a clone of https://huggingface.co/shpotes/xls-r-et. Make sure you pull the latest changes with `repo.git_pull()`.
94
+
95
+ {'loss': 4.5903, 'learning_rate': 0.00019800000000000002, 'epoch': 2.78}
96
+ {'loss': 2.9083, 'learning_rate': 0.000398, 'epoch': 5.56}
97
+ {'loss': 1.2823, 'learning_rate': 0.000598, 'epoch': 8.33}
98
+ {'loss': 0.3962, 'learning_rate': 0.0007980000000000001, 'epoch': 11.11}
99
+ {'loss': 0.3034, 'learning_rate': 0.000998, 'epoch': 13.89}
preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "return_attention_mask": true,
8
+ "sampling_rate": 16000
9
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aae5e50ef4a8b89fd5fb88e1636f3e95144e39211b78b0a3f3767d443d62958
3
+ size 1262083569
run-1b.sh CHANGED
@@ -13,7 +13,7 @@ python src/run_speech_recognition_ctc_bnb.py \
13
  --per_device_train_batch_size=48 \
14
  --per_device_eval_batch_size=48 \
15
  --gradient_accumulation_steps=2 \
16
- --learning_rate=3e-4 \
17
  --save_total_limit=1 \
18
  --warmup_steps=500 \
19
  --evaluation_strategy=steps \
 
13
  --per_device_train_batch_size=48 \
14
  --per_device_eval_batch_size=48 \
15
  --gradient_accumulation_steps=2 \
16
+ --learning_rate=5e-5 \
17
  --save_total_limit=1 \
18
  --warmup_steps=500 \
19
  --evaluation_strategy=steps \
run-300M.sh CHANGED
@@ -9,7 +9,7 @@ python src/run_speech_recognition_ctc_bnb.py \
9
  --dataset_config_name="et" \
10
  --output_dir="./" \
11
  --overwrite_output_dir \
12
- --num_train_epochs=100 \
13
  --per_device_train_batch_size=80 \
14
  --per_device_eval_batch_size=80 \
15
  --gradient_accumulation_steps=2 \
@@ -19,8 +19,8 @@ python src/run_speech_recognition_ctc_bnb.py \
19
  --evaluation_strategy=steps \
20
  --text_column_name=sentence \
21
  --length_column_name=input_length \
22
- --save_steps=1000 \
23
- --eval_steps=250 \
24
  --logging_steps=100 \
25
  --layerdrop=0.0 \
26
  --freeze_feature_encoder \
 
9
  --dataset_config_name="et" \
10
  --output_dir="./" \
11
  --overwrite_output_dir \
12
+ --num_train_epochs=500 \
13
  --per_device_train_batch_size=80 \
14
  --per_device_eval_batch_size=80 \
15
  --gradient_accumulation_steps=2 \
 
19
  --evaluation_strategy=steps \
20
  --text_column_name=sentence \
21
  --length_column_name=input_length \
22
+ --save_steps=500 \
23
+ --eval_steps=500 \
24
  --logging_steps=100 \
25
  --layerdrop=0.0 \
26
  --freeze_feature_encoder \
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "./", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9be3a7c88f8500cf6b3a8b0b089125768d465147886310e4abb4ddc8cf154dd1
3
+ size 3055
vocab.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"a": 1, "b": 2, "c": 3, "d": 4, "e": 5, "f": 6, "g": 7, "h": 8, "i": 9, "j": 10, "k": 11, "l": 12, "m": 13, "n": 14, "o": 15, "p": 16, "q": 17, "r": 18, "s": 19, "t": 20, "u": 21, "v": 22, "w": 23, "x": 24, "y": 25, "z": 26, "ä": 27, "õ": 28, "ö": 29, "ü": 30, "š": 31, "ž": 32, "̇": 33, "„": 34, "|": 0, "[UNK]": 35, "[PAD]": 36}
wandb/debug-internal.log ADDED
@@ -0,0 +1 @@
 
 
1
+ run-20220126_121554-295enqix/logs/debug-internal.log
wandb/debug.log ADDED
@@ -0,0 +1 @@
 
 
1
+ run-20220126_121554-295enqix/logs/debug.log
wandb/latest-run ADDED
@@ -0,0 +1 @@
 
 
1
+ run-20220126_121554-295enqix
wandb/run-20220126_105847-1xdiy2kf/files/config.yaml ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220126_105847-1xdiy2kf/files/output.log ADDED
@@ -0,0 +1,544 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+
4
+
5
+
6
+
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+
27
+
28
+
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+
38
+
39
+
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+
49
+
50
+
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+
60
+
61
+
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+
71
+
72
+
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+
82
+
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+
93
+
94
+
95
+
96
+
97
+
98
+
99
+
100
+
101
+
102
+
103
+
104
+
105
+
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+
116
+
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+
128
+
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+
139
+
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+
149
+
150
+
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+
161
+
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+
172
+
173
+
174
+
175
+
176
+
177
+
178
+
179
+
180
+
181
+
182
+
183
+
184
+
185
+
186
+
187
+
188
+
189
+
190
+
191
+
192
+
193
+
194
+
195
+
196
+
197
+
198
+
199
+
200
+
201
+
202
+
203
+
204
+
205
+
206
+
207
+
208
+
209
+
210
+
211
+
212
+
213
+
214
+
215
+
216
+
217
+
218
+
219
+
220
+
221
+
222
+
223
+
224
+
225
+
226
+
227
+
228
+
229
+
230
+
231
+
232
+
233
+
234
+
235
+
236
+
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
+
245
+
246
+
247
+
248
+
249
+
250
+
251
+
252
+
253
+
254
+
255
+
256
+
257
+
258
+
259
+
260
+
261
+
262
+
263
+
264
+
265
+
266
+
267
+
268
+
269
+
270
+
271
+
272
+
273
+
274
+
275
+
276
+
277
+
278
+
279
+
280
+
281
+
282
+
283
+
284
+
285
+
286
+
287
+
288
+
289
+
290
+
291
+
292
+
293
+
294
+
295
+
296
+
297
+
298
+
299
+
300
+
301
+
302
+
303
+
304
+
305
+
306
+
307
+
308
+
309
+
310
+
311
+
312
+
313
+
314
+
315
+
316
+
317
+
318
+
319
+
320
+
321
+
322
+
323
+
324
+
325
+
326
+
327
+
328
+
329
+
330
+
331
+
332
+
333
+
334
+
335
+
336
+
337
+
338
+
339
+
340
+
341
+
342
+
343
+
344
+
345
+
346
+
347
+
348
+
349
+
350
+
351
+
352
+
353
+
354
+
355
+
356
+
357
+
358
+
359
+
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+
388
+
389
+
390
+
391
+
392
+
393
+
394
+
395
+
396
+
397
+
398
+
399
+
400
+
401
+
402
+
403
+
404
+
405
+
406
+
407
+
408
+
409
+
410
+
411
+
412
+
413
+
414
+
415
+
416
+
417
+
418
+
419
+
420
+
421
+
422
+
423
+
424
+
425
+
426
+
427
+
428
+
429
+
430
+
431
+
432
+
433
+
434
+
435
+
436
+
437
+
438
+
439
+
440
+
441
+
442
+
443
+
444
+
445
+
446
+
447
+
448
+
449
+
450
+
451
+
452
+
453
+
454
+
455
+
456
+
457
+
458
+
459
+
460
+
461
+
462
+
463
+
464
+
465
+
466
+
467
+
468
+
469
+
470
+
471
+
472
+
473
+
474
+
475
+
476
+
477
+
478
+
479
+
480
+
481
+
482
+
483
+
484
+
485
+
486
+
487
+
488
+
489
+
490
+
491
+
492
+
493
+
494
+
495
+
496
+
497
+
498
+
499
+
500
+
501
+ 3% 500/18000 [1:18:10<33:36:35, 6.91s/it]The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.
502
+ ***** Running Evaluation *****
503
+ Num examples = 2609
504
+ Batch size = 80
505
+ {'loss': 4.5903, 'learning_rate': 0.00019800000000000002, 'epoch': 2.78}
506
+ {'loss': 2.9083, 'learning_rate': 0.000398, 'epoch': 5.56}
507
+ {'loss': 1.2823, 'learning_rate': 0.000598, 'epoch': 8.33}
508
+ {'loss': 0.3962, 'learning_rate': 0.0007980000000000001, 'epoch': 11.11}
509
+ {'loss': 0.3034, 'learning_rate': 0.000998, 'epoch': 13.89}
510
+
511
+
512
+
513
+
514
+
515
+
516
+
517
+
518
+
519
+
520
+
521
+
522
+
523
+
524
+
525
+
526
+
527
+
528
+
529
+
530
+
531
+
532
+
533
+
534
+
535
+
536
+
537
+
538
+
539
+
540
+
541
+
542
+ Configuration saved in ./checkpoint-500/config.json
543
+ Model weights saved in ./checkpoint-500/pytorch_model.bin
544
+ Configuration saved in ./checkpoint-500/preprocessor_config.json
wandb/run-20220126_105847-1xdiy2kf/files/requirements.txt ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ aiohttp==3.8.1
2
+ aiosignal==1.2.0
3
+ appdirs==1.4.4
4
+ async-timeout==4.0.2
5
+ attrs==21.4.0
6
+ audioread==2.1.9
7
+ bitsandbytes-cuda113==0.26.0
8
+ certifi==2021.10.8
9
+ cffi==1.15.0
10
+ charset-normalizer==2.0.10
11
+ click==8.0.3
12
+ clldutils==3.10.1
13
+ colorlog==6.6.0
14
+ configparser==5.2.0
15
+ csvw==1.11.0
16
+ datasets==1.18.1.dev0
17
+ decorator==5.1.1
18
+ dill==0.3.4
19
+ dlinfo==1.2.1
20
+ docker-pycreds==0.4.0
21
+ filelock==3.4.2
22
+ frozenlist==1.3.0
23
+ fsspec==2022.1.0
24
+ gitdb==4.0.9
25
+ gitpython==3.1.26
26
+ huggingface-hub==0.4.0
27
+ hypothesis==6.36.0
28
+ idna==3.3
29
+ isodate==0.6.1
30
+ jiwer==2.3.0
31
+ joblib==1.1.0
32
+ librosa==0.8.1
33
+ llvmlite==0.38.0
34
+ multidict==6.0.2
35
+ multiprocess==0.70.12.2
36
+ numba==0.55.0
37
+ numpy==1.21.5
38
+ packaging==21.3
39
+ pandas==1.4.0
40
+ pathtools==0.1.2
41
+ phonemizer==3.0.1
42
+ pip==21.3.1
43
+ pooch==1.6.0
44
+ promise==2.3
45
+ protobuf==3.19.3
46
+ psutil==5.9.0
47
+ pyarrow==6.0.1
48
+ pycparser==2.21
49
+ pyctcdecode==0.3.0
50
+ pygtrie==2.4.2
51
+ pyparsing==3.0.7
52
+ python-dateutil==2.8.2
53
+ python-levenshtein==0.12.2
54
+ pytz==2021.3
55
+ pyyaml==6.0
56
+ regex==2022.1.18
57
+ requests==2.27.1
58
+ resampy==0.2.2
59
+ rfc3986==2.0.0
60
+ sacremoses==0.0.47
61
+ scikit-learn==1.0.2
62
+ scipy==1.7.3
63
+ segments==2.2.0
64
+ sentry-sdk==1.5.4
65
+ setuptools==60.2.0
66
+ shortuuid==1.0.8
67
+ six==1.16.0
68
+ smmap==5.0.0
69
+ sortedcontainers==2.4.0
70
+ soundfile==0.10.3.post1
71
+ subprocess32==3.5.4
72
+ tabulate==0.8.9
73
+ termcolor==1.1.0
74
+ threadpoolctl==3.0.0
75
+ tokenizers==0.11.4
76
+ torch==1.10.1
77
+ torchaudio==0.10.1
78
+ tqdm==4.62.3
79
+ transformers==4.16.0.dev0
80
+ typing-extensions==4.0.1
81
+ uritemplate==4.1.1
82
+ urllib3==1.26.8
83
+ wandb==0.12.9
84
+ wheel==0.37.1
85
+ xxhash==2.0.2
86
+ yarl==1.7.2
87
+ yaspin==2.1.0
wandb/run-20220126_105847-1xdiy2kf/files/wandb-metadata.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-4.18.0-305.10.2.el8_4.x86_64-x86_64-with-glibc2.28",
3
+ "python": "3.9.6",
4
+ "heartbeatAt": "2022-01-26T15:58:48.495262",
5
+ "startedAt": "2022-01-26T15:58:47.536839",
6
+ "docker": null,
7
+ "gpu": "Tesla V100-PCIE-32GB",
8
+ "gpu_count": 3,
9
+ "cpu_count": 64,
10
+ "cuda": null,
11
+ "args": [
12
+ "--dataset_name=mozilla-foundation/common_voice_7_0",
13
+ "--model_name_or_path=facebook/wav2vec2-xls-r-300m",
14
+ "--dataset_config_name=et",
15
+ "--output_dir=./",
16
+ "--overwrite_output_dir",
17
+ "--num_train_epochs=500",
18
+ "--per_device_train_batch_size=80",
19
+ "--per_device_eval_batch_size=80",
20
+ "--gradient_accumulation_steps=2",
21
+ "--learning_rate=3e-4",
22
+ "--save_total_limit=1",
23
+ "--warmup_steps=500",
24
+ "--evaluation_strategy=steps",
25
+ "--text_column_name=sentence",
26
+ "--length_column_name=input_length",
27
+ "--save_steps=500",
28
+ "--eval_steps=500",
29
+ "--logging_steps=100",
30
+ "--layerdrop=0.0",
31
+ "--freeze_feature_encoder",
32
+ "--feat_proj_dropout=0.1",
33
+ "--chars_to_ignore",
34
+ ",",
35
+ "?",
36
+ ".",
37
+ "!",
38
+ "-",
39
+ ";",
40
+ ":",
41
+ "\"",
42
+ "\u201c",
43
+ "%",
44
+ "\u2018",
45
+ "\u201d",
46
+ "\ufffd",
47
+ "\u2014",
48
+ "\u2019",
49
+ "\u2026",
50
+ "\u2013",
51
+ "--gradient_checkpointing",
52
+ "--lr_scheduler_type=cosine",
53
+ "--fp16",
54
+ "--group_by_length",
55
+ "--mask_time_prob=0.1",
56
+ "--mask_time_length=10",
57
+ "--report_to=wandb",
58
+ "--run_name=cosine+drop_proj+low_specaugment-300M",
59
+ "--do_train",
60
+ "--do_eval",
61
+ "--use_auth_token",
62
+ "--push_to_hub"
63
+ ],
64
+ "state": "running",
65
+ "program": "/home/sagrilaft/Project/audio/xls-r-et/src/run_speech_recognition_ctc_bnb.py",
66
+ "codePath": "src/run_speech_recognition_ctc_bnb.py",
67
+ "git": {
68
+ "remote": "https://huggingface.co/shpotes/xls-r-et",
69
+ "commit": "2a437db2644553c5c9c2b9e81553ed9bdf92207e"
70
+ },
71
+ "email": "shpotes3@gmail.com",
72
+ "root": "/home/sagrilaft/Project/audio/xls-r-et",
73
+ "host": "ganymede.eafit.edu.co",
74
+ "username": "sagrilaft",
75
+ "executable": "/home/sagrilaft/Project/audio/xls-r-et/.venv/bin/python"
76
+ }
wandb/run-20220126_105847-1xdiy2kf/files/wandb-summary.json ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220126_105847-1xdiy2kf/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20220126_105847-1xdiy2kf/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2022-01-26 10:58:47,539 INFO MainThread:2220463 [wandb_setup.py:_flush():71] setting env: {'project': 'xls-r-estonian'}
2
+ 2022-01-26 10:58:47,540 INFO MainThread:2220463 [wandb_setup.py:_flush():71] setting login settings: {}
3
+ 2022-01-26 10:58:47,540 INFO MainThread:2220463 [wandb_init.py:_log_setup():371] Logging user logs to /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/logs/debug.log
4
+ 2022-01-26 10:58:47,540 INFO MainThread:2220463 [wandb_init.py:_log_setup():372] Logging internal logs to /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_105847-1xdiy2kf/logs/debug-internal.log
5
+ 2022-01-26 10:58:47,540 INFO MainThread:2220463 [wandb_init.py:init():404] calling init triggers
6
+ 2022-01-26 10:58:47,541 INFO MainThread:2220463 [wandb_init.py:init():409] wandb.init called with sweep_config: {}
7
+ config: {}
8
+ 2022-01-26 10:58:47,541 INFO MainThread:2220463 [wandb_init.py:init():460] starting backend
9
+ 2022-01-26 10:58:47,541 INFO MainThread:2220463 [backend.py:_multiprocessing_setup():99] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
10
+ 2022-01-26 10:58:47,575 INFO MainThread:2220463 [backend.py:ensure_launched():216] starting backend process...
11
+ 2022-01-26 10:58:47,598 INFO MainThread:2220463 [backend.py:ensure_launched():221] started backend process with pid: 2220828
12
+ 2022-01-26 10:58:47,600 INFO MainThread:2220463 [wandb_init.py:init():469] backend started and connected
13
+ 2022-01-26 10:58:47,604 INFO MainThread:2220463 [wandb_init.py:init():533] updated telemetry
14
+ 2022-01-26 10:58:47,664 INFO MainThread:2220463 [wandb_init.py:init():563] communicating current version
15
+ 2022-01-26 10:58:48,298 INFO MainThread:2220463 [wandb_init.py:init():568] got version response
16
+ 2022-01-26 10:58:48,299 INFO MainThread:2220463 [wandb_init.py:init():578] communicating run to backend with 30 second timeout
17
+ 2022-01-26 10:58:48,488 INFO MainThread:2220463 [wandb_init.py:init():606] starting run threads in backend
18
+ 2022-01-26 10:58:48,534 INFO MainThread:2220463 [wandb_run.py:_console_start():1810] atexit reg
19
+ 2022-01-26 10:58:48,535 INFO MainThread:2220463 [wandb_run.py:_redirect():1684] redirect: SettingsConsole.REDIRECT
20
+ 2022-01-26 10:58:48,536 INFO MainThread:2220463 [wandb_run.py:_redirect():1689] Redirecting console.
21
+ 2022-01-26 10:58:48,541 INFO MainThread:2220463 [wandb_run.py:_redirect():1745] Redirects installed.
22
+ 2022-01-26 10:58:48,541 INFO MainThread:2220463 [wandb_init.py:init():633] run started, returning control to user process
23
+ 2022-01-26 10:58:48,562 INFO MainThread:2220463 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 36, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 39, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.1, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.0, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 80, 'per_device_eval_batch_size': 80, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 0.0003, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 500.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'warmup_ratio': 0.0, 'warmup_steps': 500, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Jan26_10-56-56_ganymede.eafit.edu.co', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 1, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': 'cosine+drop_proj+low_specaugment-300M', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 80, 'eval_batch_size': 80}
24
+ 2022-01-26 10:58:48,565 INFO MainThread:2220463 [wandb_watch.py:watch():43] Watching
wandb/run-20220126_105847-1xdiy2kf/run-1xdiy2kf.wandb ADDED
Binary file (3.49 MB). View file
 
wandb/run-20220126_121554-295enqix/files/config.yaml ADDED
@@ -0,0 +1,649 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ _n_gpu:
4
+ desc: null
5
+ value: 1
6
+ _name_or_path:
7
+ desc: null
8
+ value: facebook/wav2vec2-xls-r-1b
9
+ _wandb:
10
+ desc: null
11
+ value:
12
+ cli_version: 0.12.9
13
+ framework: huggingface
14
+ huggingface_version: 4.16.0.dev0
15
+ is_jupyter_run: false
16
+ is_kaggle_kernel: true
17
+ m:
18
+ - 1: train/global_step
19
+ 6:
20
+ - 3
21
+ python_version: 3.9.6
22
+ start_time: 1643217354
23
+ t:
24
+ 1:
25
+ - 1
26
+ - 5
27
+ - 11
28
+ 3:
29
+ - 13
30
+ 4: 3.9.6
31
+ 5: 0.12.9
32
+ 6: 4.16.0.dev0
33
+ 8:
34
+ - 2
35
+ - 5
36
+ activation_dropout:
37
+ desc: null
38
+ value: 0.0
39
+ adafactor:
40
+ desc: null
41
+ value: false
42
+ adam_beta1:
43
+ desc: null
44
+ value: 0.9
45
+ adam_beta2:
46
+ desc: null
47
+ value: 0.999
48
+ adam_epsilon:
49
+ desc: null
50
+ value: 1.0e-08
51
+ adapter_kernel_size:
52
+ desc: null
53
+ value: 3
54
+ adapter_stride:
55
+ desc: null
56
+ value: 2
57
+ add_adapter:
58
+ desc: null
59
+ value: false
60
+ add_cross_attention:
61
+ desc: null
62
+ value: false
63
+ apply_spec_augment:
64
+ desc: null
65
+ value: true
66
+ architectures:
67
+ desc: null
68
+ value:
69
+ - Wav2Vec2ForPreTraining
70
+ attention_dropout:
71
+ desc: null
72
+ value: 0.0
73
+ bad_words_ids:
74
+ desc: null
75
+ value: null
76
+ bf16:
77
+ desc: null
78
+ value: false
79
+ bf16_full_eval:
80
+ desc: null
81
+ value: false
82
+ bos_token_id:
83
+ desc: null
84
+ value: 1
85
+ chunk_size_feed_forward:
86
+ desc: null
87
+ value: 0
88
+ classifier_proj_size:
89
+ desc: null
90
+ value: 256
91
+ codevector_dim:
92
+ desc: null
93
+ value: 1024
94
+ contrastive_logits_temperature:
95
+ desc: null
96
+ value: 0.1
97
+ conv_bias:
98
+ desc: null
99
+ value: true
100
+ conv_dim:
101
+ desc: null
102
+ value:
103
+ - 512
104
+ - 512
105
+ - 512
106
+ - 512
107
+ - 512
108
+ - 512
109
+ - 512
110
+ conv_kernel:
111
+ desc: null
112
+ value:
113
+ - 10
114
+ - 3
115
+ - 3
116
+ - 3
117
+ - 3
118
+ - 2
119
+ - 2
120
+ conv_stride:
121
+ desc: null
122
+ value:
123
+ - 5
124
+ - 2
125
+ - 2
126
+ - 2
127
+ - 2
128
+ - 2
129
+ - 2
130
+ cross_attention_hidden_size:
131
+ desc: null
132
+ value: null
133
+ ctc_loss_reduction:
134
+ desc: null
135
+ value: mean
136
+ ctc_zero_infinity:
137
+ desc: null
138
+ value: false
139
+ dataloader_drop_last:
140
+ desc: null
141
+ value: false
142
+ dataloader_num_workers:
143
+ desc: null
144
+ value: 0
145
+ dataloader_pin_memory:
146
+ desc: null
147
+ value: true
148
+ ddp_bucket_cap_mb:
149
+ desc: null
150
+ value: None
151
+ ddp_find_unused_parameters:
152
+ desc: null
153
+ value: None
154
+ debug:
155
+ desc: null
156
+ value: '[]'
157
+ decoder_start_token_id:
158
+ desc: null
159
+ value: null
160
+ deepspeed:
161
+ desc: null
162
+ value: None
163
+ disable_tqdm:
164
+ desc: null
165
+ value: false
166
+ diversity_loss_weight:
167
+ desc: null
168
+ value: 0.1
169
+ diversity_penalty:
170
+ desc: null
171
+ value: 0.0
172
+ do_eval:
173
+ desc: null
174
+ value: true
175
+ do_predict:
176
+ desc: null
177
+ value: false
178
+ do_sample:
179
+ desc: null
180
+ value: false
181
+ do_stable_layer_norm:
182
+ desc: null
183
+ value: true
184
+ do_train:
185
+ desc: null
186
+ value: true
187
+ early_stopping:
188
+ desc: null
189
+ value: false
190
+ encoder_no_repeat_ngram_size:
191
+ desc: null
192
+ value: 0
193
+ eos_token_id:
194
+ desc: null
195
+ value: 2
196
+ eval_accumulation_steps:
197
+ desc: null
198
+ value: None
199
+ eval_batch_size:
200
+ desc: null
201
+ value: 48
202
+ eval_steps:
203
+ desc: null
204
+ value: 250
205
+ evaluation_strategy:
206
+ desc: null
207
+ value: steps
208
+ feat_extract_activation:
209
+ desc: null
210
+ value: gelu
211
+ feat_extract_dropout:
212
+ desc: null
213
+ value: 0.0
214
+ feat_extract_norm:
215
+ desc: null
216
+ value: layer
217
+ feat_proj_dropout:
218
+ desc: null
219
+ value: 0.1
220
+ feat_quantizer_dropout:
221
+ desc: null
222
+ value: 0.0
223
+ final_dropout:
224
+ desc: null
225
+ value: 0.0
226
+ finetuning_task:
227
+ desc: null
228
+ value: null
229
+ forced_bos_token_id:
230
+ desc: null
231
+ value: null
232
+ forced_eos_token_id:
233
+ desc: null
234
+ value: null
235
+ fp16:
236
+ desc: null
237
+ value: true
238
+ fp16_backend:
239
+ desc: null
240
+ value: auto
241
+ fp16_full_eval:
242
+ desc: null
243
+ value: false
244
+ fp16_opt_level:
245
+ desc: null
246
+ value: O1
247
+ gradient_accumulation_steps:
248
+ desc: null
249
+ value: 2
250
+ gradient_checkpointing:
251
+ desc: null
252
+ value: true
253
+ greater_is_better:
254
+ desc: null
255
+ value: None
256
+ group_by_length:
257
+ desc: null
258
+ value: true
259
+ half_precision_backend:
260
+ desc: null
261
+ value: amp
262
+ hidden_act:
263
+ desc: null
264
+ value: gelu
265
+ hidden_dropout:
266
+ desc: null
267
+ value: 0.0
268
+ hidden_size:
269
+ desc: null
270
+ value: 1280
271
+ hub_model_id:
272
+ desc: null
273
+ value: None
274
+ hub_strategy:
275
+ desc: null
276
+ value: every_save
277
+ hub_token:
278
+ desc: null
279
+ value: <HUB_TOKEN>
280
+ id2label:
281
+ desc: null
282
+ value:
283
+ '0': LABEL_0
284
+ '1': LABEL_1
285
+ ignore_data_skip:
286
+ desc: null
287
+ value: false
288
+ initializer_range:
289
+ desc: null
290
+ value: 0.02
291
+ intermediate_size:
292
+ desc: null
293
+ value: 5120
294
+ is_decoder:
295
+ desc: null
296
+ value: false
297
+ is_encoder_decoder:
298
+ desc: null
299
+ value: false
300
+ label2id:
301
+ desc: null
302
+ value:
303
+ LABEL_0: 0
304
+ LABEL_1: 1
305
+ label_names:
306
+ desc: null
307
+ value: None
308
+ label_smoothing_factor:
309
+ desc: null
310
+ value: 0.0
311
+ layer_norm_eps:
312
+ desc: null
313
+ value: 1.0e-05
314
+ layerdrop:
315
+ desc: null
316
+ value: 0.0
317
+ learning_rate:
318
+ desc: null
319
+ value: 5.0e-05
320
+ length_column_name:
321
+ desc: null
322
+ value: input_length
323
+ length_penalty:
324
+ desc: null
325
+ value: 1.0
326
+ load_best_model_at_end:
327
+ desc: null
328
+ value: false
329
+ local_rank:
330
+ desc: null
331
+ value: -1
332
+ log_level:
333
+ desc: null
334
+ value: -1
335
+ log_level_replica:
336
+ desc: null
337
+ value: -1
338
+ log_on_each_node:
339
+ desc: null
340
+ value: true
341
+ logging_dir:
342
+ desc: null
343
+ value: ./1B/runs/Jan26_12-15-06_ganymede.eafit.edu.co
344
+ logging_first_step:
345
+ desc: null
346
+ value: false
347
+ logging_nan_inf_filter:
348
+ desc: null
349
+ value: true
350
+ logging_steps:
351
+ desc: null
352
+ value: 100
353
+ logging_strategy:
354
+ desc: null
355
+ value: steps
356
+ lr_scheduler_type:
357
+ desc: null
358
+ value: cosine
359
+ mask_feature_length:
360
+ desc: null
361
+ value: 10
362
+ mask_feature_min_masks:
363
+ desc: null
364
+ value: 0
365
+ mask_feature_prob:
366
+ desc: null
367
+ value: 0.0
368
+ mask_time_length:
369
+ desc: null
370
+ value: 10
371
+ mask_time_min_masks:
372
+ desc: null
373
+ value: 2
374
+ mask_time_prob:
375
+ desc: null
376
+ value: 0.1
377
+ max_grad_norm:
378
+ desc: null
379
+ value: 1.0
380
+ max_length:
381
+ desc: null
382
+ value: 20
383
+ max_steps:
384
+ desc: null
385
+ value: -1
386
+ metric_for_best_model:
387
+ desc: null
388
+ value: None
389
+ min_length:
390
+ desc: null
391
+ value: 0
392
+ model_type:
393
+ desc: null
394
+ value: wav2vec2
395
+ mp_parameters:
396
+ desc: null
397
+ value: ''
398
+ no_cuda:
399
+ desc: null
400
+ value: false
401
+ no_repeat_ngram_size:
402
+ desc: null
403
+ value: 0
404
+ num_adapter_layers:
405
+ desc: null
406
+ value: 3
407
+ num_attention_heads:
408
+ desc: null
409
+ value: 16
410
+ num_beam_groups:
411
+ desc: null
412
+ value: 1
413
+ num_beams:
414
+ desc: null
415
+ value: 1
416
+ num_codevector_groups:
417
+ desc: null
418
+ value: 2
419
+ num_codevectors_per_group:
420
+ desc: null
421
+ value: 320
422
+ num_conv_pos_embedding_groups:
423
+ desc: null
424
+ value: 16
425
+ num_conv_pos_embeddings:
426
+ desc: null
427
+ value: 128
428
+ num_feat_extract_layers:
429
+ desc: null
430
+ value: 7
431
+ num_hidden_layers:
432
+ desc: null
433
+ value: 48
434
+ num_negatives:
435
+ desc: null
436
+ value: 100
437
+ num_return_sequences:
438
+ desc: null
439
+ value: 1
440
+ num_train_epochs:
441
+ desc: null
442
+ value: 100.0
443
+ optim:
444
+ desc: null
445
+ value: adamw_hf
446
+ output_attentions:
447
+ desc: null
448
+ value: false
449
+ output_dir:
450
+ desc: null
451
+ value: ./1B
452
+ output_hidden_size:
453
+ desc: null
454
+ value: 1280
455
+ output_hidden_states:
456
+ desc: null
457
+ value: false
458
+ output_scores:
459
+ desc: null
460
+ value: false
461
+ overwrite_output_dir:
462
+ desc: null
463
+ value: true
464
+ pad_token_id:
465
+ desc: null
466
+ value: 36
467
+ past_index:
468
+ desc: null
469
+ value: -1
470
+ per_device_eval_batch_size:
471
+ desc: null
472
+ value: 48
473
+ per_device_train_batch_size:
474
+ desc: null
475
+ value: 48
476
+ per_gpu_eval_batch_size:
477
+ desc: null
478
+ value: None
479
+ per_gpu_train_batch_size:
480
+ desc: null
481
+ value: None
482
+ prediction_loss_only:
483
+ desc: null
484
+ value: false
485
+ prefix:
486
+ desc: null
487
+ value: null
488
+ problem_type:
489
+ desc: null
490
+ value: null
491
+ proj_codevector_dim:
492
+ desc: null
493
+ value: 1024
494
+ pruned_heads:
495
+ desc: null
496
+ value: {}
497
+ push_to_hub:
498
+ desc: null
499
+ value: false
500
+ push_to_hub_model_id:
501
+ desc: null
502
+ value: None
503
+ push_to_hub_organization:
504
+ desc: null
505
+ value: None
506
+ push_to_hub_token:
507
+ desc: null
508
+ value: <PUSH_TO_HUB_TOKEN>
509
+ remove_invalid_values:
510
+ desc: null
511
+ value: false
512
+ remove_unused_columns:
513
+ desc: null
514
+ value: true
515
+ repetition_penalty:
516
+ desc: null
517
+ value: 1.0
518
+ report_to:
519
+ desc: null
520
+ value: '[''wandb'']'
521
+ resume_from_checkpoint:
522
+ desc: null
523
+ value: None
524
+ return_dict:
525
+ desc: null
526
+ value: true
527
+ return_dict_in_generate:
528
+ desc: null
529
+ value: false
530
+ run_name:
531
+ desc: null
532
+ value: cosine+drop_proj+low_specaugment-1b
533
+ save_on_each_node:
534
+ desc: null
535
+ value: false
536
+ save_steps:
537
+ desc: null
538
+ value: 1000
539
+ save_strategy:
540
+ desc: null
541
+ value: steps
542
+ save_total_limit:
543
+ desc: null
544
+ value: 1
545
+ seed:
546
+ desc: null
547
+ value: 42
548
+ sep_token_id:
549
+ desc: null
550
+ value: null
551
+ sharded_ddp:
552
+ desc: null
553
+ value: '[]'
554
+ skip_memory_metrics:
555
+ desc: null
556
+ value: true
557
+ task_specific_params:
558
+ desc: null
559
+ value: null
560
+ tdnn_dilation:
561
+ desc: null
562
+ value:
563
+ - 1
564
+ - 2
565
+ - 3
566
+ - 1
567
+ - 1
568
+ tdnn_dim:
569
+ desc: null
570
+ value:
571
+ - 512
572
+ - 512
573
+ - 512
574
+ - 512
575
+ - 1500
576
+ tdnn_kernel:
577
+ desc: null
578
+ value:
579
+ - 5
580
+ - 3
581
+ - 3
582
+ - 1
583
+ - 1
584
+ temperature:
585
+ desc: null
586
+ value: 1.0
587
+ tf32:
588
+ desc: null
589
+ value: None
590
+ tie_encoder_decoder:
591
+ desc: null
592
+ value: false
593
+ tie_word_embeddings:
594
+ desc: null
595
+ value: true
596
+ tokenizer_class:
597
+ desc: null
598
+ value: null
599
+ top_k:
600
+ desc: null
601
+ value: 50
602
+ top_p:
603
+ desc: null
604
+ value: 1.0
605
+ torch_dtype:
606
+ desc: null
607
+ value: float32
608
+ torchscript:
609
+ desc: null
610
+ value: false
611
+ tpu_metrics_debug:
612
+ desc: null
613
+ value: false
614
+ tpu_num_cores:
615
+ desc: null
616
+ value: None
617
+ train_batch_size:
618
+ desc: null
619
+ value: 48
620
+ transformers_version:
621
+ desc: null
622
+ value: 4.16.0.dev0
623
+ use_bfloat16:
624
+ desc: null
625
+ value: false
626
+ use_legacy_prediction_loop:
627
+ desc: null
628
+ value: false
629
+ use_weighted_layer_sum:
630
+ desc: null
631
+ value: false
632
+ vocab_size:
633
+ desc: null
634
+ value: 39
635
+ warmup_ratio:
636
+ desc: null
637
+ value: 0.0
638
+ warmup_steps:
639
+ desc: null
640
+ value: 500
641
+ weight_decay:
642
+ desc: null
643
+ value: 0.0
644
+ xpu_backend:
645
+ desc: null
646
+ value: None
647
+ xvector_output_dim:
648
+ desc: null
649
+ value: 512
wandb/run-20220126_121554-295enqix/files/output.log ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+
4
+
5
+
6
+
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+
16
+
17
+
18
+
19
+
20
+
wandb/run-20220126_121554-295enqix/files/requirements.txt ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ aiohttp==3.8.1
2
+ aiosignal==1.2.0
3
+ appdirs==1.4.4
4
+ async-timeout==4.0.2
5
+ attrs==21.4.0
6
+ audioread==2.1.9
7
+ bitsandbytes-cuda113==0.26.0
8
+ certifi==2021.10.8
9
+ cffi==1.15.0
10
+ charset-normalizer==2.0.10
11
+ click==8.0.3
12
+ clldutils==3.10.1
13
+ colorlog==6.6.0
14
+ configparser==5.2.0
15
+ csvw==1.11.0
16
+ datasets==1.18.1.dev0
17
+ decorator==5.1.1
18
+ dill==0.3.4
19
+ dlinfo==1.2.1
20
+ docker-pycreds==0.4.0
21
+ filelock==3.4.2
22
+ frozenlist==1.3.0
23
+ fsspec==2022.1.0
24
+ gitdb==4.0.9
25
+ gitpython==3.1.26
26
+ huggingface-hub==0.4.0
27
+ hypothesis==6.36.0
28
+ idna==3.3
29
+ isodate==0.6.1
30
+ jiwer==2.3.0
31
+ joblib==1.1.0
32
+ librosa==0.8.1
33
+ llvmlite==0.38.0
34
+ multidict==6.0.2
35
+ multiprocess==0.70.12.2
36
+ numba==0.55.0
37
+ numpy==1.21.5
38
+ packaging==21.3
39
+ pandas==1.4.0
40
+ pathtools==0.1.2
41
+ phonemizer==3.0.1
42
+ pip==21.3.1
43
+ pooch==1.6.0
44
+ promise==2.3
45
+ protobuf==3.19.3
46
+ psutil==5.9.0
47
+ pyarrow==6.0.1
48
+ pycparser==2.21
49
+ pyctcdecode==0.3.0
50
+ pygtrie==2.4.2
51
+ pyparsing==3.0.7
52
+ python-dateutil==2.8.2
53
+ python-levenshtein==0.12.2
54
+ pytz==2021.3
55
+ pyyaml==6.0
56
+ regex==2022.1.18
57
+ requests==2.27.1
58
+ resampy==0.2.2
59
+ rfc3986==2.0.0
60
+ sacremoses==0.0.47
61
+ scikit-learn==1.0.2
62
+ scipy==1.7.3
63
+ segments==2.2.0
64
+ sentry-sdk==1.5.4
65
+ setuptools==60.2.0
66
+ shortuuid==1.0.8
67
+ six==1.16.0
68
+ smmap==5.0.0
69
+ sortedcontainers==2.4.0
70
+ soundfile==0.10.3.post1
71
+ subprocess32==3.5.4
72
+ tabulate==0.8.9
73
+ termcolor==1.1.0
74
+ threadpoolctl==3.0.0
75
+ tokenizers==0.11.4
76
+ torch==1.10.1
77
+ torchaudio==0.10.1
78
+ tqdm==4.62.3
79
+ transformers==4.16.0.dev0
80
+ typing-extensions==4.0.1
81
+ uritemplate==4.1.1
82
+ urllib3==1.26.8
83
+ wandb==0.12.9
84
+ wheel==0.37.1
85
+ xxhash==2.0.2
86
+ yarl==1.7.2
87
+ yaspin==2.1.0
wandb/run-20220126_121554-295enqix/files/wandb-metadata.json ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-4.18.0-305.10.2.el8_4.x86_64-x86_64-with-glibc2.28",
3
+ "python": "3.9.6",
4
+ "heartbeatAt": "2022-01-26T17:15:55.285233",
5
+ "startedAt": "2022-01-26T17:15:54.341820",
6
+ "docker": null,
7
+ "gpu": "Tesla V100-PCIE-32GB",
8
+ "gpu_count": 3,
9
+ "cpu_count": 64,
10
+ "cuda": null,
11
+ "args": [
12
+ "--dataset_name=mozilla-foundation/common_voice_7_0",
13
+ "--model_name_or_path=facebook/wav2vec2-xls-r-1b",
14
+ "--dataset_config_name=et",
15
+ "--output_dir=./1B",
16
+ "--overwrite_output_dir",
17
+ "--num_train_epochs=100",
18
+ "--per_device_train_batch_size=48",
19
+ "--per_device_eval_batch_size=48",
20
+ "--gradient_accumulation_steps=2",
21
+ "--learning_rate=5e-5",
22
+ "--save_total_limit=1",
23
+ "--warmup_steps=500",
24
+ "--evaluation_strategy=steps",
25
+ "--text_column_name=sentence",
26
+ "--length_column_name=input_length",
27
+ "--save_steps=1000",
28
+ "--eval_steps=250",
29
+ "--logging_steps=100",
30
+ "--layerdrop=0.0",
31
+ "--freeze_feature_encoder",
32
+ "--feat_proj_dropout=0.1",
33
+ "--chars_to_ignore",
34
+ ",",
35
+ "?",
36
+ ".",
37
+ "!",
38
+ "-",
39
+ ";",
40
+ ":",
41
+ "\"",
42
+ "\u201c",
43
+ "%",
44
+ "\u2018",
45
+ "\u201d",
46
+ "\ufffd",
47
+ "\u2014",
48
+ "\u2019",
49
+ "\u2026",
50
+ "\u2013",
51
+ "--gradient_checkpointing",
52
+ "--lr_scheduler_type=cosine",
53
+ "--fp16",
54
+ "--group_by_length",
55
+ "--mask_time_prob=0.1",
56
+ "--mask_time_length=10",
57
+ "--report_to=wandb",
58
+ "--run_name=cosine+drop_proj+low_specaugment-1b",
59
+ "--do_train",
60
+ "--do_eval"
61
+ ],
62
+ "state": "running",
63
+ "program": "/home/sagrilaft/Project/audio/xls-r-et/src/run_speech_recognition_ctc_bnb.py",
64
+ "codePath": "src/run_speech_recognition_ctc_bnb.py",
65
+ "git": {
66
+ "remote": "https://huggingface.co/shpotes/xls-r-et",
67
+ "commit": "2a437db2644553c5c9c2b9e81553ed9bdf92207e"
68
+ },
69
+ "email": "shpotes3@gmail.com",
70
+ "root": "/home/sagrilaft/Project/audio/xls-r-et",
71
+ "host": "ganymede.eafit.edu.co",
72
+ "username": "sagrilaft",
73
+ "executable": "/home/sagrilaft/Project/audio/xls-r-et/.venv/bin/python"
74
+ }
wandb/run-20220126_121554-295enqix/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
wandb/run-20220126_121554-295enqix/logs/debug-internal.log ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2022-01-26 12:15:54,828 INFO MainThread:2226380 [internal.py:wandb_internal():87] W&B internal server running at pid: 2226380, started at: 2022-01-26 12:15:54.828545
2
+ 2022-01-26 12:15:54,831 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: check_version
3
+ 2022-01-26 12:15:54,831 INFO WriterThread:2226380 [datastore.py:open_for_write():77] open: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/run-295enqix.wandb
4
+ 2022-01-26 12:15:54,833 DEBUG SenderThread:2226380 [sender.py:send():234] send: header
5
+ 2022-01-26 12:15:54,834 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: check_version
6
+ 2022-01-26 12:15:55,103 DEBUG SenderThread:2226380 [sender.py:send():234] send: run
7
+ 2022-01-26 12:15:55,276 INFO SenderThread:2226380 [dir_watcher.py:__init__():169] watching files in: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files
8
+ 2022-01-26 12:15:55,276 INFO SenderThread:2226380 [sender.py:_start_run_threads():804] run started: 295enqix with start time 1643217354
9
+ 2022-01-26 12:15:55,276 DEBUG SenderThread:2226380 [sender.py:send():234] send: summary
10
+ 2022-01-26 12:15:55,276 INFO SenderThread:2226380 [sender.py:_save_file():939] saving file wandb-summary.json with policy end
11
+ 2022-01-26 12:15:55,278 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: run_start
12
+ 2022-01-26 12:15:55,284 DEBUG HandlerThread:2226380 [meta.py:__init__():40] meta init
13
+ 2022-01-26 12:15:55,285 DEBUG HandlerThread:2226380 [meta.py:__init__():54] meta init done
14
+ 2022-01-26 12:15:55,285 DEBUG HandlerThread:2226380 [meta.py:probe():214] probe
15
+ 2022-01-26 12:15:55,291 DEBUG HandlerThread:2226380 [meta.py:_setup_git():204] setup git
16
+ 2022-01-26 12:15:55,309 DEBUG HandlerThread:2226380 [meta.py:_setup_git():211] setup git done
17
+ 2022-01-26 12:15:55,309 DEBUG HandlerThread:2226380 [meta.py:_save_pip():58] save pip
18
+ 2022-01-26 12:15:55,309 DEBUG HandlerThread:2226380 [meta.py:_save_pip():72] save pip done
19
+ 2022-01-26 12:15:55,309 DEBUG HandlerThread:2226380 [meta.py:probe():252] probe done
20
+ 2022-01-26 12:15:55,313 DEBUG SenderThread:2226380 [sender.py:send():234] send: files
21
+ 2022-01-26 12:15:55,313 INFO SenderThread:2226380 [sender.py:_save_file():939] saving file wandb-metadata.json with policy now
22
+ 2022-01-26 12:15:55,322 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
23
+ 2022-01-26 12:15:55,323 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
24
+ 2022-01-26 12:15:55,460 DEBUG SenderThread:2226380 [sender.py:send():234] send: config
25
+ 2022-01-26 12:15:55,461 DEBUG SenderThread:2226380 [sender.py:send():234] send: metric
26
+ 2022-01-26 12:15:55,462 DEBUG SenderThread:2226380 [sender.py:send():234] send: metric
27
+ 2022-01-26 12:15:55,462 WARNING SenderThread:2226380 [sender.py:send_metric():897] Seen metric with glob (shouldnt happen)
28
+ 2022-01-26 12:15:55,937 INFO Thread-11 :2226380 [upload_job.py:push():137] Uploaded file /tmp/tmp0kjyvd1nwandb/sa83kpbt-wandb-metadata.json
29
+ 2022-01-26 12:15:56,277 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_created():217] file/dir created: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/wandb-metadata.json
30
+ 2022-01-26 12:15:56,278 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_created():217] file/dir created: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/requirements.txt
31
+ 2022-01-26 12:15:56,278 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_created():217] file/dir created: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
32
+ 2022-01-26 12:15:56,278 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_created():217] file/dir created: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/wandb-summary.json
33
+ 2022-01-26 12:15:58,277 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
34
+ 2022-01-26 12:16:10,577 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
35
+ 2022-01-26 12:16:10,577 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
36
+ 2022-01-26 12:16:16,285 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
37
+ 2022-01-26 12:16:24,276 DEBUG SenderThread:2226380 [sender.py:send():234] send: stats
38
+ 2022-01-26 12:16:25,718 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
39
+ 2022-01-26 12:16:25,719 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
40
+ 2022-01-26 12:16:26,289 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/config.yaml
41
+ 2022-01-26 12:16:30,291 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
42
+ 2022-01-26 12:16:40,861 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
43
+ 2022-01-26 12:16:40,862 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
44
+ 2022-01-26 12:16:44,298 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
45
+ 2022-01-26 12:16:55,255 DEBUG SenderThread:2226380 [sender.py:send():234] send: stats
46
+ 2022-01-26 12:16:56,119 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
47
+ 2022-01-26 12:16:56,119 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
48
+ 2022-01-26 12:16:56,303 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
49
+ 2022-01-26 12:17:06,308 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
50
+ 2022-01-26 12:17:11,395 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
51
+ 2022-01-26 12:17:11,395 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
52
+ 2022-01-26 12:17:16,312 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
53
+ 2022-01-26 12:17:26,266 DEBUG SenderThread:2226380 [sender.py:send():234] send: stats
54
+ 2022-01-26 12:17:26,317 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
55
+ 2022-01-26 12:17:26,631 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
56
+ 2022-01-26 12:17:26,632 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
57
+ 2022-01-26 12:17:34,321 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
58
+ 2022-01-26 12:17:41,857 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
59
+ 2022-01-26 12:17:41,858 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
60
+ 2022-01-26 12:17:42,325 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
61
+ 2022-01-26 12:17:50,329 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
62
+ 2022-01-26 12:17:56,331 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
63
+ 2022-01-26 12:17:57,090 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
64
+ 2022-01-26 12:17:57,090 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
65
+ 2022-01-26 12:17:57,233 DEBUG SenderThread:2226380 [sender.py:send():234] send: stats
66
+ 2022-01-26 12:18:02,334 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
67
+ 2022-01-26 12:18:08,337 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
68
+ 2022-01-26 12:18:12,358 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
69
+ 2022-01-26 12:18:12,359 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
70
+ 2022-01-26 12:18:13,339 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
71
+ 2022-01-26 12:18:27,555 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
72
+ 2022-01-26 12:18:27,555 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
73
+ 2022-01-26 12:18:28,215 DEBUG SenderThread:2226380 [sender.py:send():234] send: stats
74
+ 2022-01-26 12:18:31,347 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
75
+ 2022-01-26 12:18:42,695 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
76
+ 2022-01-26 12:18:42,695 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
77
+ 2022-01-26 12:18:45,354 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
78
+ 2022-01-26 12:18:57,952 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
79
+ 2022-01-26 12:18:57,952 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
80
+ 2022-01-26 12:18:59,199 DEBUG SenderThread:2226380 [sender.py:send():234] send: stats
81
+ 2022-01-26 12:18:59,360 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
82
+ 2022-01-26 12:19:11,366 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
83
+ 2022-01-26 12:19:13,205 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
84
+ 2022-01-26 12:19:13,206 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
85
+ 2022-01-26 12:19:23,373 INFO Thread-8 :2226380 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/files/output.log
86
+ 2022-01-26 12:19:28,370 DEBUG HandlerThread:2226380 [handler.py:handle_request():130] handle_request: stop_status
87
+ 2022-01-26 12:19:28,371 DEBUG SenderThread:2226380 [sender.py:send_request():248] send_request: stop_status
wandb/run-20220126_121554-295enqix/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2022-01-26 12:15:54,344 INFO MainThread:2226158 [wandb_setup.py:_flush():71] setting env: {'project': 'xls-r-estonian'}
2
+ 2022-01-26 12:15:54,344 INFO MainThread:2226158 [wandb_setup.py:_flush():71] setting login settings: {}
3
+ 2022-01-26 12:15:54,345 INFO MainThread:2226158 [wandb_init.py:_log_setup():371] Logging user logs to /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/logs/debug.log
4
+ 2022-01-26 12:15:54,345 INFO MainThread:2226158 [wandb_init.py:_log_setup():372] Logging internal logs to /home/sagrilaft/Project/audio/xls-r-et/wandb/run-20220126_121554-295enqix/logs/debug-internal.log
5
+ 2022-01-26 12:15:54,345 INFO MainThread:2226158 [wandb_init.py:init():404] calling init triggers
6
+ 2022-01-26 12:15:54,346 INFO MainThread:2226158 [wandb_init.py:init():409] wandb.init called with sweep_config: {}
7
+ config: {}
8
+ 2022-01-26 12:15:54,346 INFO MainThread:2226158 [wandb_init.py:init():460] starting backend
9
+ 2022-01-26 12:15:54,346 INFO MainThread:2226158 [backend.py:_multiprocessing_setup():99] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
10
+ 2022-01-26 12:15:54,373 INFO MainThread:2226158 [backend.py:ensure_launched():216] starting backend process...
11
+ 2022-01-26 12:15:54,395 INFO MainThread:2226158 [backend.py:ensure_launched():221] started backend process with pid: 2226380
12
+ 2022-01-26 12:15:54,396 INFO MainThread:2226158 [wandb_init.py:init():469] backend started and connected
13
+ 2022-01-26 12:15:54,401 INFO MainThread:2226158 [wandb_init.py:init():533] updated telemetry
14
+ 2022-01-26 12:15:54,459 INFO MainThread:2226158 [wandb_init.py:init():563] communicating current version
15
+ 2022-01-26 12:15:55,101 INFO MainThread:2226158 [wandb_init.py:init():568] got version response
16
+ 2022-01-26 12:15:55,101 INFO MainThread:2226158 [wandb_init.py:init():578] communicating run to backend with 30 second timeout
17
+ 2022-01-26 12:15:55,277 INFO MainThread:2226158 [wandb_init.py:init():606] starting run threads in backend
18
+ 2022-01-26 12:15:55,320 INFO MainThread:2226158 [wandb_run.py:_console_start():1810] atexit reg
19
+ 2022-01-26 12:15:55,321 INFO MainThread:2226158 [wandb_run.py:_redirect():1684] redirect: SettingsConsole.REDIRECT
20
+ 2022-01-26 12:15:55,322 INFO MainThread:2226158 [wandb_run.py:_redirect():1689] Redirecting console.
21
+ 2022-01-26 12:15:55,325 INFO MainThread:2226158 [wandb_run.py:_redirect():1745] Redirects installed.
22
+ 2022-01-26 12:15:55,325 INFO MainThread:2226158 [wandb_init.py:init():633] run started, returning control to user process
23
+ 2022-01-26 12:15:55,341 INFO MainThread:2226158 [wandb_run.py:_config_callback():956] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 36, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-1b', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1280, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 48, 'intermediate_size': 5120, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'feat_proj_dropout': 0.1, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 39, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.1, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.0, 'mask_feature_length': 10, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 1024, 'proj_codevector_dim': 1024, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1280, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './1B', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 48, 'per_device_eval_batch_size': 48, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 2, 'eval_accumulation_steps': 'None', 'learning_rate': 5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 100.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'warmup_ratio': 0.0, 'warmup_steps': 500, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './1B/runs/Jan26_12-15-06_ganymede.eafit.edu.co', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 1000, 'save_total_limit': 1, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 250, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': 'cosine+drop_proj+low_specaugment-1b', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['wandb']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 48, 'eval_batch_size': 48}
24
+ 2022-01-26 12:15:55,344 INFO MainThread:2226158 [wandb_watch.py:watch():43] Watching
wandb/run-20220126_121554-295enqix/run-295enqix.wandb ADDED
Binary file (13.1 kB). View file