Training in progress, step 1000
Browse files- config.json +63 -135
- model.safetensors +2 -2
- preprocessor_config.json +7 -10
- runs/Jun01_16-38-57_dn001/events.out.tfevents.1717245539.dn001.984470.0 +3 -0
- runs/Jun01_16-48-57_dn001/events.out.tfevents.1717246139.dn001.984470.2 +3 -0
- runs/May31_13-48-33_dn001/events.out.tfevents.1717148915.dn001.910825.0 +2 -2
- runs/May31_15-49-38_dn001/events.out.tfevents.1717156179.dn001.917884.0 +3 -0
- runs/May31_16-19-24_dn001/events.out.tfevents.1717157981.dn001.917884.1 +3 -0
- runs/May31_16-24-36_dn001/events.out.tfevents.1717158283.dn001.917884.2 +3 -0
- runs/May31_16-27-24_dn001/events.out.tfevents.1717158446.dn001.917884.3 +3 -0
- runs/May31_16-33-03_dn001/events.out.tfevents.1717158785.dn001.917884.4 +3 -0
- runs/May31_16-41-56_dn001/events.out.tfevents.1717159317.dn001.917884.5 +3 -0
- runs/May31_16-47-30_dn001/events.out.tfevents.1717159659.dn001.917884.6 +3 -0
- runs/May31_16-47-30_dn001/events.out.tfevents.1717159751.dn001.917884.7 +3 -0
- runs/May31_17-14-02_dn001/events.out.tfevents.1717161243.dn001.917884.8 +3 -0
- training_args.bin +2 -2
config.json
CHANGED
@@ -1,154 +1,82 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.0,
|
4 |
-
"
|
|
|
|
|
|
|
5 |
"apply_spec_augment": false,
|
6 |
"architectures": [
|
7 |
-
"
|
8 |
],
|
9 |
"attention_dropout": 0.0,
|
10 |
-
"
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
"
|
15 |
-
"
|
16 |
-
"
|
17 |
-
"
|
18 |
-
"
|
19 |
-
"
|
20 |
-
"
|
21 |
-
"
|
22 |
-
"
|
23 |
-
"
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
],
|
33 |
-
[
|
34 |
-
2,
|
35 |
-
50359
|
36 |
-
],
|
37 |
-
[
|
38 |
-
3,
|
39 |
-
50363
|
40 |
-
]
|
41 |
-
],
|
42 |
-
"init_std": 0.02,
|
43 |
-
"is_encoder_decoder": true,
|
44 |
"mask_feature_length": 10,
|
45 |
"mask_feature_min_masks": 0,
|
46 |
"mask_feature_prob": 0.0,
|
47 |
"mask_time_length": 10,
|
48 |
"mask_time_min_masks": 2,
|
49 |
-
"mask_time_prob": 0.
|
50 |
-
"
|
51 |
-
"
|
52 |
-
"
|
53 |
-
"
|
54 |
-
"
|
|
|
55 |
"num_hidden_layers": 24,
|
56 |
-
"
|
57 |
-
"
|
58 |
-
"
|
59 |
-
"
|
|
|
|
|
|
|
|
|
60 |
1,
|
61 |
2,
|
62 |
-
|
63 |
-
|
64 |
-
|
65 |
-
|
66 |
-
|
67 |
-
|
68 |
-
|
69 |
-
|
70 |
-
|
71 |
-
|
72 |
-
|
73 |
-
|
74 |
-
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
90,
|
80 |
-
91,
|
81 |
-
92,
|
82 |
-
93,
|
83 |
-
359,
|
84 |
-
503,
|
85 |
-
522,
|
86 |
-
542,
|
87 |
-
873,
|
88 |
-
893,
|
89 |
-
902,
|
90 |
-
918,
|
91 |
-
922,
|
92 |
-
931,
|
93 |
-
1350,
|
94 |
-
1853,
|
95 |
-
1982,
|
96 |
-
2460,
|
97 |
-
2627,
|
98 |
-
3246,
|
99 |
-
3253,
|
100 |
-
3268,
|
101 |
-
3536,
|
102 |
-
3846,
|
103 |
-
3961,
|
104 |
-
4183,
|
105 |
-
4667,
|
106 |
-
6585,
|
107 |
-
6647,
|
108 |
-
7273,
|
109 |
-
9061,
|
110 |
-
9383,
|
111 |
-
10428,
|
112 |
-
10929,
|
113 |
-
11938,
|
114 |
-
12033,
|
115 |
-
12331,
|
116 |
-
12562,
|
117 |
-
13793,
|
118 |
-
14157,
|
119 |
-
14635,
|
120 |
-
15265,
|
121 |
-
15618,
|
122 |
-
16553,
|
123 |
-
16604,
|
124 |
-
18362,
|
125 |
-
18956,
|
126 |
-
20075,
|
127 |
-
21675,
|
128 |
-
22520,
|
129 |
-
26130,
|
130 |
-
26161,
|
131 |
-
26435,
|
132 |
-
28279,
|
133 |
-
29464,
|
134 |
-
31650,
|
135 |
-
32302,
|
136 |
-
32470,
|
137 |
-
36865,
|
138 |
-
42863,
|
139 |
-
47425,
|
140 |
-
49870,
|
141 |
-
50254,
|
142 |
-
50258,
|
143 |
-
50358,
|
144 |
-
50359,
|
145 |
-
50360,
|
146 |
-
50361,
|
147 |
-
50362
|
148 |
],
|
149 |
"torch_dtype": "float32",
|
150 |
"transformers_version": "4.41.1",
|
151 |
-
"
|
152 |
"use_weighted_layer_sum": false,
|
153 |
-
"vocab_size":
|
|
|
154 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "facebook/w2v-bert-2.0",
|
3 |
"activation_dropout": 0.0,
|
4 |
+
"adapter_act": "relu",
|
5 |
+
"adapter_kernel_size": 3,
|
6 |
+
"adapter_stride": 2,
|
7 |
+
"add_adapter": true,
|
8 |
"apply_spec_augment": false,
|
9 |
"architectures": [
|
10 |
+
"Wav2Vec2BertForCTC"
|
11 |
],
|
12 |
"attention_dropout": 0.0,
|
13 |
+
"bos_token_id": 1,
|
14 |
+
"classifier_proj_size": 768,
|
15 |
+
"codevector_dim": 768,
|
16 |
+
"conformer_conv_dropout": 0.1,
|
17 |
+
"contrastive_logits_temperature": 0.1,
|
18 |
+
"conv_depthwise_kernel_size": 31,
|
19 |
+
"ctc_loss_reduction": "mean",
|
20 |
+
"ctc_zero_infinity": false,
|
21 |
+
"diversity_loss_weight": 0.1,
|
22 |
+
"eos_token_id": 2,
|
23 |
+
"feat_proj_dropout": 0.0,
|
24 |
+
"feat_quantizer_dropout": 0.0,
|
25 |
+
"feature_projection_input_dim": 160,
|
26 |
+
"final_dropout": 0.1,
|
27 |
+
"hidden_act": "swish",
|
28 |
+
"hidden_dropout": 0.0,
|
29 |
+
"hidden_size": 1024,
|
30 |
+
"initializer_range": 0.02,
|
31 |
+
"intermediate_size": 4096,
|
32 |
+
"layer_norm_eps": 1e-05,
|
33 |
+
"layerdrop": 0.0,
|
34 |
+
"left_max_position_embeddings": 64,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
35 |
"mask_feature_length": 10,
|
36 |
"mask_feature_min_masks": 0,
|
37 |
"mask_feature_prob": 0.0,
|
38 |
"mask_time_length": 10,
|
39 |
"mask_time_min_masks": 2,
|
40 |
+
"mask_time_prob": 0.0,
|
41 |
+
"max_source_positions": 5000,
|
42 |
+
"model_type": "wav2vec2-bert",
|
43 |
+
"num_adapter_layers": 1,
|
44 |
+
"num_attention_heads": 16,
|
45 |
+
"num_codevector_groups": 2,
|
46 |
+
"num_codevectors_per_group": 320,
|
47 |
"num_hidden_layers": 24,
|
48 |
+
"num_negatives": 100,
|
49 |
+
"output_hidden_size": 1024,
|
50 |
+
"pad_token_id": 14,
|
51 |
+
"position_embeddings_type": "relative_key",
|
52 |
+
"proj_codevector_dim": 768,
|
53 |
+
"right_max_position_embeddings": 8,
|
54 |
+
"rotary_embedding_base": 10000,
|
55 |
+
"tdnn_dilation": [
|
56 |
1,
|
57 |
2,
|
58 |
+
3,
|
59 |
+
1,
|
60 |
+
1
|
61 |
+
],
|
62 |
+
"tdnn_dim": [
|
63 |
+
512,
|
64 |
+
512,
|
65 |
+
512,
|
66 |
+
512,
|
67 |
+
1500
|
68 |
+
],
|
69 |
+
"tdnn_kernel": [
|
70 |
+
5,
|
71 |
+
3,
|
72 |
+
3,
|
73 |
+
1,
|
74 |
+
1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
75 |
],
|
76 |
"torch_dtype": "float32",
|
77 |
"transformers_version": "4.41.1",
|
78 |
+
"use_intermediate_ffn_before_adapter": false,
|
79 |
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 17,
|
81 |
+
"xvector_output_dim": 512
|
82 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:594874eb0f7c44449ace15783df7baef4e67935884a768920d5ceba64bce0115
|
3 |
+
size 2422884252
|
preprocessor_config.json
CHANGED
@@ -1,14 +1,11 @@
|
|
1 |
{
|
2 |
-
"
|
3 |
-
"feature_extractor_type": "WhisperFeatureExtractor",
|
4 |
"feature_size": 80,
|
5 |
-
"
|
6 |
-
"n_fft": 400,
|
7 |
-
"n_samples": 480000,
|
8 |
-
"nb_max_frames": 3000,
|
9 |
"padding_side": "right",
|
10 |
-
"padding_value":
|
11 |
-
"processor_class": "
|
12 |
-
"return_attention_mask":
|
13 |
-
"sampling_rate": 16000
|
|
|
14 |
}
|
|
|
1 |
{
|
2 |
+
"feature_extractor_type": "SeamlessM4TFeatureExtractor",
|
|
|
3 |
"feature_size": 80,
|
4 |
+
"num_mel_bins": 80,
|
|
|
|
|
|
|
5 |
"padding_side": "right",
|
6 |
+
"padding_value": 1,
|
7 |
+
"processor_class": "Wav2Vec2BertProcessor",
|
8 |
+
"return_attention_mask": true,
|
9 |
+
"sampling_rate": 16000,
|
10 |
+
"stride": 2
|
11 |
}
|
runs/Jun01_16-38-57_dn001/events.out.tfevents.1717245539.dn001.984470.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92bf6c5a280c50a04fca582167815832f1347fb5bca7efdef24ff1f2c8ac0978
|
3 |
+
size 6068
|
runs/Jun01_16-48-57_dn001/events.out.tfevents.1717246139.dn001.984470.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d480e6d099076f87fbc1693afaff5c2fbf1a7924d21a75bdad7959ff59ae837
|
3 |
+
size 13336
|
runs/May31_13-48-33_dn001/events.out.tfevents.1717148915.dn001.910825.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be2ad8c73f28a98538c131717a4f72850b4be8eec3cd431cfcaf46d988f7a495
|
3 |
+
size 34803
|
runs/May31_15-49-38_dn001/events.out.tfevents.1717156179.dn001.917884.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8755044d411142c0eaacc685c3de3f8e5da71cde572fe97630113a82563763eb
|
3 |
+
size 9221
|
runs/May31_16-19-24_dn001/events.out.tfevents.1717157981.dn001.917884.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22d8e07b6486ebb083d43d79afe11ee1b9be51d095859ee714336fa993e80a24
|
3 |
+
size 6068
|
runs/May31_16-24-36_dn001/events.out.tfevents.1717158283.dn001.917884.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89decf9201ce2dc70ce1d7dee094e3d23c1056fdd97d85c5707be1658f11924d
|
3 |
+
size 6068
|
runs/May31_16-27-24_dn001/events.out.tfevents.1717158446.dn001.917884.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:033cf34efd8aa0b4a43fa10fe5115b4c274fffcab69389869880395fd5890229
|
3 |
+
size 6068
|
runs/May31_16-33-03_dn001/events.out.tfevents.1717158785.dn001.917884.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:626d4fedf5630c49ba5bd5c6ba61f31fa6707a2b17bc6e40e7aa7c56a56fcc39
|
3 |
+
size 6068
|
runs/May31_16-41-56_dn001/events.out.tfevents.1717159317.dn001.917884.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b38d16340c99f068610117aa57460c595b09611c880aa4c0f11108714f3a394
|
3 |
+
size 6065
|
runs/May31_16-47-30_dn001/events.out.tfevents.1717159659.dn001.917884.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2793f5cb3e640f96ee438f1ebc8c9957398bb1e98e11f8f872e97305a57aaf84
|
3 |
+
size 6065
|
runs/May31_16-47-30_dn001/events.out.tfevents.1717159751.dn001.917884.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ffa6a531385f288cdc8c877d9b839f8a67aabf6d08a00e911dababdf411fc54
|
3 |
+
size 6065
|
runs/May31_17-14-02_dn001/events.out.tfevents.1717161243.dn001.917884.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c550ca7bd401335e7a90f2552a2ada2a92fa6041abaacc92e525522970cc8d6
|
3 |
+
size 6068
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ced86ba208755db4360e15b144b19529e1d21ed980204e83101764ad038626e9
|
3 |
+
size 5048
|