nguyenvulebinh
committed on
Commit
•
efb533c
1
Parent(s):
f43567e
add model voice-filter
Browse files
- config.json +3 -32
- pytorch_model.bin +2 -2
- xvector_sincnet.pt +0 -3
config.json
CHANGED
@@ -1,20 +1,8 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "./model-bin/voice_enhancing",
|
3 |
"architectures": [
|
4 |
-
"
|
5 |
],
|
6 |
"audio_max_lengh": 20,
|
7 |
-
"blank_token_id": 30,
|
8 |
-
"ctc_zero_infinity": true,
|
9 |
-
"d_dec": 640,
|
10 |
-
"d_enc": 256,
|
11 |
-
"d_inner": 0,
|
12 |
-
"dec_drop": 0.2,
|
13 |
-
"do_asr": false,
|
14 |
-
"do_enh": true,
|
15 |
-
"dropout": 0.2,
|
16 |
-
"emb_drop": 0.2,
|
17 |
-
"enc_drop": 0.2,
|
18 |
"enh_args": {
|
19 |
"batch_size": 8,
|
20 |
"batch_type": "folded",
|
@@ -104,25 +92,8 @@
|
|
104 |
"xvector_emb_dim": 512
|
105 |
},
|
106 |
"enh_chunk_size": 5,
|
107 |
-
"
|
108 |
-
"freq_std": 2,
|
109 |
-
"ignore_token_id": -1,
|
110 |
-
"label_smooth": 0.1,
|
111 |
-
"loss_reduction": "mean",
|
112 |
-
"model_type": "asr_voicefilter",
|
113 |
-
"n_classes_ctc": 33,
|
114 |
-
"n_classes_s2s": 5003,
|
115 |
-
"n_dec": 1,
|
116 |
-
"n_enc": 16,
|
117 |
-
"n_fft": 512,
|
118 |
-
"n_head": 4,
|
119 |
-
"n_kernel": 25,
|
120 |
-
"n_mels": 80,
|
121 |
"sample_rate": 16000,
|
122 |
-
"shared_emb": true,
|
123 |
-
"teacher_force": 0.7,
|
124 |
-
"time_ds": 1,
|
125 |
"torch_dtype": "float32",
|
126 |
-
"transformers_version": "4.
|
127 |
-
"use_cnn": true
|
128 |
}
|
|
|
1 |
{
|
|
|
2 |
"architectures": [
|
3 |
+
"VoiceFilter"
|
4 |
],
|
5 |
"audio_max_lengh": 20,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
"enh_args": {
|
7 |
"batch_size": 8,
|
8 |
"batch_type": "folded",
|
|
|
92 |
"xvector_emb_dim": 512
|
93 |
},
|
94 |
"enh_chunk_size": 5,
|
95 |
+
"model_type": "voicefilter",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
96 |
"sample_rate": 16000,
|
|
|
|
|
|
|
97 |
"torch_dtype": "float32",
|
98 |
+
"transformers_version": "4.25.1"
|
|
|
99 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:493efe8f21ce5d9ca8aff7b9b9700f03883f64ba453ca2be4cf7c389445fe151
|
3 |
+
size 217276167
|
xvector_sincnet.pt
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:4bcec986de13da7af7ac88736572692359950df63669989c4f78b294934c9089
|
3 |
-
size 96383626
|
|
|
|
|
|
|
|