mvijay97 committed on
Commit
c215727
1 Parent(s): 67d6442

Add model files

Browse files
.DS_Store ADDED
Binary file (6.15 kB). View file
 
RESULTS.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Sat Mar 19 15:43:43 UTC 2022`
5
+ - python version: `3.9.10 | packaged by conda-forge | (main, Feb 1 2022, 21:24:11) [GCC 9.4.0]`
6
+ - espnet version: `espnet 0.10.7a1`
7
+ - pytorch version: `pytorch 1.10.1`
8
+ - Git hash: `d9691d77b34124627f53942fe906077adc4a4e69`
9
+ - Commit date: `Thu Mar 17 15:50:03 2022 -0400`
10
+
11
+ ## asr_train_asr_conformer5_raw_bpe150_sp
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |decode_asr_asr_model_valid.acc.ave/test|515|2941|80.6|17.1|2.4|10.1|29.5|61.4|
17
+ |decode_asr_asr_model_valid.acc.ave/valid|480|3127|86.8|12.2|1.0|1.5|14.7|57.3|
18
+
19
+ ### CER
20
+
21
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
22
+ |---|---|---|---|---|---|---|---|---|
23
+ |decode_asr_asr_model_valid.acc.ave/test|515|16056|92.3|3.8|3.9|2.4|10.1|61.4|
24
+ |decode_asr_asr_model_valid.acc.ave/valid|480|15986|96.4|0.5|3.1|1.4|5.1|57.3|
25
+
26
+ ### TER
27
+
28
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
29
+ |---|---|---|---|---|---|---|---|---|
30
+ |decode_asr_asr_model_valid.acc.ave/test|515|8266|82.6|8.0|9.4|2.1|19.5|61.4|
31
+ |decode_asr_asr_model_valid.acc.ave/valid|480|7598|93.3|1.2|5.5|1.6|8.2|57.3|
32
+
exp/.DS_Store ADDED
Binary file (8.2 kB). View file
 
exp/asr_stats_raw_bpe150_sp/.DS_Store ADDED
Binary file (6.15 kB). View file
 
exp/asr_stats_raw_bpe150_sp/train/.DS_Store ADDED
Binary file (6.15 kB). View file
 
exp/asr_stats_raw_bpe150_sp/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/asr_train_asr_conformer5_raw_bpe150_sp/.DS_Store ADDED
Binary file (6.15 kB). View file
 
exp/asr_train_asr_conformer5_raw_bpe150_sp/RESULTS.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Sat Mar 19 15:43:43 UTC 2022`
5
+ - python version: `3.9.10 | packaged by conda-forge | (main, Feb 1 2022, 21:24:11) [GCC 9.4.0]`
6
+ - espnet version: `espnet 0.10.7a1`
7
+ - pytorch version: `pytorch 1.10.1`
8
+ - Git hash: `d9691d77b34124627f53942fe906077adc4a4e69`
9
+ - Commit date: `Thu Mar 17 15:50:03 2022 -0400`
10
+
11
+ ## asr_train_asr_conformer5_raw_bpe150_sp
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |decode_asr_asr_model_valid.acc.ave/test|515|2941|80.6|17.1|2.4|10.1|29.5|61.4|
17
+ |decode_asr_asr_model_valid.acc.ave/valid|480|3127|86.8|12.2|1.0|1.5|14.7|57.3|
18
+
19
+ ### CER
20
+
21
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
22
+ |---|---|---|---|---|---|---|---|---|
23
+ |decode_asr_asr_model_valid.acc.ave/test|515|16056|92.3|3.8|3.9|2.4|10.1|61.4|
24
+ |decode_asr_asr_model_valid.acc.ave/valid|480|15986|96.4|0.5|3.1|1.4|5.1|57.3|
25
+
26
+ ### TER
27
+
28
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
29
+ |---|---|---|---|---|---|---|---|---|
30
+ |decode_asr_asr_model_valid.acc.ave/test|515|8266|82.6|8.0|9.4|2.1|19.5|61.4|
31
+ |decode_asr_asr_model_valid.acc.ave/valid|480|7598|93.3|1.2|5.5|1.6|8.2|57.3|
32
+
exp/asr_train_asr_conformer5_raw_bpe150_sp/config.yaml ADDED
@@ -0,0 +1,339 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_asr_conformer5.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_asr_conformer5_raw_bpe150_sp
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: false
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 50
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - acc
39
+ - max
40
+ keep_nbest_models: 10
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 3
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: true
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ use_wandb: false
54
+ wandb_project: null
55
+ wandb_id: null
56
+ wandb_entity: null
57
+ wandb_name: null
58
+ wandb_model_log_interval: -1
59
+ detect_anomaly: false
60
+ pretrain_path: null
61
+ init_param: []
62
+ ignore_init_mismatch: false
63
+ freeze_param: []
64
+ num_iters_per_epoch: null
65
+ batch_size: 20
66
+ valid_batch_size: null
67
+ batch_bins: 2500000
68
+ valid_batch_bins: null
69
+ train_shape_file:
70
+ - exp/asr_stats_raw_bpe150_sp/train/speech_shape
71
+ - exp/asr_stats_raw_bpe150_sp/train/text_shape.bpe
72
+ valid_shape_file:
73
+ - exp/asr_stats_raw_bpe150_sp/valid/speech_shape
74
+ - exp/asr_stats_raw_bpe150_sp/valid/text_shape.bpe
75
+ batch_type: numel
76
+ valid_batch_type: null
77
+ fold_length:
78
+ - 80000
79
+ - 150
80
+ sort_in_batch: descending
81
+ sort_batch: descending
82
+ multiple_iterator: false
83
+ chunk_length: 500
84
+ chunk_shift_ratio: 0.5
85
+ num_cache_chunks: 1024
86
+ train_data_path_and_name_and_type:
87
+ - - dump/raw/train_sp/wav.scp
88
+ - speech
89
+ - sound
90
+ - - dump/raw/train_sp/text
91
+ - text
92
+ - text
93
+ valid_data_path_and_name_and_type:
94
+ - - dump/raw/valid/wav.scp
95
+ - speech
96
+ - sound
97
+ - - dump/raw/valid/text
98
+ - text
99
+ - text
100
+ allow_variable_data_keys: false
101
+ max_cache_size: 0.0
102
+ max_cache_fd: 32
103
+ valid_max_cache_size: null
104
+ optim: adam
105
+ optim_conf:
106
+ lr: 4.0
107
+ scheduler: noamlr
108
+ scheduler_conf:
109
+ model_size: 256
110
+ warmup_steps: 25000
111
+ token_list:
112
+ - <blank>
113
+ - <unk>
114
+ - ▁
115
+ - s
116
+ - i
117
+ - o
118
+ - e
119
+ - a
120
+ - n
121
+ - u
122
+ - t
123
+ - r
124
+ - ▁c
125
+ - ▁a
126
+ - é
127
+ - c
128
+ - l
129
+ - ▁de
130
+ - ▁d
131
+ - d
132
+ - ▁est
133
+ - m
134
+ - ▁le
135
+ - p
136
+ - er
137
+ - v
138
+ - f
139
+ - ▁l
140
+ - ▁s
141
+ - à
142
+ - ▁m
143
+ - ▁la
144
+ - ▁p
145
+ - re
146
+ - ▁un
147
+ - ▁il
148
+ - ▁vous
149
+ - nt
150
+ - g
151
+ - te
152
+ - ur
153
+ - in
154
+ - ▁qu
155
+ - il
156
+ - ce
157
+ - ▁en
158
+ - ▁je
159
+ - tre
160
+ - et
161
+ - ez
162
+ - h
163
+ - le
164
+ - ▁pas
165
+ - ▁b
166
+ - or
167
+ - ve
168
+ - b
169
+ - x
170
+ - ▁une
171
+ - ▁y
172
+ - ▁au
173
+ - ▁bien
174
+ - ▁vo
175
+ - ge
176
+ - ir
177
+ - ▁t
178
+ - ▁on
179
+ - ▁oui
180
+ - ▁j
181
+ - ▁n
182
+ - ment
183
+ - ▁ma
184
+ - ▁tr
185
+ - ▁re
186
+ - que
187
+ - ▁dan
188
+ - ▁par
189
+ - ▁du
190
+ - ▁que
191
+ - è
192
+ - ont
193
+ - ▁ici
194
+ - ▁euh
195
+ - ▁se
196
+ - ▁ne
197
+ - ▁pour
198
+ - aire
199
+ - z
200
+ - ▁ave
201
+ - j
202
+ - ▁nous
203
+ - ▁bon
204
+ - ▁tout
205
+ - ▁mais
206
+ - ▁monsieur
207
+ - ette
208
+ - ▁tou
209
+ - ement
210
+ - ▁va
211
+ - ▁sur
212
+ - ê
213
+ - ▁médecin
214
+ - tion
215
+ - rès
216
+ - elle
217
+ - ▁alors
218
+ - ▁sui
219
+ - y
220
+ - ▁voir
221
+ - ▁ou
222
+ - ▁allez
223
+ - ▁che
224
+ - ▁eau
225
+ - and
226
+ - ait
227
+ - ▁comme
228
+ - ▁manivelle
229
+ - ▁plaît
230
+ - ▁cric
231
+ - vous
232
+ - ▁bonjour
233
+ - puis
234
+ - ▁peut
235
+ - ▁plus
236
+ - ▁malade
237
+ - ommes
238
+ - ▁route
239
+ - ▁deux
240
+ - ▁alle
241
+ - ▁fait
242
+ - droit
243
+ - ▁aussi
244
+ - vien
245
+ - ▁hui
246
+ - ▁pharmacie
247
+ - ▁merci
248
+ - ▁heure
249
+ - ▁gauche
250
+ - ▁camarade
251
+ - û
252
+ - ô
253
+ - w
254
+ - œ
255
+ - k
256
+ - ù
257
+ - â
258
+ - î
259
+ - ç
260
+ - q
261
+ - <sos/eos>
262
+ init: null
263
+ input_size: null
264
+ ctc_conf:
265
+ dropout_rate: 0.0
266
+ ctc_type: builtin
267
+ reduce: true
268
+ ignore_nan_grad: true
269
+ joint_net_conf: null
270
+ model_conf:
271
+ ctc_weight: 0.3
272
+ lsm_weight: 0.1
273
+ length_normalized_loss: false
274
+ use_preprocessor: true
275
+ token_type: bpe
276
+ bpemodel: data/token_list/bpe_unigram150/bpe.model
277
+ non_linguistic_symbols: null
278
+ cleaner: null
279
+ g2p: null
280
+ speech_volume_normalize: null
281
+ rir_scp: null
282
+ rir_apply_prob: 1.0
283
+ noise_scp: null
284
+ noise_apply_prob: 1.0
285
+ noise_db_range: '13_15'
286
+ frontend: default
287
+ frontend_conf:
288
+ n_fft: 512
289
+ win_length: 400
290
+ hop_length: 160
291
+ fs: 16k
292
+ specaug: specaug
293
+ specaug_conf:
294
+ apply_time_warp: true
295
+ time_warp_window: 5
296
+ time_warp_mode: bicubic
297
+ apply_freq_mask: true
298
+ freq_mask_width_range:
299
+ - 0
300
+ - 30
301
+ num_freq_mask: 2
302
+ apply_time_mask: true
303
+ time_mask_width_range:
304
+ - 0
305
+ - 40
306
+ num_time_mask: 2
307
+ normalize: global_mvn
308
+ normalize_conf:
309
+ stats_file: exp/asr_stats_raw_bpe150_sp/train/feats_stats.npz
310
+ preencoder: null
311
+ preencoder_conf: {}
312
+ encoder: conformer
313
+ encoder_conf:
314
+ input_layer: conv2d
315
+ num_blocks: 12
316
+ linear_units: 2048
317
+ dropout_rate: 0.1
318
+ output_size: 256
319
+ attention_heads: 4
320
+ attention_dropout_rate: 0.0
321
+ pos_enc_layer_type: rel_pos
322
+ selfattention_layer_type: rel_selfattn
323
+ activation_type: swish
324
+ macaron_style: true
325
+ use_cnn_module: true
326
+ cnn_module_kernel: 15
327
+ postencoder: null
328
+ postencoder_conf: {}
329
+ decoder: transformer
330
+ decoder_conf:
331
+ input_layer: embed
332
+ num_blocks: 6
333
+ linear_units: 2048
334
+ dropout_rate: 0.1
335
+ required:
336
+ - output_dir
337
+ - token_list
338
+ version: 0.10.7a1
339
+ distributed: false
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/acc.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/backward_time.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/cer.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/cer_ctc.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/forward_time.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/gpu_max_cached_mem_GB.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/iter_time.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/loss.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/loss_att.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/loss_ctc.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/optim0_lr0.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/optim_step_time.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/train_time.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/images/wer.png ADDED
exp/asr_train_asr_conformer5_raw_bpe150_sp/valid.acc.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b56a7b4e09106b8c45b2986c9c4d456c4cb4c5436817a11bb833fd027a3f58e1
3
+ size 172558757