Fhrozen committed on
Commit
5721441
1 Parent(s): 7e23dea

Update model

Browse files
Files changed (30) hide show
  1. README.md +419 -0
  2. data/en_token_list/bpe_unigram30/bpe.model +3 -0
  3. exp/asr_stats_raw_en_bpe30/train/feats_stats.npz +0 -0
  4. exp/asr_train_raw_en_bpe30/2epoch.pth +3 -0
  5. exp/asr_train_raw_en_bpe30/RESULTS.md +32 -0
  6. exp/asr_train_raw_en_bpe30/config.yaml +196 -0
  7. exp/asr_train_raw_en_bpe30/images/acc.png +0 -0
  8. exp/asr_train_raw_en_bpe30/images/backward_time.png +0 -0
  9. exp/asr_train_raw_en_bpe30/images/cer.png +0 -0
  10. exp/asr_train_raw_en_bpe30/images/cer_ctc.png +0 -0
  11. exp/asr_train_raw_en_bpe30/images/forward_time.png +0 -0
  12. exp/asr_train_raw_en_bpe30/images/iter_time.png +0 -0
  13. exp/asr_train_raw_en_bpe30/images/loss.png +0 -0
  14. exp/asr_train_raw_en_bpe30/images/loss_att.png +0 -0
  15. exp/asr_train_raw_en_bpe30/images/loss_ctc.png +0 -0
  16. exp/asr_train_raw_en_bpe30/images/optim0_lr0.png +0 -0
  17. exp/asr_train_raw_en_bpe30/images/optim_step_time.png +0 -0
  18. exp/asr_train_raw_en_bpe30/images/train_time.png +0 -0
  19. exp/asr_train_raw_en_bpe30/images/wer.png +0 -0
  20. exp/lm_train_lm_en_bpe30/39epoch.pth +3 -0
  21. exp/lm_train_lm_en_bpe30/config.yaml +146 -0
  22. exp/lm_train_lm_en_bpe30/images/backward_time.png +0 -0
  23. exp/lm_train_lm_en_bpe30/images/forward_time.png +0 -0
  24. exp/lm_train_lm_en_bpe30/images/iter_time.png +0 -0
  25. exp/lm_train_lm_en_bpe30/images/loss.png +0 -0
  26. exp/lm_train_lm_en_bpe30/images/optim0_lr0.png +0 -0
  27. exp/lm_train_lm_en_bpe30/images/optim_step_time.png +0 -0
  28. exp/lm_train_lm_en_bpe30/images/train_time.png +0 -0
  29. exp/lm_train_lm_en_bpe30/perplexity_test/ppl +1 -0
  30. meta.yaml +10 -0
README.md ADDED
@@ -0,0 +1,419 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - automatic-speech-recognition
6
+ language: en
7
+ datasets:
8
+ - an4
9
+ license: cc-by-4.0
10
+ ---
11
+
12
+ ## ESPnet2 ASR model
13
+
14
+ ### `Fhrozen/test_an4`
15
+
16
+ This model was trained by Fhrozen using the an4 recipe in [espnet](https://github.com/espnet/espnet/).
17
+
18
+ ### Demo: How to use in ESPnet2
19
+
20
+ ```bash
21
+ cd espnet
22
+ git checkout b8df4c928e132acff78d196988bdb68a66987952
23
+ pip install -e .
24
+ cd egs2/an4/asr1
25
+ ./run.sh --skip_data_prep false --skip_train true --download_model Fhrozen/test_an4
26
+ ```
27
+
28
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
29
+ # RESULTS
30
+ ## Environments
31
+ - date: `Wed Oct 20 00:00:46 JST 2021`
32
+ - python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
33
+ - espnet version: `espnet 0.10.4a1`
34
+ - pytorch version: `pytorch 1.9.0`
35
+ - Git hash: `b8df4c928e132acff78d196988bdb68a66987952`
36
+ - Commit date: `Tue Oct 19 07:48:11 2021 -0400`
37
+
38
+ ## asr_train_raw_en_bpe30
39
+ ### WER
40
+
41
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
42
+ |---|---|---|---|---|---|---|---|---|
43
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/test|130|773|4.0|22.3|73.7|0.1|96.1|100.0|
44
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/train_dev|100|591|2.7|21.8|75.5|0.0|97.3|100.0|
45
+
46
+ ### CER
47
+
48
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
49
+ |---|---|---|---|---|---|---|---|---|
50
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/test|130|2565|17.2|16.4|66.4|1.0|83.8|100.0|
51
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/train_dev|100|1915|15.5|16.4|68.1|0.9|85.5|100.0|
52
+
53
+ ### TER
54
+
55
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
56
+ |---|---|---|---|---|---|---|---|---|
57
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/test|130|2695|21.1|15.6|63.3|0.9|79.9|100.0|
58
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/train_dev|100|2015|19.4|15.6|65.0|0.9|81.5|100.0|
59
+
60
+ ## ASR config
61
+
62
+ <details><summary>expand</summary>
63
+
64
+ ```
65
+ config: null
66
+ print_config: false
67
+ log_level: INFO
68
+ dry_run: false
69
+ iterator_type: sequence
70
+ output_dir: exp/asr_train_raw_en_bpe30
71
+ ngpu: 0
72
+ seed: 0
73
+ num_workers: 1
74
+ num_att_plot: 3
75
+ dist_backend: nccl
76
+ dist_init_method: env://
77
+ dist_world_size: null
78
+ dist_rank: null
79
+ local_rank: null
80
+ dist_master_addr: null
81
+ dist_master_port: null
82
+ dist_launcher: null
83
+ multiprocessing_distributed: false
84
+ unused_parameters: false
85
+ sharded_ddp: false
86
+ cudnn_enabled: true
87
+ cudnn_benchmark: false
88
+ cudnn_deterministic: true
89
+ collect_stats: false
90
+ write_collected_feats: false
91
+ max_epoch: 40
92
+ patience: null
93
+ val_scheduler_criterion:
94
+ - valid
95
+ - loss
96
+ early_stopping_criterion:
97
+ - valid
98
+ - loss
99
+ - min
100
+ best_model_criterion:
101
+ - - train
102
+ - loss
103
+ - min
104
+ - - valid
105
+ - loss
106
+ - min
107
+ - - train
108
+ - acc
109
+ - max
110
+ - - valid
111
+ - acc
112
+ - max
113
+ keep_nbest_models:
114
+ - 10
115
+ grad_clip: 5.0
116
+ grad_clip_type: 2.0
117
+ grad_noise: false
118
+ accum_grad: 1
119
+ no_forward_run: false
120
+ resume: true
121
+ train_dtype: float32
122
+ use_amp: false
123
+ log_interval: null
124
+ use_tensorboard: true
125
+ use_wandb: false
126
+ wandb_project: null
127
+ wandb_id: null
128
+ wandb_entity: null
129
+ wandb_name: null
130
+ wandb_model_log_interval: -1
131
+ detect_anomaly: false
132
+ pretrain_path: null
133
+ init_param: []
134
+ ignore_init_mismatch: false
135
+ freeze_param: []
136
+ num_iters_per_epoch: null
137
+ batch_size: 20
138
+ valid_batch_size: null
139
+ batch_bins: 1000000
140
+ valid_batch_bins: null
141
+ train_shape_file:
142
+ - exp/asr_stats_raw_en_bpe30/train/speech_shape
143
+ - exp/asr_stats_raw_en_bpe30/train/text_shape.bpe
144
+ valid_shape_file:
145
+ - exp/asr_stats_raw_en_bpe30/valid/speech_shape
146
+ - exp/asr_stats_raw_en_bpe30/valid/text_shape.bpe
147
+ batch_type: folded
148
+ valid_batch_type: null
149
+ fold_length:
150
+ - 80000
151
+ - 150
152
+ sort_in_batch: descending
153
+ sort_batch: descending
154
+ multiple_iterator: false
155
+ chunk_length: 500
156
+ chunk_shift_ratio: 0.5
157
+ num_cache_chunks: 1024
158
+ train_data_path_and_name_and_type:
159
+ - - dump/raw/train_nodev/wav.scp
160
+ - speech
161
+ - sound
162
+ - - dump/raw/train_nodev/text
163
+ - text
164
+ - text
165
+ valid_data_path_and_name_and_type:
166
+ - - dump/raw/train_dev/wav.scp
167
+ - speech
168
+ - sound
169
+ - - dump/raw/train_dev/text
170
+ - text
171
+ - text
172
+ allow_variable_data_keys: false
173
+ max_cache_size: 0.0
174
+ max_cache_fd: 32
175
+ valid_max_cache_size: null
176
+ optim: adadelta
177
+ optim_conf: {}
178
+ scheduler: null
179
+ scheduler_conf: {}
180
+ token_list:
181
+ - <blank>
182
+ - <unk>
183
+ - ▁
184
+ - T
185
+ - E
186
+ - O
187
+ - R
188
+ - Y
189
+ - A
190
+ - H
191
+ - U
192
+ - S
193
+ - I
194
+ - F
195
+ - B
196
+ - L
197
+ - P
198
+ - D
199
+ - G
200
+ - M
201
+ - C
202
+ - V
203
+ - X
204
+ - J
205
+ - K
206
+ - Z
207
+ - W
208
+ - N
209
+ - Q
210
+ - <sos/eos>
211
+ init: null
212
+ input_size: null
213
+ ctc_conf:
214
+ dropout_rate: 0.0
215
+ ctc_type: builtin
216
+ reduce: true
217
+ ignore_nan_grad: true
218
+ model_conf:
219
+ ctc_weight: 0.5
220
+ ignore_id: -1
221
+ lsm_weight: 0.0
222
+ length_normalized_loss: false
223
+ report_cer: true
224
+ report_wer: true
225
+ sym_space: <space>
226
+ sym_blank: <blank>
227
+ extract_feats_in_collect_stats: true
228
+ use_preprocessor: true
229
+ token_type: bpe
230
+ bpemodel: data/en_token_list/bpe_unigram30/bpe.model
231
+ non_linguistic_symbols: null
232
+ cleaner: null
233
+ g2p: null
234
+ speech_volume_normalize: null
235
+ rir_scp: null
236
+ rir_apply_prob: 1.0
237
+ noise_scp: null
238
+ noise_apply_prob: 1.0
239
+ noise_db_range: '13_15'
240
+ frontend: default
241
+ frontend_conf:
242
+ fs: 16k
243
+ specaug: null
244
+ specaug_conf: {}
245
+ normalize: global_mvn
246
+ normalize_conf:
247
+ stats_file: exp/asr_stats_raw_en_bpe30/train/feats_stats.npz
248
+ preencoder: null
249
+ preencoder_conf: {}
250
+ encoder: rnn
251
+ encoder_conf: {}
252
+ postencoder: null
253
+ postencoder_conf: {}
254
+ decoder: rnn
255
+ decoder_conf: {}
256
+ required:
257
+ - output_dir
258
+ - token_list
259
+ version: 0.10.4a1
260
+ distributed: false
261
+ ```
262
+
263
+ </details>
264
+
265
+ ## LM config
266
+
267
+ <details><summary>expand</summary>
268
+
269
+ ```
270
+ config: conf/train_lm.yaml
271
+ print_config: false
272
+ log_level: INFO
273
+ dry_run: false
274
+ iterator_type: sequence
275
+ output_dir: exp/lm_train_lm_en_bpe30
276
+ ngpu: 0
277
+ seed: 0
278
+ num_workers: 1
279
+ num_att_plot: 3
280
+ dist_backend: nccl
281
+ dist_init_method: env://
282
+ dist_world_size: null
283
+ dist_rank: null
284
+ local_rank: null
285
+ dist_master_addr: null
286
+ dist_master_port: null
287
+ dist_launcher: null
288
+ multiprocessing_distributed: false
289
+ unused_parameters: false
290
+ sharded_ddp: false
291
+ cudnn_enabled: true
292
+ cudnn_benchmark: false
293
+ cudnn_deterministic: true
294
+ collect_stats: false
295
+ write_collected_feats: false
296
+ max_epoch: 40
297
+ patience: null
298
+ val_scheduler_criterion:
299
+ - valid
300
+ - loss
301
+ early_stopping_criterion:
302
+ - valid
303
+ - loss
304
+ - min
305
+ best_model_criterion:
306
+ - - valid
307
+ - loss
308
+ - min
309
+ keep_nbest_models: 1
310
+ grad_clip: 5.0
311
+ grad_clip_type: 2.0
312
+ grad_noise: false
313
+ accum_grad: 1
314
+ no_forward_run: false
315
+ resume: true
316
+ train_dtype: float32
317
+ use_amp: false
318
+ log_interval: null
319
+ use_tensorboard: true
320
+ use_wandb: false
321
+ wandb_project: null
322
+ wandb_id: null
323
+ wandb_entity: null
324
+ wandb_name: null
325
+ wandb_model_log_interval: -1
326
+ detect_anomaly: false
327
+ pretrain_path: null
328
+ init_param: []
329
+ ignore_init_mismatch: false
330
+ freeze_param: []
331
+ num_iters_per_epoch: null
332
+ batch_size: 256
333
+ valid_batch_size: null
334
+ batch_bins: 1000000
335
+ valid_batch_bins: null
336
+ train_shape_file:
337
+ - exp/lm_stats_en_bpe30/train/text_shape.bpe
338
+ valid_shape_file:
339
+ - exp/lm_stats_en_bpe30/valid/text_shape.bpe
340
+ batch_type: folded
341
+ valid_batch_type: null
342
+ fold_length:
343
+ - 150
344
+ sort_in_batch: descending
345
+ sort_batch: descending
346
+ multiple_iterator: false
347
+ chunk_length: 500
348
+ chunk_shift_ratio: 0.5
349
+ num_cache_chunks: 1024
350
+ train_data_path_and_name_and_type:
351
+ - - dump/raw/lm_train.txt
352
+ - text
353
+ - text
354
+ valid_data_path_and_name_and_type:
355
+ - - dump/raw/train_dev/text
356
+ - text
357
+ - text
358
+ allow_variable_data_keys: false
359
+ max_cache_size: 0.0
360
+ max_cache_fd: 32
361
+ valid_max_cache_size: null
362
+ optim: adam
363
+ optim_conf:
364
+ lr: 0.1
365
+ scheduler: null
366
+ scheduler_conf: {}
367
+ token_list:
368
+ - <blank>
369
+ - <unk>
370
+ - ▁
371
+ - T
372
+ - E
373
+ - O
374
+ - R
375
+ - Y
376
+ - A
377
+ - H
378
+ - U
379
+ - S
380
+ - I
381
+ - F
382
+ - B
383
+ - L
384
+ - P
385
+ - D
386
+ - G
387
+ - M
388
+ - C
389
+ - V
390
+ - X
391
+ - J
392
+ - K
393
+ - Z
394
+ - W
395
+ - N
396
+ - Q
397
+ - <sos/eos>
398
+ init: null
399
+ model_conf:
400
+ ignore_id: 0
401
+ use_preprocessor: true
402
+ token_type: bpe
403
+ bpemodel: data/en_token_list/bpe_unigram30/bpe.model
404
+ non_linguistic_symbols: null
405
+ cleaner: null
406
+ g2p: null
407
+ lm: seq_rnn
408
+ lm_conf:
409
+ unit: 650
410
+ nlayers: 2
411
+ required:
412
+ - output_dir
413
+ - token_list
414
+ version: 0.10.4a1
415
+ distributed: false
416
+ ```
417
+
418
+ </details>
419
+
data/en_token_list/bpe_unigram30/bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37b8ea90f6f41bb62fa8f73850f8e1f40bf78987dadfe88567b3908c3e1751d1
3
+ size 237994
exp/asr_stats_raw_en_bpe30/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/asr_train_raw_en_bpe30/2epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6853bb9dad5af6eaca2ad7adb234ec7769cbe655bba9b38fe147e85cd116b53a
3
+ size 33105716
exp/asr_train_raw_en_bpe30/RESULTS.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Wed Oct 20 00:00:46 JST 2021`
5
+ - python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
6
+ - espnet version: `espnet 0.10.4a1`
7
+ - pytorch version: `pytorch 1.9.0`
8
+ - Git hash: `b8df4c928e132acff78d196988bdb68a66987952`
9
+ - Commit date: `Tue Oct 19 07:48:11 2021 -0400`
10
+
11
+ ## asr_train_raw_en_bpe30
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/test|130|773|4.0|22.3|73.7|0.1|96.1|100.0|
17
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/train_dev|100|591|2.7|21.8|75.5|0.0|97.3|100.0|
18
+
19
+ ### CER
20
+
21
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
22
+ |---|---|---|---|---|---|---|---|---|
23
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/test|130|2565|17.2|16.4|66.4|1.0|83.8|100.0|
24
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/train_dev|100|1915|15.5|16.4|68.1|0.9|85.5|100.0|
25
+
26
+ ### TER
27
+
28
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
29
+ |---|---|---|---|---|---|---|---|---|
30
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/test|130|2695|21.1|15.6|63.3|0.9|79.9|100.0|
31
+ |inference_lm_lm_train_lm_en_bpe30_valid.loss.ave_asr_model_valid.acc.best/train_dev|100|2015|19.4|15.6|65.0|0.9|81.5|100.0|
32
+
exp/asr_train_raw_en_bpe30/config.yaml ADDED
@@ -0,0 +1,196 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: null
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_raw_en_bpe30
7
+ ngpu: 0
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: null
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 40
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - train
38
+ - loss
39
+ - min
40
+ - - valid
41
+ - loss
42
+ - min
43
+ - - train
44
+ - acc
45
+ - max
46
+ - - valid
47
+ - acc
48
+ - max
49
+ keep_nbest_models:
50
+ - 10
51
+ grad_clip: 5.0
52
+ grad_clip_type: 2.0
53
+ grad_noise: false
54
+ accum_grad: 1
55
+ no_forward_run: false
56
+ resume: true
57
+ train_dtype: float32
58
+ use_amp: false
59
+ log_interval: null
60
+ use_tensorboard: true
61
+ use_wandb: false
62
+ wandb_project: null
63
+ wandb_id: null
64
+ wandb_entity: null
65
+ wandb_name: null
66
+ wandb_model_log_interval: -1
67
+ detect_anomaly: false
68
+ pretrain_path: null
69
+ init_param: []
70
+ ignore_init_mismatch: false
71
+ freeze_param: []
72
+ num_iters_per_epoch: null
73
+ batch_size: 20
74
+ valid_batch_size: null
75
+ batch_bins: 1000000
76
+ valid_batch_bins: null
77
+ train_shape_file:
78
+ - exp/asr_stats_raw_en_bpe30/train/speech_shape
79
+ - exp/asr_stats_raw_en_bpe30/train/text_shape.bpe
80
+ valid_shape_file:
81
+ - exp/asr_stats_raw_en_bpe30/valid/speech_shape
82
+ - exp/asr_stats_raw_en_bpe30/valid/text_shape.bpe
83
+ batch_type: folded
84
+ valid_batch_type: null
85
+ fold_length:
86
+ - 80000
87
+ - 150
88
+ sort_in_batch: descending
89
+ sort_batch: descending
90
+ multiple_iterator: false
91
+ chunk_length: 500
92
+ chunk_shift_ratio: 0.5
93
+ num_cache_chunks: 1024
94
+ train_data_path_and_name_and_type:
95
+ - - dump/raw/train_nodev/wav.scp
96
+ - speech
97
+ - sound
98
+ - - dump/raw/train_nodev/text
99
+ - text
100
+ - text
101
+ valid_data_path_and_name_and_type:
102
+ - - dump/raw/train_dev/wav.scp
103
+ - speech
104
+ - sound
105
+ - - dump/raw/train_dev/text
106
+ - text
107
+ - text
108
+ allow_variable_data_keys: false
109
+ max_cache_size: 0.0
110
+ max_cache_fd: 32
111
+ valid_max_cache_size: null
112
+ optim: adadelta
113
+ optim_conf: {}
114
+ scheduler: null
115
+ scheduler_conf: {}
116
+ token_list:
117
+ - <blank>
118
+ - <unk>
119
+ - ▁
120
+ - T
121
+ - E
122
+ - O
123
+ - R
124
+ - Y
125
+ - A
126
+ - H
127
+ - U
128
+ - S
129
+ - I
130
+ - F
131
+ - B
132
+ - L
133
+ - P
134
+ - D
135
+ - G
136
+ - M
137
+ - C
138
+ - V
139
+ - X
140
+ - J
141
+ - K
142
+ - Z
143
+ - W
144
+ - N
145
+ - Q
146
+ - <sos/eos>
147
+ init: null
148
+ input_size: null
149
+ ctc_conf:
150
+ dropout_rate: 0.0
151
+ ctc_type: builtin
152
+ reduce: true
153
+ ignore_nan_grad: true
154
+ model_conf:
155
+ ctc_weight: 0.5
156
+ ignore_id: -1
157
+ lsm_weight: 0.0
158
+ length_normalized_loss: false
159
+ report_cer: true
160
+ report_wer: true
161
+ sym_space: <space>
162
+ sym_blank: <blank>
163
+ extract_feats_in_collect_stats: true
164
+ use_preprocessor: true
165
+ token_type: bpe
166
+ bpemodel: data/en_token_list/bpe_unigram30/bpe.model
167
+ non_linguistic_symbols: null
168
+ cleaner: null
169
+ g2p: null
170
+ speech_volume_normalize: null
171
+ rir_scp: null
172
+ rir_apply_prob: 1.0
173
+ noise_scp: null
174
+ noise_apply_prob: 1.0
175
+ noise_db_range: '13_15'
176
+ frontend: default
177
+ frontend_conf:
178
+ fs: 16k
179
+ specaug: null
180
+ specaug_conf: {}
181
+ normalize: global_mvn
182
+ normalize_conf:
183
+ stats_file: exp/asr_stats_raw_en_bpe30/train/feats_stats.npz
184
+ preencoder: null
185
+ preencoder_conf: {}
186
+ encoder: rnn
187
+ encoder_conf: {}
188
+ postencoder: null
189
+ postencoder_conf: {}
190
+ decoder: rnn
191
+ decoder_conf: {}
192
+ required:
193
+ - output_dir
194
+ - token_list
195
+ version: 0.10.4a1
196
+ distributed: false
exp/asr_train_raw_en_bpe30/images/acc.png ADDED
exp/asr_train_raw_en_bpe30/images/backward_time.png ADDED
exp/asr_train_raw_en_bpe30/images/cer.png ADDED
exp/asr_train_raw_en_bpe30/images/cer_ctc.png ADDED
exp/asr_train_raw_en_bpe30/images/forward_time.png ADDED
exp/asr_train_raw_en_bpe30/images/iter_time.png ADDED
exp/asr_train_raw_en_bpe30/images/loss.png ADDED
exp/asr_train_raw_en_bpe30/images/loss_att.png ADDED
exp/asr_train_raw_en_bpe30/images/loss_ctc.png ADDED
exp/asr_train_raw_en_bpe30/images/optim0_lr0.png ADDED
exp/asr_train_raw_en_bpe30/images/optim_step_time.png ADDED
exp/asr_train_raw_en_bpe30/images/train_time.png ADDED
exp/asr_train_raw_en_bpe30/images/wer.png ADDED
exp/lm_train_lm_en_bpe30/39epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e588e2a3843cd37c3880170e99b0d0f60fb36aed888dc501f2a8aaace230b5d
3
+ size 27240836
exp/lm_train_lm_en_bpe30/config.yaml ADDED
@@ -0,0 +1,146 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_lm.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/lm_train_lm_en_bpe30
7
+ ngpu: 0
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: null
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 40
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - loss
39
+ - min
40
+ keep_nbest_models: 1
41
+ grad_clip: 5.0
42
+ grad_clip_type: 2.0
43
+ grad_noise: false
44
+ accum_grad: 1
45
+ no_forward_run: false
46
+ resume: true
47
+ train_dtype: float32
48
+ use_amp: false
49
+ log_interval: null
50
+ use_tensorboard: true
51
+ use_wandb: false
52
+ wandb_project: null
53
+ wandb_id: null
54
+ wandb_entity: null
55
+ wandb_name: null
56
+ wandb_model_log_interval: -1
57
+ detect_anomaly: false
58
+ pretrain_path: null
59
+ init_param: []
60
+ ignore_init_mismatch: false
61
+ freeze_param: []
62
+ num_iters_per_epoch: null
63
+ batch_size: 256
64
+ valid_batch_size: null
65
+ batch_bins: 1000000
66
+ valid_batch_bins: null
67
+ train_shape_file:
68
+ - exp/lm_stats_en_bpe30/train/text_shape.bpe
69
+ valid_shape_file:
70
+ - exp/lm_stats_en_bpe30/valid/text_shape.bpe
71
+ batch_type: folded
72
+ valid_batch_type: null
73
+ fold_length:
74
+ - 150
75
+ sort_in_batch: descending
76
+ sort_batch: descending
77
+ multiple_iterator: false
78
+ chunk_length: 500
79
+ chunk_shift_ratio: 0.5
80
+ num_cache_chunks: 1024
81
+ train_data_path_and_name_and_type:
82
+ - - dump/raw/lm_train.txt
83
+ - text
84
+ - text
85
+ valid_data_path_and_name_and_type:
86
+ - - dump/raw/train_dev/text
87
+ - text
88
+ - text
89
+ allow_variable_data_keys: false
90
+ max_cache_size: 0.0
91
+ max_cache_fd: 32
92
+ valid_max_cache_size: null
93
+ optim: adam
94
+ optim_conf:
95
+ lr: 0.1
96
+ scheduler: null
97
+ scheduler_conf: {}
98
+ token_list:
99
+ - <blank>
100
+ - <unk>
101
+ - ▁
102
+ - T
103
+ - E
104
+ - O
105
+ - R
106
+ - Y
107
+ - A
108
+ - H
109
+ - U
110
+ - S
111
+ - I
112
+ - F
113
+ - B
114
+ - L
115
+ - P
116
+ - D
117
+ - G
118
+ - M
119
+ - C
120
+ - V
121
+ - X
122
+ - J
123
+ - K
124
+ - Z
125
+ - W
126
+ - N
127
+ - Q
128
+ - <sos/eos>
129
+ init: null
130
+ model_conf:
131
+ ignore_id: 0
132
+ use_preprocessor: true
133
+ token_type: bpe
134
+ bpemodel: data/en_token_list/bpe_unigram30/bpe.model
135
+ non_linguistic_symbols: null
136
+ cleaner: null
137
+ g2p: null
138
+ lm: seq_rnn
139
+ lm_conf:
140
+ unit: 650
141
+ nlayers: 2
142
+ required:
143
+ - output_dir
144
+ - token_list
145
+ version: 0.10.4a1
146
+ distributed: false
exp/lm_train_lm_en_bpe30/images/backward_time.png ADDED
exp/lm_train_lm_en_bpe30/images/forward_time.png ADDED
exp/lm_train_lm_en_bpe30/images/iter_time.png ADDED
exp/lm_train_lm_en_bpe30/images/loss.png ADDED
exp/lm_train_lm_en_bpe30/images/optim0_lr0.png ADDED
exp/lm_train_lm_en_bpe30/images/optim_step_time.png ADDED
exp/lm_train_lm_en_bpe30/images/train_time.png ADDED
exp/lm_train_lm_en_bpe30/perplexity_test/ppl ADDED
@@ -0,0 +1 @@
 
 
1
+ 8.770004779236807
meta.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ espnet: 0.10.4a1
2
+ files:
3
+ asr_model_file: exp/asr_train_raw_en_bpe30/2epoch.pth
4
+ lm_file: exp/lm_train_lm_en_bpe30/39epoch.pth
5
+ python: "3.9.7 (default, Sep 16 2021, 13:09:58) \n[GCC 7.5.0]"
6
+ timestamp: 1634655646.769093
7
+ torch: 1.9.0
8
+ yaml_files:
9
+ asr_train_config: exp/asr_train_raw_en_bpe30/config.yaml
10
+ lm_train_config: exp/lm_train_lm_en_bpe30/config.yaml