ftshijt committed on
Commit
993c486
1 Parent(s): 2d41bf9

Update model

Browse files
Files changed (32) hide show
  1. README.md +526 -0
  2. data/token_list/bpe_unigram250/bpe.model +3 -0
  3. exp/asr_stats_raw_bpe250_sp/train/feats_stats.npz +0 -0
  4. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/73epoch.pth +3 -0
  5. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/RESULTS.md +32 -0
  6. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/config.yaml +426 -0
  7. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/acc.png +0 -0
  8. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/backward_time.png +0 -0
  9. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/cer.png +0 -0
  10. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/cer_ctc.png +0 -0
  11. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/forward_time.png +0 -0
  12. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/gpu_max_cached_mem_GB.png +0 -0
  13. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/iter_time.png +0 -0
  14. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/loss.png +0 -0
  15. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/loss_att.png +0 -0
  16. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/loss_ctc.png +0 -0
  17. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/optim0_lr0.png +0 -0
  18. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/optim_step_time.png +0 -0
  19. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/train_time.png +0 -0
  20. exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/wer.png +0 -0
  21. exp/lm_train_bpe250/config.yaml +373 -0
  22. exp/lm_train_bpe250/images/backward_time.png +0 -0
  23. exp/lm_train_bpe250/images/forward_time.png +0 -0
  24. exp/lm_train_bpe250/images/gpu_max_cached_mem_GB.png +0 -0
  25. exp/lm_train_bpe250/images/iter_time.png +0 -0
  26. exp/lm_train_bpe250/images/loss.png +0 -0
  27. exp/lm_train_bpe250/images/optim0_lr0.png +0 -0
  28. exp/lm_train_bpe250/images/optim_step_time.png +0 -0
  29. exp/lm_train_bpe250/images/train_time.png +0 -0
  30. exp/lm_train_bpe250/perplexity_test/ppl +1 -0
  31. exp/lm_train_bpe250/valid.loss.ave_10best.pth +3 -0
  32. meta.yaml +10 -0
README.md ADDED
@@ -0,0 +1,526 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - automatic-speech-recognition
6
+ language: noinfo
7
+ datasets:
8
+ - totonac
9
+ license: cc-by-4.0
10
+ ---
11
+
12
+ ## ESPnet2 ASR model
13
+
14
+ ### `espnet/ftshijt_espnet2_asr_totonac_transformer`
15
+
16
+ This model was trained by ftshijt using the totonac recipe in [espnet](https://github.com/espnet/espnet/).
17
+
18
+ ### Demo: How to use in ESPnet2
19
+
20
+ ```bash
21
+ cd espnet
22
+
23
+ pip install -e .
24
+ cd egs2/totonac/asr1
25
+ ./run.sh --skip_data_prep false --skip_train true --download_model espnet/ftshijt_espnet2_asr_totonac_transformer
26
+ ```
27
+
28
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
29
+ # RESULTS
30
+ ## Environments
31
+ - date: `Sun Nov 7 09:22:09 EST 2021`
32
+ - python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
33
+ - espnet version: `espnet 0.10.4a1`
34
+ - pytorch version: `pytorch 1.9.0`
35
+ - Git hash: ``
36
+ - Commit date: ``
37
+
38
+ ## asr_train_asr_transformer_specaug_raw_bpe250_sp
39
+ ### WER
40
+
41
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
42
+ |---|---|---|---|---|---|---|---|---|
43
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/dev|530|3547|59.8|32.9|7.3|6.5|46.7|87.4|
44
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/test|704|5018|55.5|35.7|8.8|6.1|50.6|92.0|
45
+
46
+ ### CER
47
+
48
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
49
+ |---|---|---|---|---|---|---|---|---|
50
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/dev|530|22510|88.1|4.4|7.4|3.9|15.8|87.4|
51
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/test|704|32990|86.9|4.3|8.8|4.0|17.1|92.0|
52
+
53
+ ### TER
54
+
55
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
56
+ |---|---|---|---|---|---|---|---|---|
57
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/dev|530|9360|70.3|15.8|13.8|4.3|34.0|87.4|
58
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/test|704|13835|70.5|16.0|13.6|4.4|33.9|92.0|
59
+
60
+ ## ASR config
61
+
62
+ <details><summary>expand</summary>
63
+
64
+ ```
65
+ config: conf/tuning/train_asr_transformer_specaug.yaml
66
+ print_config: false
67
+ log_level: INFO
68
+ dry_run: false
69
+ iterator_type: sequence
70
+ output_dir: exp/asr_train_asr_transformer_specaug_raw_bpe250_sp
71
+ ngpu: 1
72
+ seed: 0
73
+ num_workers: 1
74
+ num_att_plot: 3
75
+ dist_backend: nccl
76
+ dist_init_method: env://
77
+ dist_world_size: null
78
+ dist_rank: null
79
+ local_rank: 0
80
+ dist_master_addr: null
81
+ dist_master_port: null
82
+ dist_launcher: null
83
+ multiprocessing_distributed: false
84
+ unused_parameters: false
85
+ sharded_ddp: false
86
+ cudnn_enabled: true
87
+ cudnn_benchmark: false
88
+ cudnn_deterministic: true
89
+ collect_stats: false
90
+ write_collected_feats: false
91
+ max_epoch: 100
92
+ patience: 15
93
+ val_scheduler_criterion:
94
+ - valid
95
+ - loss
96
+ early_stopping_criterion:
97
+ - valid
98
+ - loss
99
+ - min
100
+ best_model_criterion:
101
+ - - valid
102
+ - acc
103
+ - max
104
+ keep_nbest_models: 10
105
+ grad_clip: 5
106
+ grad_clip_type: 2.0
107
+ grad_noise: false
108
+ accum_grad: 2
109
+ no_forward_run: false
110
+ resume: true
111
+ train_dtype: float32
112
+ use_amp: false
113
+ log_interval: null
114
+ use_tensorboard: true
115
+ use_wandb: false
116
+ wandb_project: null
117
+ wandb_id: null
118
+ wandb_entity: null
119
+ wandb_name: null
120
+ wandb_model_log_interval: -1
121
+ detect_anomaly: false
122
+ pretrain_path: null
123
+ init_param: []
124
+ ignore_init_mismatch: false
125
+ freeze_param: []
126
+ num_iters_per_epoch: null
127
+ batch_size: 32
128
+ valid_batch_size: null
129
+ batch_bins: 1000000
130
+ valid_batch_bins: null
131
+ train_shape_file:
132
+ - exp/asr_stats_raw_bpe250_sp/train/speech_shape
133
+ - exp/asr_stats_raw_bpe250_sp/train/text_shape.bpe
134
+ valid_shape_file:
135
+ - exp/asr_stats_raw_bpe250_sp/valid/speech_shape
136
+ - exp/asr_stats_raw_bpe250_sp/valid/text_shape.bpe
137
+ batch_type: folded
138
+ valid_batch_type: null
139
+ fold_length:
140
+ - 80000
141
+ - 150
142
+ sort_in_batch: descending
143
+ sort_batch: descending
144
+ multiple_iterator: false
145
+ chunk_length: 500
146
+ chunk_shift_ratio: 0.5
147
+ num_cache_chunks: 1024
148
+ train_data_path_and_name_and_type:
149
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/train_sp/wav.scp
150
+ - speech
151
+ - kaldi_ark
152
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/train_sp/text
153
+ - text
154
+ - text
155
+ valid_data_path_and_name_and_type:
156
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/dev/wav.scp
157
+ - speech
158
+ - kaldi_ark
159
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/dev/text
160
+ - text
161
+ - text
162
+ allow_variable_data_keys: false
163
+ max_cache_size: 0.0
164
+ max_cache_fd: 32
165
+ valid_max_cache_size: null
166
+ optim: adam
167
+ optim_conf:
168
+ lr: 1.0
169
+ scheduler: noamlr
170
+ scheduler_conf:
171
+ warmup_steps: 4000
172
+ token_list:
173
+ - <blank>
174
+ - <unk>
175
+ - ':'
176
+ - ▁N
177
+ - NI
178
+ - N
179
+ - ▁IYMA
180
+ - ▁NA
181
+ - NA
182
+ - ▁WA
183
+ - WA
184
+ - ▁
185
+ - ''''
186
+ - KA
187
+ - ▁MA
188
+ - MA
189
+ - T
190
+ - ▁XA
191
+ - TA
192
+ - NCHU
193
+ - WI
194
+ - ▁LI
195
+ - ▁NI
196
+ - PA
197
+ - YI
198
+ - ▁PUS
199
+ - K
200
+ - ▁PI
201
+ - ▁X
202
+ - S
203
+ - ▁TA
204
+ - YA
205
+ - ▁LA
206
+ - Q
207
+ - QA
208
+ - TI
209
+ - ▁KA
210
+ - QO
211
+ - W
212
+ - ▁KAH
213
+ - ▁PALA
214
+ - H
215
+ - X
216
+ - XA
217
+ - ▁KI
218
+ - A
219
+ - LH
220
+ - I
221
+ - LA
222
+ - ▁CHA
223
+ - ▁A
224
+ - ▁XLI
225
+ - ▁LHI
226
+ - U
227
+ - ▁K
228
+ - KANI
229
+ - KU
230
+ - Y
231
+ - ▁LU
232
+ - Á
233
+ - ▁CHU
234
+ - O
235
+ - KI
236
+ - ▁KIWI
237
+ - NTLA
238
+ - ▁TLA
239
+ - M
240
+ - ▁TAWA
241
+ - ▁TI
242
+ - ▁S
243
+ - WANI
244
+ - CHA
245
+ - LHI
246
+ - LI
247
+ - ▁TU
248
+ - ▁PALHA
249
+ - Í
250
+ - ▁CHANÁ
251
+ - ▁KILHWAMPA
252
+ - KÁN
253
+ - ▁WAYMA
254
+ - E
255
+ - SA
256
+ - ▁E
257
+ - ▁LHU
258
+ - LHA
259
+ - PU
260
+ - ▁LHA
261
+ - ▁PA
262
+ - ▁LAK
263
+ - ▁ANTA
264
+ - ▁KITI
265
+ - NCHÚ
266
+ - SI
267
+ - TLA
268
+ - PI
269
+ - ▁KINI
270
+ - CHI
271
+ - ▁PEROH
272
+ - ▁PU
273
+ - QÓ
274
+ - QALHCHIWINA
275
+ - TU
276
+ - ▁TLHA
277
+ - ▁WI
278
+ - NÁ
279
+ - ▁KAN
280
+ - ▁NAYI
281
+ - CH
282
+ - 'NO'
283
+ - ▁U
284
+ - TSA
285
+ - MÁ
286
+ - NQO
287
+ - ▁ANA
288
+ - ▁LIKWA
289
+ - ▁XTA
290
+ - J
291
+ - ▁QALH
292
+ - TO
293
+ - TÁ
294
+ - ▁USA
295
+ - ▁PORQUE
296
+ - ▁MI
297
+ - L
298
+ - ▁TAWÁ
299
+ - XI
300
+ - LHAQAPASA
301
+ - P
302
+ - CHIWI
303
+ - WÁ
304
+ - NTI
305
+ - ▁JKA
306
+ - Ú
307
+ - NTLHA
308
+ - R
309
+ - TSI
310
+ - C
311
+ - STA
312
+ - ▁LH
313
+ - LHU
314
+ - MPI
315
+ - ▁I
316
+ - ▁NILH
317
+ - ▁KATSI
318
+ - ▁LHAK
319
+ - MAKLHAKASKI
320
+ - ▁WANIKÁN
321
+ - ▁WIXI
322
+ - ▁TSI
323
+ - KÚ
324
+ - NÍ
325
+ - ▁PAKS
326
+ - NU
327
+ - TLHA
328
+ - YÁ
329
+ - KUCHAN
330
+ - XAQATLI
331
+ - ▁MAX
332
+ - ▁LAQAPASA
333
+ - ▁LAQ
334
+ - QALH
335
+ - KATSI
336
+ - Ó
337
+ - LAQAPASA
338
+ - ▁J
339
+ - ▁QAMA
340
+ - NTU
341
+ - MI
342
+ - KIWI
343
+ - ▁KIN
344
+ - ▁XANAT
345
+ - ▁CHI
346
+ - JA
347
+ - ▁IY
348
+ - ▁TSU
349
+ - MAKLAKAS
350
+ - ▁MAQA
351
+ - LÁ
352
+ - ▁KATSIYA
353
+ - ▁TLANKA
354
+ - ▁STAK
355
+ - ▁XLA
356
+ - ▁LHIKWA
357
+ - ▁SQA
358
+ - ▁P
359
+ - TAHNA
360
+ - ▁TLAQ
361
+ - ▁JKATSI
362
+ - MAKLAKASKINKA
363
+ - YÁW
364
+ - WATIYA
365
+ - CHÁ
366
+ - ▁IPORQUEI
367
+ - ▁AKXNI
368
+ - TSU
369
+ - ▁TSINÓ
370
+ - ▁STAKA
371
+ - ▁AKXNÍ
372
+ - LAKATA
373
+ - KATSÍ
374
+ - ▁XALHAK
375
+ - TLAWAYA
376
+ - SPUT
377
+ - ▁XATAWA
378
+ - QALHCHIWI
379
+ - PÁ
380
+ - JU
381
+ - ▁XAXANAT
382
+ - ▁PÉREZ
383
+ - ▁AKTSU
384
+ - ▁JKI
385
+ - NTÚ
386
+ - ▁KATSIYÁ
387
+ - ▁IESTEI
388
+ - LAQAPASÁ
389
+ - ▁MASKI
390
+ - ▁LAQSQATÁ
391
+ - ▁TLHANKA
392
+ - ▁WANIKANI
393
+ - ▁LÓPEZ
394
+ - MAKLAKASKINKÁN
395
+ - ▁ANTÁ
396
+ - ▁TACHIWÍ
397
+ - ▁SEBAST
398
+ - ▁CANO
399
+ - ▁XKUTNI
400
+ - ▁UKXILH
401
+ - TANKAH
402
+ - LAKASKINQO
403
+ - LAKAPASTAK
404
+ - ▁XCHACHAT
405
+ - TAKAWANÍ
406
+ - ▁TLÁ
407
+ - ▁TSINOH
408
+ - KAXTLAWA
409
+ - ▁NÚÑEZ
410
+ - ▁XLAKASKINKA
411
+ - ▁WÁTIYA
412
+ - ONCE
413
+ - Z
414
+ - É
415
+ - D
416
+ - Ñ
417
+ - V
418
+ - F
419
+ - G
420
+ - '1'
421
+ - B
422
+ - <sos/eos>
423
+ init: xavier_uniform
424
+ input_size: null
425
+ ctc_conf:
426
+ dropout_rate: 0.0
427
+ ctc_type: builtin
428
+ reduce: true
429
+ ignore_nan_grad: true
430
+ model_conf:
431
+ ctc_weight: 0.3
432
+ lsm_weight: 0.1
433
+ length_normalized_loss: false
434
+ use_preprocessor: true
435
+ token_type: bpe
436
+ bpemodel: data/token_list/bpe_unigram250/bpe.model
437
+ non_linguistic_symbols: null
438
+ cleaner: null
439
+ g2p: null
440
+ speech_volume_normalize: null
441
+ rir_scp: null
442
+ rir_apply_prob: 1.0
443
+ noise_scp: null
444
+ noise_apply_prob: 1.0
445
+ noise_db_range: '13_15'
446
+ frontend: default
447
+ frontend_conf:
448
+ fs: 16k
449
+ specaug: specaug
450
+ specaug_conf:
451
+ apply_time_warp: true
452
+ time_warp_window: 5
453
+ time_warp_mode: bicubic
454
+ apply_freq_mask: true
455
+ freq_mask_width_range:
456
+ - 0
457
+ - 30
458
+ num_freq_mask: 2
459
+ apply_time_mask: true
460
+ time_mask_width_range:
461
+ - 0
462
+ - 40
463
+ num_time_mask: 2
464
+ normalize: global_mvn
465
+ normalize_conf:
466
+ stats_file: exp/asr_stats_raw_bpe250_sp/train/feats_stats.npz
467
+ preencoder: null
468
+ preencoder_conf: {}
469
+ encoder: transformer
470
+ encoder_conf:
471
+ input_layer: conv2d
472
+ num_blocks: 12
473
+ linear_units: 2048
474
+ dropout_rate: 0.1
475
+ output_size: 256
476
+ attention_heads: 4
477
+ attention_dropout_rate: 0.0
478
+ postencoder: null
479
+ postencoder_conf: {}
480
+ decoder: transformer
481
+ decoder_conf:
482
+ input_layer: embed
483
+ num_blocks: 6
484
+ linear_units: 2048
485
+ dropout_rate: 0.1
486
+ required:
487
+ - output_dir
488
+ - token_list
489
+ version: 0.10.4a1
490
+ distributed: false
491
+ ```
492
+
493
+ </details>
494
+
495
+
496
+
497
+ ### Citing ESPnet
498
+
499
+ ```bibtex
500
+ @inproceedings{watanabe2018espnet,
501
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
502
+ title={{ESPnet}: End-to-End Speech Processing Toolkit},
503
+ year={2018},
504
+ booktitle={Proceedings of Interspeech},
505
+ pages={2207--2211},
506
+ doi={10.21437/Interspeech.2018-1456},
507
+ url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
508
+ }
509
+
510
+
511
+
512
+
513
+ ```
514
+
515
+ or arXiv:
516
+
517
+ ```bibtex
518
+ @misc{watanabe2018espnet,
519
+ title={ESPnet: End-to-End Speech Processing Toolkit},
520
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
521
+ year={2018},
522
+ eprint={1804.00015},
523
+ archivePrefix={arXiv},
524
+ primaryClass={cs.CL}
525
+ }
526
+ ```
data/token_list/bpe_unigram250/bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28c4aa9cc4fb4f2dcc54e7a91661189d4985730af7d75468f84baa98ceebd157
3
+ size 241202
exp/asr_stats_raw_bpe250_sp/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/73epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62e89e5b8cea7c5337d0945d576728edea3f495fc94e3212449028ee94aa6610
3
+ size 109361573
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/RESULTS.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Sun Nov 7 09:22:09 EST 2021`
5
+ - python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
6
+ - espnet version: `espnet 0.10.4a1`
7
+ - pytorch version: `pytorch 1.9.0`
8
+ - Git hash: ``
9
+ - Commit date: ``
10
+
11
+ ## asr_train_asr_transformer_specaug_raw_bpe250_sp
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/dev|530|3547|59.8|32.9|7.3|6.5|46.7|87.4|
17
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/test|704|5018|55.5|35.7|8.8|6.1|50.6|92.0|
18
+
19
+ ### CER
20
+
21
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
22
+ |---|---|---|---|---|---|---|---|---|
23
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/dev|530|22510|88.1|4.4|7.4|3.9|15.8|87.4|
24
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/test|704|32990|86.9|4.3|8.8|4.0|17.1|92.0|
25
+
26
+ ### TER
27
+
28
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
29
+ |---|---|---|---|---|---|---|---|---|
30
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/dev|530|9360|70.3|15.8|13.8|4.3|34.0|87.4|
31
+ |decode_asr_lm_lm_train_bpe250_valid.loss.ave_asr_model_valid.acc.best/test|704|13835|70.5|16.0|13.6|4.4|33.9|92.0|
32
+
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/config.yaml ADDED
@@ -0,0 +1,426 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_asr_transformer_specaug.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_asr_transformer_specaug_raw_bpe250_sp
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 100
28
+ patience: 15
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - acc
39
+ - max
40
+ keep_nbest_models: 10
41
+ grad_clip: 5
42
+ grad_clip_type: 2.0
43
+ grad_noise: false
44
+ accum_grad: 2
45
+ no_forward_run: false
46
+ resume: true
47
+ train_dtype: float32
48
+ use_amp: false
49
+ log_interval: null
50
+ use_tensorboard: true
51
+ use_wandb: false
52
+ wandb_project: null
53
+ wandb_id: null
54
+ wandb_entity: null
55
+ wandb_name: null
56
+ wandb_model_log_interval: -1
57
+ detect_anomaly: false
58
+ pretrain_path: null
59
+ init_param: []
60
+ ignore_init_mismatch: false
61
+ freeze_param: []
62
+ num_iters_per_epoch: null
63
+ batch_size: 32
64
+ valid_batch_size: null
65
+ batch_bins: 1000000
66
+ valid_batch_bins: null
67
+ train_shape_file:
68
+ - exp/asr_stats_raw_bpe250_sp/train/speech_shape
69
+ - exp/asr_stats_raw_bpe250_sp/train/text_shape.bpe
70
+ valid_shape_file:
71
+ - exp/asr_stats_raw_bpe250_sp/valid/speech_shape
72
+ - exp/asr_stats_raw_bpe250_sp/valid/text_shape.bpe
73
+ batch_type: folded
74
+ valid_batch_type: null
75
+ fold_length:
76
+ - 80000
77
+ - 150
78
+ sort_in_batch: descending
79
+ sort_batch: descending
80
+ multiple_iterator: false
81
+ chunk_length: 500
82
+ chunk_shift_ratio: 0.5
83
+ num_cache_chunks: 1024
84
+ train_data_path_and_name_and_type:
85
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/train_sp/wav.scp
86
+ - speech
87
+ - kaldi_ark
88
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/train_sp/text
89
+ - text
90
+ - text
91
+ valid_data_path_and_name_and_type:
92
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/dev/wav.scp
93
+ - speech
94
+ - kaldi_ark
95
+ - - /tmp/jiatong-7359.okvPvI3Z/raw/dev/text
96
+ - text
97
+ - text
98
+ allow_variable_data_keys: false
99
+ max_cache_size: 0.0
100
+ max_cache_fd: 32
101
+ valid_max_cache_size: null
102
+ optim: adam
103
+ optim_conf:
104
+ lr: 1.0
105
+ scheduler: noamlr
106
+ scheduler_conf:
107
+ warmup_steps: 4000
108
+ token_list:
109
+ - <blank>
110
+ - <unk>
111
+ - ':'
112
+ - ▁N
113
+ - NI
114
+ - N
115
+ - ▁IYMA
116
+ - ▁NA
117
+ - NA
118
+ - ▁WA
119
+ - WA
120
+ - ▁
121
+ - ''''
122
+ - KA
123
+ - ▁MA
124
+ - MA
125
+ - T
126
+ - ▁XA
127
+ - TA
128
+ - NCHU
129
+ - WI
130
+ - ▁LI
131
+ - ▁NI
132
+ - PA
133
+ - YI
134
+ - ▁PUS
135
+ - K
136
+ - ▁PI
137
+ - ▁X
138
+ - S
139
+ - ▁TA
140
+ - YA
141
+ - ▁LA
142
+ - Q
143
+ - QA
144
+ - TI
145
+ - ▁KA
146
+ - QO
147
+ - W
148
+ - ▁KAH
149
+ - ▁PALA
150
+ - H
151
+ - X
152
+ - XA
153
+ - ▁KI
154
+ - A
155
+ - LH
156
+ - I
157
+ - LA
158
+ - ▁CHA
159
+ - ▁A
160
+ - ▁XLI
161
+ - ▁LHI
162
+ - U
163
+ - ▁K
164
+ - KANI
165
+ - KU
166
+ - Y
167
+ - ▁LU
168
+ - Á
169
+ - ▁CHU
170
+ - O
171
+ - KI
172
+ - ▁KIWI
173
+ - NTLA
174
+ - ▁TLA
175
+ - M
176
+ - ▁TAWA
177
+ - ▁TI
178
+ - ▁S
179
+ - WANI
180
+ - CHA
181
+ - LHI
182
+ - LI
183
+ - ▁TU
184
+ - ▁PALHA
185
+ - Í
186
+ - ▁CHANÁ
187
+ - ▁KILHWAMPA
188
+ - KÁN
189
+ - ▁WAYMA
190
+ - E
191
+ - SA
192
+ - ▁E
193
+ - ▁LHU
194
+ - LHA
195
+ - PU
196
+ - ▁LHA
197
+ - ▁PA
198
+ - ▁LAK
199
+ - ▁ANTA
200
+ - ▁KITI
201
+ - NCHÚ
202
+ - SI
203
+ - TLA
204
+ - PI
205
+ - ▁KINI
206
+ - CHI
207
+ - ▁PEROH
208
+ - ▁PU
209
+ - QÓ
210
+ - QALHCHIWINA
211
+ - TU
212
+ - ▁TLHA
213
+ - ▁WI
214
+ - NÁ
215
+ - ▁KAN
216
+ - ▁NAYI
217
+ - CH
218
+ - 'NO'
219
+ - ▁U
220
+ - TSA
221
+ - MÁ
222
+ - NQO
223
+ - ▁ANA
224
+ - ▁LIKWA
225
+ - ▁XTA
226
+ - J
227
+ - ▁QALH
228
+ - TO
229
+ - TÁ
230
+ - ▁USA
231
+ - ▁PORQUE
232
+ - ▁MI
233
+ - L
234
+ - ▁TAWÁ
235
+ - XI
236
+ - LHAQAPASA
237
+ - P
238
+ - CHIWI
239
+ - WÁ
240
+ - NTI
241
+ - ▁JKA
242
+ - Ú
243
+ - NTLHA
244
+ - R
245
+ - TSI
246
+ - C
247
+ - STA
248
+ - ▁LH
249
+ - LHU
250
+ - MPI
251
+ - ▁I
252
+ - ▁NILH
253
+ - ▁KATSI
254
+ - ▁LHAK
255
+ - MAKLHAKASKI
256
+ - ▁WANIKÁN
257
+ - ▁WIXI
258
+ - ▁TSI
259
+ - KÚ
260
+ - NÍ
261
+ - ▁PAKS
262
+ - NU
263
+ - TLHA
264
+ - YÁ
265
+ - KUCHAN
266
+ - XAQATLI
267
+ - ▁MAX
268
+ - ▁LAQAPASA
269
+ - ▁LAQ
270
+ - QALH
271
+ - KATSI
272
+ - Ó
273
+ - LAQAPASA
274
+ - ▁J
275
+ - ▁QAMA
276
+ - NTU
277
+ - MI
278
+ - KIWI
279
+ - ▁KIN
280
+ - ▁XANAT
281
+ - ▁CHI
282
+ - JA
283
+ - ▁IY
284
+ - ▁TSU
285
+ - MAKLAKAS
286
+ - ▁MAQA
287
+ - LÁ
288
+ - ▁KATSIYA
289
+ - ▁TLANKA
290
+ - ▁STAK
291
+ - ▁XLA
292
+ - ▁LHIKWA
293
+ - ▁SQA
294
+ - ▁P
295
+ - TAHNA
296
+ - ▁TLAQ
297
+ - ▁JKATSI
298
+ - MAKLAKASKINKA
299
+ - YÁW
300
+ - WATIYA
301
+ - CHÁ
302
+ - ▁IPORQUEI
303
+ - ▁AKXNI
304
+ - TSU
305
+ - ▁TSINÓ
306
+ - ▁STAKA
307
+ - ▁AKXNÍ
308
+ - LAKATA
309
+ - KATSÍ
310
+ - ▁XALHAK
311
+ - TLAWAYA
312
+ - SPUT
313
+ - ▁XATAWA
314
+ - QALHCHIWI
315
+ - PÁ
316
+ - JU
317
+ - ▁XAXANAT
318
+ - ▁PÉREZ
319
+ - ▁AKTSU
320
+ - ▁JKI
321
+ - NTÚ
322
+ - ▁KATSIYÁ
323
+ - ▁IESTEI
324
+ - LAQAPASÁ
325
+ - ▁MASKI
326
+ - ▁LAQSQATÁ
327
+ - ▁TLHANKA
328
+ - ▁WANIKANI
329
+ - ▁LÓPEZ
330
+ - MAKLAKASKINKÁN
331
+ - ▁ANTÁ
332
+ - ▁TACHIWÍ
333
+ - ▁SEBAST
334
+ - ▁CANO
335
+ - ▁XKUTNI
336
+ - ▁UKXILH
337
+ - TANKAH
338
+ - LAKASKINQO
339
+ - LAKAPASTAK
340
+ - ▁XCHACHAT
341
+ - TAKAWANÍ
342
+ - ▁TLÁ
343
+ - ▁TSINOH
344
+ - KAXTLAWA
345
+ - ▁NÚÑEZ
346
+ - ▁XLAKASKINKA
347
+ - ▁WÁTIYA
348
+ - ONCE
349
+ - Z
350
+ - É
351
+ - D
352
+ - Ñ
353
+ - V
354
+ - F
355
+ - G
356
+ - '1'
357
+ - B
358
+ - <sos/eos>
359
+ init: xavier_uniform
360
+ input_size: null
361
+ ctc_conf:
362
+ dropout_rate: 0.0
363
+ ctc_type: builtin
364
+ reduce: true
365
+ ignore_nan_grad: true
366
+ model_conf:
367
+ ctc_weight: 0.3
368
+ lsm_weight: 0.1
369
+ length_normalized_loss: false
370
+ use_preprocessor: true
371
+ token_type: bpe
372
+ bpemodel: data/token_list/bpe_unigram250/bpe.model
373
+ non_linguistic_symbols: null
374
+ cleaner: null
375
+ g2p: null
376
+ speech_volume_normalize: null
377
+ rir_scp: null
378
+ rir_apply_prob: 1.0
379
+ noise_scp: null
380
+ noise_apply_prob: 1.0
381
+ noise_db_range: '13_15'
382
+ frontend: default
383
+ frontend_conf:
384
+ fs: 16k
385
+ specaug: specaug
386
+ specaug_conf:
387
+ apply_time_warp: true
388
+ time_warp_window: 5
389
+ time_warp_mode: bicubic
390
+ apply_freq_mask: true
391
+ freq_mask_width_range:
392
+ - 0
393
+ - 30
394
+ num_freq_mask: 2
395
+ apply_time_mask: true
396
+ time_mask_width_range:
397
+ - 0
398
+ - 40
399
+ num_time_mask: 2
400
+ normalize: global_mvn
401
+ normalize_conf:
402
+ stats_file: exp/asr_stats_raw_bpe250_sp/train/feats_stats.npz
403
+ preencoder: null
404
+ preencoder_conf: {}
405
+ encoder: transformer
406
+ encoder_conf:
407
+ input_layer: conv2d
408
+ num_blocks: 12
409
+ linear_units: 2048
410
+ dropout_rate: 0.1
411
+ output_size: 256
412
+ attention_heads: 4
413
+ attention_dropout_rate: 0.0
414
+ postencoder: null
415
+ postencoder_conf: {}
416
+ decoder: transformer
417
+ decoder_conf:
418
+ input_layer: embed
419
+ num_blocks: 6
420
+ linear_units: 2048
421
+ dropout_rate: 0.1
422
+ required:
423
+ - output_dir
424
+ - token_list
425
+ version: 0.10.4a1
426
+ distributed: false
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/acc.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/backward_time.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/cer.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/cer_ctc.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/forward_time.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/gpu_max_cached_mem_GB.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/iter_time.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/loss.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/loss_att.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/loss_ctc.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/optim0_lr0.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/optim_step_time.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/train_time.png ADDED
exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/images/wer.png ADDED
exp/lm_train_bpe250/config.yaml ADDED
@@ -0,0 +1,373 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: null
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/lm_train_bpe250
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 40
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - train
38
+ - loss
39
+ - min
40
+ - - valid
41
+ - loss
42
+ - min
43
+ - - train
44
+ - acc
45
+ - max
46
+ - - valid
47
+ - acc
48
+ - max
49
+ keep_nbest_models:
50
+ - 10
51
+ grad_clip: 5.0
52
+ grad_clip_type: 2.0
53
+ grad_noise: false
54
+ accum_grad: 1
55
+ no_forward_run: false
56
+ resume: true
57
+ train_dtype: float32
58
+ use_amp: false
59
+ log_interval: null
60
+ use_tensorboard: true
61
+ use_wandb: false
62
+ wandb_project: null
63
+ wandb_id: null
64
+ wandb_entity: null
65
+ wandb_name: null
66
+ wandb_model_log_interval: -1
67
+ detect_anomaly: false
68
+ pretrain_path: null
69
+ init_param: []
70
+ ignore_init_mismatch: false
71
+ freeze_param: []
72
+ num_iters_per_epoch: null
73
+ batch_size: 20
74
+ valid_batch_size: null
75
+ batch_bins: 1000000
76
+ valid_batch_bins: null
77
+ train_shape_file:
78
+ - exp/lm_stats_bpe250/train/text_shape.bpe
79
+ valid_shape_file:
80
+ - exp/lm_stats_bpe250/valid/text_shape.bpe
81
+ batch_type: folded
82
+ valid_batch_type: null
83
+ fold_length:
84
+ - 150
85
+ sort_in_batch: descending
86
+ sort_batch: descending
87
+ multiple_iterator: false
88
+ chunk_length: 500
89
+ chunk_shift_ratio: 0.5
90
+ num_cache_chunks: 1024
91
+ train_data_path_and_name_and_type:
92
+ - - dump/raw/lm_train.txt
93
+ - text
94
+ - text
95
+ valid_data_path_and_name_and_type:
96
+ - - dump/raw/dev/text
97
+ - text
98
+ - text
99
+ allow_variable_data_keys: false
100
+ max_cache_size: 0.0
101
+ max_cache_fd: 32
102
+ valid_max_cache_size: null
103
+ optim: adadelta
104
+ optim_conf: {}
105
+ scheduler: null
106
+ scheduler_conf: {}
107
+ token_list:
108
+ - <blank>
109
+ - <unk>
110
+ - ':'
111
+ - ▁N
112
+ - NI
113
+ - N
114
+ - ▁IYMA
115
+ - ▁NA
116
+ - NA
117
+ - ▁WA
118
+ - WA
119
+ - ▁
120
+ - ''''
121
+ - KA
122
+ - ▁MA
123
+ - MA
124
+ - T
125
+ - ▁XA
126
+ - TA
127
+ - NCHU
128
+ - WI
129
+ - ▁LI
130
+ - ▁NI
131
+ - PA
132
+ - YI
133
+ - ▁PUS
134
+ - K
135
+ - ▁PI
136
+ - ▁X
137
+ - S
138
+ - ▁TA
139
+ - YA
140
+ - ▁LA
141
+ - Q
142
+ - QA
143
+ - TI
144
+ - ▁KA
145
+ - QO
146
+ - W
147
+ - ▁KAH
148
+ - ▁PALA
149
+ - H
150
+ - X
151
+ - XA
152
+ - ▁KI
153
+ - A
154
+ - LH
155
+ - I
156
+ - LA
157
+ - ▁CHA
158
+ - ▁A
159
+ - ▁XLI
160
+ - ▁LHI
161
+ - U
162
+ - ▁K
163
+ - KANI
164
+ - KU
165
+ - Y
166
+ - ▁LU
167
+ - Á
168
+ - ▁CHU
169
+ - O
170
+ - KI
171
+ - ▁KIWI
172
+ - NTLA
173
+ - ▁TLA
174
+ - M
175
+ - ▁TAWA
176
+ - ▁TI
177
+ - ▁S
178
+ - WANI
179
+ - CHA
180
+ - LHI
181
+ - LI
182
+ - ▁TU
183
+ - ▁PALHA
184
+ - Í
185
+ - ▁CHANÁ
186
+ - ▁KILHWAMPA
187
+ - KÁN
188
+ - ▁WAYMA
189
+ - E
190
+ - SA
191
+ - ▁E
192
+ - ▁LHU
193
+ - LHA
194
+ - PU
195
+ - ▁LHA
196
+ - ▁PA
197
+ - ▁LAK
198
+ - ▁ANTA
199
+ - ▁KITI
200
+ - NCHÚ
201
+ - SI
202
+ - TLA
203
+ - PI
204
+ - ▁KINI
205
+ - CHI
206
+ - ▁PEROH
207
+ - ▁PU
208
+ - QÓ
209
+ - QALHCHIWINA
210
+ - TU
211
+ - ▁TLHA
212
+ - ▁WI
213
+ - NÁ
214
+ - ▁KAN
215
+ - ▁NAYI
216
+ - CH
217
+ - 'NO'
218
+ - ▁U
219
+ - TSA
220
+ - MÁ
221
+ - NQO
222
+ - ▁ANA
223
+ - ▁LIKWA
224
+ - ▁XTA
225
+ - J
226
+ - ▁QALH
227
+ - TO
228
+ - TÁ
229
+ - ▁USA
230
+ - ▁PORQUE
231
+ - ▁MI
232
+ - L
233
+ - ▁TAWÁ
234
+ - XI
235
+ - LHAQAPASA
236
+ - P
237
+ - CHIWI
238
+ - WÁ
239
+ - NTI
240
+ - ▁JKA
241
+ - Ú
242
+ - NTLHA
243
+ - R
244
+ - TSI
245
+ - C
246
+ - STA
247
+ - ▁LH
248
+ - LHU
249
+ - MPI
250
+ - ▁I
251
+ - ▁NILH
252
+ - ▁KATSI
253
+ - ▁LHAK
254
+ - MAKLHAKASKI
255
+ - ▁WANIKÁN
256
+ - ▁WIXI
257
+ - ▁TSI
258
+ - KÚ
259
+ - NÍ
260
+ - ▁PAKS
261
+ - NU
262
+ - TLHA
263
+ - YÁ
264
+ - KUCHAN
265
+ - XAQATLI
266
+ - ▁MAX
267
+ - ▁LAQAPASA
268
+ - ▁LAQ
269
+ - QALH
270
+ - KATSI
271
+ - Ó
272
+ - LAQAPASA
273
+ - ▁J
274
+ - ▁QAMA
275
+ - NTU
276
+ - MI
277
+ - KIWI
278
+ - ▁KIN
279
+ - ▁XANAT
280
+ - ▁CHI
281
+ - JA
282
+ - ▁IY
283
+ - ▁TSU
284
+ - MAKLAKAS
285
+ - ▁MAQA
286
+ - LÁ
287
+ - ▁KATSIYA
288
+ - ▁TLANKA
289
+ - ▁STAK
290
+ - ▁XLA
291
+ - ▁LHIKWA
292
+ - ▁SQA
293
+ - ▁P
294
+ - TAHNA
295
+ - ▁TLAQ
296
+ - ▁JKATSI
297
+ - MAKLAKASKINKA
298
+ - YÁW
299
+ - WATIYA
300
+ - CHÁ
301
+ - ▁IPORQUEI
302
+ - ▁AKXNI
303
+ - TSU
304
+ - ▁TSINÓ
305
+ - ▁STAKA
306
+ - ▁AKXNÍ
307
+ - LAKATA
308
+ - KATSÍ
309
+ - ▁XALHAK
310
+ - TLAWAYA
311
+ - SPUT
312
+ - ▁XATAWA
313
+ - QALHCHIWI
314
+ - PÁ
315
+ - JU
316
+ - ▁XAXANAT
317
+ - ▁PÉREZ
318
+ - ▁AKTSU
319
+ - ▁JKI
320
+ - NTÚ
321
+ - ▁KATSIYÁ
322
+ - ▁IESTEI
323
+ - LAQAPASÁ
324
+ - ▁MASKI
325
+ - ▁LAQSQATÁ
326
+ - ▁TLHANKA
327
+ - ▁WANIKANI
328
+ - ▁LÓPEZ
329
+ - MAKLAKASKINKÁN
330
+ - ▁ANTÁ
331
+ - ▁TACHIWÍ
332
+ - ▁SEBAST
333
+ - ▁CANO
334
+ - ▁XKUTNI
335
+ - ▁UKXILH
336
+ - TANKAH
337
+ - LAKASKINQO
338
+ - LAKAPASTAK
339
+ - ▁XCHACHAT
340
+ - TAKAWANÍ
341
+ - ▁TLÁ
342
+ - ▁TSINOH
343
+ - KAXTLAWA
344
+ - ▁NÚÑEZ
345
+ - ▁XLAKASKINKA
346
+ - ▁WÁTIYA
347
+ - ONCE
348
+ - Z
349
+ - É
350
+ - D
351
+ - Ñ
352
+ - V
353
+ - F
354
+ - G
355
+ - '1'
356
+ - B
357
+ - <sos/eos>
358
+ init: null
359
+ model_conf:
360
+ ignore_id: 0
361
+ use_preprocessor: true
362
+ token_type: bpe
363
+ bpemodel: data/token_list/bpe_unigram250/bpe.model
364
+ non_linguistic_symbols: null
365
+ cleaner: null
366
+ g2p: null
367
+ lm: seq_rnn
368
+ lm_conf: {}
369
+ required:
370
+ - output_dir
371
+ - token_list
372
+ version: 0.10.3a3
373
+ distributed: false
exp/lm_train_bpe250/images/backward_time.png ADDED
exp/lm_train_bpe250/images/forward_time.png ADDED
exp/lm_train_bpe250/images/gpu_max_cached_mem_GB.png ADDED
exp/lm_train_bpe250/images/iter_time.png ADDED
exp/lm_train_bpe250/images/loss.png ADDED
exp/lm_train_bpe250/images/optim0_lr0.png ADDED
exp/lm_train_bpe250/images/optim_step_time.png ADDED
exp/lm_train_bpe250/images/train_time.png ADDED
exp/lm_train_bpe250/perplexity_test/ppl ADDED
@@ -0,0 +1 @@
 
1
+ 18.3045965777891
exp/lm_train_bpe250/valid.loss.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b143d75fce3b31b97930dab08414419abaf4f90edca5797f22a5d8eb5b79e5c8
3
+ size 28385796
meta.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
1
+ espnet: 0.10.5a1
2
+ files:
3
+ asr_model_file: exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/73epoch.pth
4
+ lm_file: exp/lm_train_bpe250/valid.loss.ave_10best.pth
5
+ python: "3.9.7 (default, Sep 16 2021, 13:09:58) \n[GCC 7.5.0]"
6
+ timestamp: 1640102996.550734
7
+ torch: 1.9.0
8
+ yaml_files:
9
+ asr_train_config: exp/asr_train_asr_transformer_specaug_raw_bpe250_sp/config.yaml
10
+ lm_train_config: exp/lm_train_bpe250/config.yaml