karthik committed on
Commit
ec498ec
1 Parent(s): ebddda9

Add model files

Browse files
Files changed (3) hide show
  1. RESULTS.md +29 -0
  2. config.yaml +236 -0
  3. valid.acc.ave_5best.pth +3 -0
RESULTS.md ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Tue Dec 21 23:42:15 EST 2021`
5
+ - python version: `3.9.5 (default, Jun 4 2021, 12:28:51) [GCC 7.5.0]`
6
+ - espnet version: `espnet 0.10.3a3`
7
+ - pytorch version: `pytorch 1.8.1+cu102`
8
+ - Git hash: `ea2174b5cef70a9b65a64980ef56283222283af2`
9
+ - Commit date: `Thu Sep 16 21:19:45 2021 +0900`
10
+
11
+ ## asr_train_asr_raw_en_word
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |inference_asr_model_valid.acc.ave_5best/test|762|15965|97.2|1.8|1.0|1.3|4.1|13.9|
17
+ |inference_asr_model_valid.acc.ave_5best/valid|763|15853|96.4|2.5|1.1|1.8|5.5|16.3|
18
+
19
+ ### CER
20
+
21
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
22
+ |---|---|---|---|---|---|---|---|---|
23
+ |inference_asr_model_valid.acc.ave_5best/test|762|41332|97.8|1.4|0.8|1.0|3.2|13.9|
24
+ |inference_asr_model_valid.acc.ave_5best/valid|763|41124|97.3|1.9|0.8|1.4|4.1|16.3|
25
+
26
+ ### TER
27
+
28
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
29
+ |---|---|---|---|---|---|---|---|---|
config.yaml ADDED
@@ -0,0 +1,236 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_asr.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_asr_raw_en_word
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 50
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - train
38
+ - loss
39
+ - min
40
+ - - valid
41
+ - loss
42
+ - min
43
+ - - train
44
+ - acc
45
+ - max
46
+ - - valid
47
+ - acc
48
+ - max
49
+ keep_nbest_models: 5
50
+ grad_clip: 5.0
51
+ grad_clip_type: 2.0
52
+ grad_noise: false
53
+ accum_grad: 1
54
+ no_forward_run: false
55
+ resume: true
56
+ train_dtype: float32
57
+ use_amp: false
58
+ log_interval: null
59
+ use_tensorboard: true
60
+ use_wandb: false
61
+ wandb_project: null
62
+ wandb_id: null
63
+ wandb_entity: null
64
+ wandb_name: null
65
+ wandb_model_log_interval: -1
66
+ detect_anomaly: false
67
+ pretrain_path: null
68
+ init_param: []
69
+ ignore_init_mismatch: false
70
+ freeze_param: []
71
+ num_iters_per_epoch: null
72
+ batch_size: 20
73
+ valid_batch_size: null
74
+ batch_bins: 1000000
75
+ valid_batch_bins: null
76
+ train_shape_file:
77
+ - exp/asr_stats_raw_en_word/train/speech_shape
78
+ - exp/asr_stats_raw_en_word/train/text_shape.word
79
+ valid_shape_file:
80
+ - exp/asr_stats_raw_en_word/valid/speech_shape
81
+ - exp/asr_stats_raw_en_word/valid/text_shape.word
82
+ batch_type: folded
83
+ valid_batch_type: null
84
+ fold_length:
85
+ - 80000
86
+ - 150
87
+ sort_in_batch: descending
88
+ sort_batch: descending
89
+ multiple_iterator: false
90
+ chunk_length: 500
91
+ chunk_shift_ratio: 0.5
92
+ num_cache_chunks: 1024
93
+ train_data_path_and_name_and_type:
94
+ - - dump/raw/train/wav.scp
95
+ - speech
96
+ - sound
97
+ - - dump/raw/train/text
98
+ - text
99
+ - text
100
+ valid_data_path_and_name_and_type:
101
+ - - dump/raw/valid/wav.scp
102
+ - speech
103
+ - sound
104
+ - - dump/raw/valid/text
105
+ - text
106
+ - text
107
+ allow_variable_data_keys: false
108
+ max_cache_size: 0.0
109
+ max_cache_fd: 32
110
+ valid_max_cache_size: null
111
+ optim: adam
112
+ optim_conf:
113
+ lr: 0.0002
114
+ scheduler: warmuplr
115
+ scheduler_conf:
116
+ warmup_steps: 25000
117
+ token_list:
118
+ - <blank>
119
+ - <unk>
120
+ - ්
121
+ - න
122
+ - ම
123
+ - ක
124
+ - ල
125
+ - ි
126
+ - ු
127
+ - ග
128
+ - ේ
129
+ - ර
130
+ - ත
131
+ - ද
132
+ - ව
133
+ - ට
134
+ - ඕ
135
+ - ී
136
+ - ප
137
+ - ය
138
+ - ෙ
139
+ - ස
140
+ - ණ
141
+ - ා
142
+ - ැ
143
+ - RequestAcc.balance
144
+ - Moneywithdraw
145
+ - Moneydeposit
146
+ - Moneytransfer
147
+ - Billpayments
148
+ - බ
149
+ - ඉ
150
+ - ශ
151
+ - ෂ
152
+ - ඩ
153
+ - Creditcardpayments
154
+ - එ
155
+ - ‍
156
+ - හ
157
+ - <sos/eos>
158
+ init: null
159
+ input_size: null
160
+ ctc_conf:
161
+ dropout_rate: 0.0
162
+ ctc_type: builtin
163
+ reduce: true
164
+ ignore_nan_grad: true
165
+ model_conf:
166
+ ctc_weight: 0.5
167
+ ignore_id: -1
168
+ lsm_weight: 0.0
169
+ length_normalized_loss: false
170
+ report_cer: true
171
+ report_wer: true
172
+ sym_space: <space>
173
+ sym_blank: <blank>
174
+ extract_feats_in_collect_stats: true
175
+ use_preprocessor: true
176
+ token_type: word
177
+ bpemodel: null
178
+ non_linguistic_symbols: null
179
+ cleaner: null
180
+ g2p: null
181
+ speech_volume_normalize: null
182
+ rir_scp: null
183
+ rir_apply_prob: 1.0
184
+ noise_scp: null
185
+ noise_apply_prob: 1.0
186
+ noise_db_range: '13_15'
187
+ frontend: default
188
+ frontend_conf:
189
+ fs: 16k
190
+ specaug: specaug
191
+ specaug_conf:
192
+ apply_time_warp: true
193
+ time_warp_window: 5
194
+ time_warp_mode: bicubic
195
+ apply_freq_mask: true
196
+ freq_mask_width_range:
197
+ - 0
198
+ - 30
199
+ num_freq_mask: 2
200
+ apply_time_mask: true
201
+ time_mask_width_range:
202
+ - 0
203
+ - 40
204
+ num_time_mask: 2
205
+ normalize: global_mvn
206
+ normalize_conf:
207
+ stats_file: exp/asr_stats_raw_en_word/train/feats_stats.npz
208
+ preencoder: null
209
+ preencoder_conf: {}
210
+ encoder: transformer
211
+ encoder_conf:
212
+ output_size: 256
213
+ attention_heads: 4
214
+ linear_units: 2048
215
+ num_blocks: 12
216
+ dropout_rate: 0.1
217
+ positional_dropout_rate: 0.1
218
+ attention_dropout_rate: 0.0
219
+ input_layer: conv2d
220
+ normalize_before: true
221
+ postencoder: null
222
+ postencoder_conf: {}
223
+ decoder: transformer
224
+ decoder_conf:
225
+ attention_heads: 4
226
+ linear_units: 2048
227
+ num_blocks: 6
228
+ dropout_rate: 0.1
229
+ positional_dropout_rate: 0.1
230
+ self_attention_dropout_rate: 0.0
231
+ src_attention_dropout_rate: 0.0
232
+ required:
233
+ - output_dir
234
+ - token_list
235
+ version: 0.10.3a3
236
+ distributed: false
valid.acc.ave_5best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e4e65289c3034a145acb2899d0884f19cf7d8bf259da45728c5945a9c744c8e
3
+ size 108718541