viks66 committed on
Commit
2611e57
1 Parent(s): c2c2993
exp/asr_train_asr_conformer6_n_fft400_hop_length160_raw_bn_char/config.yaml ADDED
@@ -0,0 +1,274 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_asr_conformer6_n_fft400_hop_length160.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_asr_conformer6_n_fft400_hop_length160_raw_bn_char
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 2
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 41903
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 35
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - acc
39
+ - max
40
+ keep_nbest_models: 3
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: false
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ create_graph_in_tensorboard: false
54
+ use_wandb: false
55
+ wandb_project: null
56
+ wandb_id: null
57
+ wandb_entity: null
58
+ wandb_name: null
59
+ wandb_model_log_interval: -1
60
+ detect_anomaly: false
61
+ pretrain_path: null
62
+ init_param: []
63
+ ignore_init_mismatch: false
64
+ freeze_param: []
65
+ num_iters_per_epoch: null
66
+ batch_size: 20
67
+ valid_batch_size: null
68
+ batch_bins: 4000000
69
+ valid_batch_bins: null
70
+ train_shape_file:
71
+ - exp/asr_stats_raw_bn_char/train/speech_shape
72
+ - exp/asr_stats_raw_bn_char/train/text_shape.char
73
+ valid_shape_file:
74
+ - exp/asr_stats_raw_bn_char/valid/speech_shape
75
+ - exp/asr_stats_raw_bn_char/valid/text_shape.char
76
+ batch_type: numel
77
+ valid_batch_type: null
78
+ fold_length:
79
+ - 80000
80
+ - 150
81
+ sort_in_batch: descending
82
+ sort_batch: descending
83
+ multiple_iterator: false
84
+ chunk_length: 500
85
+ chunk_shift_ratio: 0.5
86
+ num_cache_chunks: 1024
87
+ train_data_path_and_name_and_type:
88
+ - - dump/raw/bn/train/wav.scp
89
+ - speech
90
+ - sound
91
+ - - dump/raw/bn/train/text
92
+ - text
93
+ - text
94
+ valid_data_path_and_name_and_type:
95
+ - - dump/raw/bn/dev/wav.scp
96
+ - speech
97
+ - sound
98
+ - - dump/raw/bn/dev/text
99
+ - text
100
+ - text
101
+ allow_variable_data_keys: false
102
+ max_cache_size: 0.0
103
+ max_cache_fd: 32
104
+ valid_max_cache_size: null
105
+ exclude_weight_decay: false
106
+ exclude_weight_decay_conf: {}
107
+ optim: adam
108
+ optim_conf:
109
+ lr: 0.0015
110
+ scheduler: warmuplr
111
+ scheduler_conf:
112
+ warmup_steps: 25000
113
+ token_list:
114
+ - <blank>
115
+ - <unk>
116
+ - <space>
117
+ - ा
118
+ - े
119
+ - क
120
+ - र
121
+ - ल
122
+ - स
123
+ - न
124
+ - म
125
+ - त
126
+ - ी
127
+ - ि
128
+ - ह
129
+ - ब
130
+ - ्
131
+ - प
132
+ - व
133
+ - ो
134
+ - ज
135
+ - ं
136
+ - ख
137
+ - द
138
+ - य
139
+ - ग
140
+ - ट
141
+ - ई
142
+ - ु
143
+ - इ
144
+ - च
145
+ - अ
146
+ - आ
147
+ - उ
148
+ - ू
149
+ - भ
150
+ - ए
151
+ - ै
152
+ - फ
153
+ - ध
154
+ - ड
155
+ - श
156
+ - ड़
157
+ - ौ
158
+ - .
159
+ - ण
160
+ - छ
161
+ - ष
162
+ - थ
163
+ - ढ़
164
+ - ओ
165
+ - ठ
166
+ - घ
167
+ - ृ
168
+ - ॉ
169
+ - ऑ
170
+ - ँ
171
+ - ऋ
172
+ - औ
173
+ - ढ
174
+ - ऊ
175
+ - ज़
176
+ - झ
177
+ - फ़
178
+ - ऐ
179
+ - ऽ
180
+ - ञ
181
+ - ़
182
+ - ख़
183
+ - क़
184
+ - ॅ
185
+ - ः
186
+ - ऱ
187
+ - <sos/eos>
188
+ init: null
189
+ input_size: null
190
+ ctc_conf:
191
+ dropout_rate: 0.0
192
+ ctc_type: builtin
193
+ reduce: true
194
+ ignore_nan_grad: null
195
+ zero_infinity: true
196
+ joint_net_conf: null
197
+ use_preprocessor: true
198
+ token_type: char
199
+ bpemodel: null
200
+ non_linguistic_symbols: null
201
+ cleaner: null
202
+ g2p: null
203
+ speech_volume_normalize: null
204
+ rir_scp: null
205
+ rir_apply_prob: 1.0
206
+ noise_scp: null
207
+ noise_apply_prob: 1.0
208
+ noise_db_range: '13_15'
209
+ short_noise_thres: 0.5
210
+ frontend: default
211
+ frontend_conf:
212
+ n_fft: 400
213
+ hop_length: 160
214
+ fs: 16k
215
+ specaug: specaug
216
+ specaug_conf:
217
+ apply_time_warp: true
218
+ time_warp_window: 5
219
+ time_warp_mode: bicubic
220
+ apply_freq_mask: true
221
+ freq_mask_width_range:
222
+ - 0
223
+ - 30
224
+ num_freq_mask: 2
225
+ apply_time_mask: true
226
+ time_mask_width_range:
227
+ - 0
228
+ - 40
229
+ num_time_mask: 2
230
+ normalize: global_mvn
231
+ normalize_conf:
232
+ stats_file: exp/asr_stats_raw_bn_char/train/feats_stats.npz
233
+ model: espnet
234
+ model_conf:
235
+ ctc_weight: 0.3
236
+ lsm_weight: 0.1
237
+ length_normalized_loss: false
238
+ preencoder: null
239
+ preencoder_conf: {}
240
+ encoder: conformer
241
+ encoder_conf:
242
+ output_size: 512
243
+ attention_heads: 8
244
+ linear_units: 2048
245
+ num_blocks: 12
246
+ dropout_rate: 0.1
247
+ positional_dropout_rate: 0.1
248
+ attention_dropout_rate: 0.1
249
+ input_layer: conv2d
250
+ normalize_before: true
251
+ macaron_style: true
252
+ pos_enc_layer_type: rel_pos
253
+ selfattention_layer_type: rel_selfattn
254
+ activation_type: swish
255
+ use_cnn_module: true
256
+ cnn_module_kernel: 31
257
+ postencoder: null
258
+ postencoder_conf: {}
259
+ decoder: transformer
260
+ decoder_conf:
261
+ attention_heads: 8
262
+ linear_units: 2048
263
+ num_blocks: 6
264
+ dropout_rate: 0.1
265
+ positional_dropout_rate: 0.1
266
+ self_attention_dropout_rate: 0.1
267
+ src_attention_dropout_rate: 0.1
268
+ preprocessor: default
269
+ preprocessor_conf: {}
270
+ required:
271
+ - output_dir
272
+ - token_list
273
+ version: '202211'
274
+ distributed: true
exp/asr_train_asr_conformer6_n_fft400_hop_length160_raw_bn_char/valid.acc.ave_3best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa1a155c7b7184072d3feaeded51297450e5d830326dabf0b28b8cbec0a0491a
3
+ size 434598181