huseinzol05 committed on
Commit
f6d1140
1 Parent(s): 9e634aa

Upload 2 files

Browse files
Files changed (2) hide show
  1. model_config.yaml +165 -0
  2. model_weights.ckpt +3 -0
model_config.yaml ADDED
@@ -0,0 +1,165 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ sample_rate: 16000
2
+ timesteps: 64
3
+ repeat: 2
4
+ dropout: 0.0
5
+ kernel_size_factor: 1.0
6
+ labels:
7
+ - background
8
+ - speech
9
+ train_ds:
10
+ vad_stream: false
11
+ manifest_filepath: /home/fjia/code/manifest64/train.json
12
+ sample_rate: 16000
13
+ labels:
14
+ - background
15
+ - speech
16
+ batch_size: 128
17
+ num_workers: 20
18
+ shuffle: true
19
+ augmentor:
20
+ shift:
21
+ prob: 0.8
22
+ min_shift_ms: -5.0
23
+ max_shift_ms: 5.0
24
+ white_noise:
25
+ prob: 0.8
26
+ min_level: -90
27
+ max_level: -46
28
+ validation_ds:
29
+ vad_stream: false
30
+ manifest_filepath: /home/fjia/code/manifest64/validation.json
31
+ sample_rate: 16000
32
+ labels:
33
+ - background
34
+ - speech
35
+ batch_size: 128
36
+ shuffle: false
37
+ val_loss_idx: 0
38
+ num_workers: 20
39
+ test_ds:
40
+ vad_stream: false
41
+ manifest_filepath: null
42
+ sample_rate: 16000
43
+ labels:
44
+ - background
45
+ - speech
46
+ batch_size: 128
47
+ shuffle: false
48
+ test_loss_idx: 0
49
+ num_workers: 20
50
+ preprocessor:
51
+ cls: nemo.collections.asr.modules.AudioToMFCCPreprocessor
52
+ params:
53
+ window_size: 0.025
54
+ window_stride: 0.01
55
+ window: hann
56
+ n_mels: 64
57
+ n_mfcc: 64
58
+ n_fft: 512
59
+ spec_augment:
60
+ cls: nemo.collections.asr.modules.SpectrogramAugmentation
61
+ params:
62
+ freq_masks: 2
63
+ time_masks: 2
64
+ freq_width: 15
65
+ time_width: 25
66
+ rect_masks: 5
67
+ rect_time: 25
68
+ rect_freq: 15
69
+ encoder:
70
+ cls: nemo.collections.asr.modules.ConvASREncoder
71
+ params:
72
+ feat_in: 64
73
+ activation: relu
74
+ conv_mask: true
75
+ jasper:
76
+ - filters: 128
77
+ repeat: 1
78
+ kernel:
79
+ - 11
80
+ stride:
81
+ - 1
82
+ dilation:
83
+ - 1
84
+ dropout: 0.0
85
+ residual: false
86
+ separable: true
87
+ kernel_size_factor: 1.0
88
+ - filters: 64
89
+ repeat: 2
90
+ kernel:
91
+ - 13
92
+ stride:
93
+ - 1
94
+ dilation:
95
+ - 1
96
+ dropout: 0.0
97
+ residual: true
98
+ separable: true
99
+ kernel_size_factor: 1.0
100
+ - filters: 64
101
+ repeat: 2
102
+ kernel:
103
+ - 15
104
+ stride:
105
+ - 1
106
+ dilation:
107
+ - 1
108
+ dropout: 0.0
109
+ residual: true
110
+ separable: true
111
+ kernel_size_factor: 1.0
112
+ - filters: 64
113
+ repeat: 2
114
+ kernel:
115
+ - 17
116
+ stride:
117
+ - 1
118
+ dilation:
119
+ - 1
120
+ dropout: 0.0
121
+ residual: true
122
+ separable: true
123
+ kernel_size_factor: 1.0
124
+ - filters: 128
125
+ repeat: 1
126
+ kernel:
127
+ - 29
128
+ stride:
129
+ - 1
130
+ dilation:
131
+ - 2
132
+ dropout: 0.0
133
+ residual: false
134
+ separable: true
135
+ kernel_size_factor: 1.0
136
+ - filters: 128
137
+ repeat: 1
138
+ kernel:
139
+ - 1
140
+ stride:
141
+ - 1
142
+ dilation:
143
+ - 1
144
+ dropout: 0.0
145
+ residual: false
146
+ decoder:
147
+ cls: nemo.collections.asr.modules.ConvASRDecoderClassification
148
+ params:
149
+ feat_in: 128
150
+ num_classes: 2
151
+ return_logits: true
152
+ pooling_type: avg
153
+ optim:
154
+ name: sgd
155
+ lr: 0.01
156
+ weight_decay: 0.001
157
+ sched:
158
+ name: PolynomialHoldDecayAnnealing
159
+ power: 2.0
160
+ warmup_ratio: 0.05
161
+ hold_ratio: 0.45
162
+ min_lr: 0.001
163
+ last_epoch: -1
164
+ momentum: 0.9
165
+ target: nemo.collections.asr.models.classification_models.EncDecClassificationModel
model_weights.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5211412b8e8d36c35dea9742289cc99ef327f98ecabd8259e36d618848ff0ca
3
+ size 481454