Wangyou Zhang committed on
Commit
90acba8
1 Parent(s): 04beea3

Add model files

Browse files
exp/enh_stats_16k/train/feats_stats.npz ADDED
Binary file (742 Bytes). View file
exp/enh_train_enh_dc_crn_mapping_snr_raw/33epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ff556700392793d13541bca5e37ef027da3df79ea9befbfb08d083a27806d1e
3
+ size 33734953
exp/enh_train_enh_dc_crn_mapping_snr_raw/RESULTS.md ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by ./scripts/utils/show_enh_score.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Tue Mar 29 02:31:59 CST 2022`
5
+ - python version: `3.8.12 (default, Oct 12 2021, 13:49:34) [GCC 7.5.0]`
6
+ - espnet version: `espnet 0.10.7a1`
7
+ - pytorch version: `pytorch 1.10.2+cu102`
8
+ - Git hash: `9c24b3adddbde3402530080cb58ae08a6f4dd642`
9
+ - Commit date: `Wed Feb 23 14:49:15 2022 -0500`
10
+
11
+
12
+ ## enh_train_enh_dc_crn_mapping_snr_raw
13
+
14
+ config: conf/tuning/train_enh_dc_crn_mapping_snr.yaml
15
+
16
+ |dataset|PESQ|STOI|SAR|SDR|SIR|SI_SNR|
17
+ |---|---|---|---|---|---|---|
18
+ |enhanced_dt05_simu_isolated_6ch_track|3.101|0.960|17.818|17.818|0.000|17.593|
19
+ |enhanced_et05_simu_isolated_6ch_track|2.946|0.948|17.334|17.334|0.000|17.041|
20
+
exp/enh_train_enh_dc_crn_mapping_snr_raw/config.yaml ADDED
@@ -0,0 +1,159 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_enh_dc_crn_mapping_snr.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: chunk
6
+ output_dir: exp/enh_train_enh_dc_crn_mapping_snr_raw
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 4
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 2
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 43524
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 200
28
+ patience: 10
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - si_snr
39
+ - max
40
+ - - valid
41
+ - loss
42
+ - min
43
+ keep_nbest_models: 1
44
+ nbest_averaging_interval: 0
45
+ grad_clip: 5
46
+ grad_clip_type: 2.0
47
+ grad_noise: false
48
+ accum_grad: 1
49
+ no_forward_run: false
50
+ resume: true
51
+ train_dtype: float32
52
+ use_amp: false
53
+ log_interval: null
54
+ use_matplotlib: true
55
+ use_tensorboard: true
56
+ use_wandb: false
57
+ wandb_project: null
58
+ wandb_id: null
59
+ wandb_entity: null
60
+ wandb_name: null
61
+ wandb_model_log_interval: -1
62
+ detect_anomaly: false
63
+ pretrain_path: null
64
+ init_param: []
65
+ ignore_init_mismatch: false
66
+ freeze_param: []
67
+ num_iters_per_epoch: null
68
+ batch_size: 16
69
+ valid_batch_size: null
70
+ batch_bins: 1000000
71
+ valid_batch_bins: null
72
+ train_shape_file:
73
+ - exp/enh_stats_16k/train/speech_mix_shape
74
+ - exp/enh_stats_16k/train/speech_ref1_shape
75
+ valid_shape_file:
76
+ - exp/enh_stats_16k/valid/speech_mix_shape
77
+ - exp/enh_stats_16k/valid/speech_ref1_shape
78
+ batch_type: folded
79
+ valid_batch_type: null
80
+ fold_length:
81
+ - 80000
82
+ - 80000
83
+ sort_in_batch: descending
84
+ sort_batch: descending
85
+ multiple_iterator: false
86
+ chunk_length: 32000
87
+ chunk_shift_ratio: 0.5
88
+ num_cache_chunks: 1024
89
+ train_data_path_and_name_and_type:
90
+ - - dump/raw/tr05_simu_isolated_6ch_track/wav.scp
91
+ - speech_mix
92
+ - sound
93
+ - - dump/raw/tr05_simu_isolated_6ch_track/spk1.scp
94
+ - speech_ref1
95
+ - sound
96
+ valid_data_path_and_name_and_type:
97
+ - - dump/raw/dt05_simu_isolated_6ch_track/wav.scp
98
+ - speech_mix
99
+ - sound
100
+ - - dump/raw/dt05_simu_isolated_6ch_track/spk1.scp
101
+ - speech_ref1
102
+ - sound
103
+ allow_variable_data_keys: false
104
+ max_cache_size: 0.0
105
+ max_cache_fd: 32
106
+ valid_max_cache_size: null
107
+ optim: adam
108
+ optim_conf:
109
+ lr: 0.001
110
+ eps: 1.0e-08
111
+ weight_decay: 1.0e-07
112
+ amsgrad: true
113
+ scheduler: steplr
114
+ scheduler_conf:
115
+ step_size: 2
116
+ gamma: 0.98
117
+ init: xavier_uniform
118
+ model_conf:
119
+ stft_consistency: false
120
+ loss_type: mask_mse
121
+ mask_type: null
122
+ criterions:
123
+ - name: snr
124
+ conf:
125
+ eps: 1.0e-07
126
+ wrapper: pit
127
+ wrapper_conf:
128
+ weight: 1.0
129
+ use_preprocessor: false
130
+ encoder: stft
131
+ encoder_conf:
132
+ n_fft: 256
133
+ hop_length: 128
134
+ separator: dc_crn
135
+ separator_conf:
136
+ num_spk: 1
137
+ input_channels:
138
+ - 10
139
+ - 16
140
+ - 32
141
+ - 64
142
+ - 128
143
+ - 256
144
+ enc_hid_channels: 8
145
+ enc_layers: 5
146
+ glstm_groups: 2
147
+ glstm_layers: 2
148
+ glstm_bidirectional: true
149
+ glstm_rearrange: false
150
+ mode: mapping
151
+ ref_channel: 3
152
+ decoder: stft
153
+ decoder_conf:
154
+ n_fft: 256
155
+ hop_length: 128
156
+ required:
157
+ - output_dir
158
+ version: 0.10.7a1
159
+ distributed: true
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/backward_time.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/forward_time.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/gpu_max_cached_mem_GB.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/iter_time.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/loss.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/optim0_lr0.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/optim_step_time.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/snr_loss.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/images/train_time.png ADDED
exp/enh_train_enh_dc_crn_mapping_snr_raw/valid.loss.best.pth ADDED
@@ -0,0 +1 @@
 
1
+ 33epoch.pth
meta.yaml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
1
+ espnet: 0.10.7a1
2
+ files:
3
+ model_file: exp/enh_train_enh_dc_crn_mapping_snr_raw/33epoch.pth
4
+ python: "3.8.12 (default, Oct 12 2021, 13:49:34) \n[GCC 7.5.0]"
5
+ timestamp: 1649679148.764176
6
+ torch: 1.10.2+cu102
7
+ yaml_files:
8
+ train_config: exp/enh_train_enh_dc_crn_mapping_snr_raw/config.yaml