Zhaoheng
/

tfgridnet_dns_ins20_epoch33

Model card | Files and versions | Community

Zhaoheng Ni committed on Mar 21

Commit

667c73d

•

1 Parent(s): e384c0a

add model

Browse files

Files changed (17) hide show

exp/enh_train_enh_tfgrid_raw/33epoch.pth +3 -0
exp/enh_train_enh_tfgrid_raw/RESULTS.md +21 -0
exp/enh_train_enh_tfgrid_raw/config.yaml +203 -0
exp/enh_train_enh_tfgrid_raw/images/backward_time.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/clip.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/forward_time.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/gpu_max_cached_mem_GB.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/grad_norm.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/iter_time.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/l1_timedomain+magspec_loss.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/loss.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/loss_scale.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/optim0_lr0.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/optim_step_time.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/si_snr_loss.png +0 -0
exp/enh_train_enh_tfgrid_raw/images/train_time.png +0 -0
meta.yaml +8 -0

exp/enh_train_enh_tfgrid_raw/33epoch.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:613db9fb4dafa7860d9e1390ec8f6bb61bba62cc0a67482bebcfbd0221d865c3
+size 10332558

exp/enh_train_enh_tfgrid_raw/RESULTS.md ADDED Viewed

	@@ -0,0 +1,21 @@

+<!-- Generated by ./scripts/utils/show_enh_score.sh -->
+# RESULTS
+## Environments
+- date: `Wed Mar  6 01:29:02 UTC 2024`
+- python version: `3.10.10 (main, Mar 21 2023, 18:45:11) [GCC 11.2.0]`
+- espnet version: `espnet 202308`
+- pytorch version: `pytorch 2.1.0+cu118`
+- Git hash: `60ce18efa06ca5a5922534682f47e2107ef88b13`
+  - Commit date: `Wed Sep 6 10:17:57 2023 -0700`
+## enh_train_enh_tfgrid_raw
+config: ./conf/tuning/train_enh_tfgrid.yaml
+|dataset|PESQ_WB|STOI|SAR|SDR|SIR|SI_SNR|
+|---|---|---|---|---|---|---|
+|enhanced_cv_synthetic|3.61|99.06|26.04|26.04|0.00|26.44|
+|enhanced_tt_synthetic_no_reverb|3.32|97.88|20.18|20.18|0.00|20.17|
+|enhanced_tt_synthetic_with_reverb|2.79|91.75|15.54|15.54|0.00|15.06|

exp/enh_train_enh_tfgrid_raw/config.yaml ADDED Viewed

	@@ -0,0 +1,203 @@

+config: ./conf/tuning/train_enh_tfgrid.yaml
+print_config: false
+log_level: INFO
+drop_last_iter: false
+dry_run: false
+iterator_type: chunk
+valid_iterator_type: null
+output_dir: exp/enh_train_enh_tfgrid_raw
+ngpu: 1
+seed: 0
+num_workers: 8
+num_att_plot: 3
+dist_backend: nccl
+dist_init_method: env://
+dist_world_size: null
+dist_rank: null
+local_rank: 0
+dist_master_addr: null
+dist_master_port: null
+dist_launcher: null
+multiprocessing_distributed: false
+unused_parameters: false
+sharded_ddp: false
+cudnn_enabled: true
+cudnn_benchmark: false
+cudnn_deterministic: true
+collect_stats: false
+write_collected_feats: false
+max_epoch: 200
+patience: 5
+val_scheduler_criterion:
+- valid
+- loss
+early_stopping_criterion:
+- valid
+- loss
+- min
+best_model_criterion:
+-   - valid
+    - si_snr
+    - max
+-   - valid
+    - loss
+    - min
+keep_nbest_models: 5
+nbest_averaging_interval: 0
+grad_clip: 5.0
+grad_clip_type: 2.0
+grad_noise: false
+accum_grad: 1
+no_forward_run: false
+resume: true
+train_dtype: float32
+use_amp: false
+log_interval: null
+use_matplotlib: true
+use_tensorboard: true
+create_graph_in_tensorboard: false
+use_wandb: false
+wandb_project: null
+wandb_id: null
+wandb_entity: null
+wandb_name: null
+wandb_model_log_interval: -1
+detect_anomaly: false
+pretrain_path: null
+init_param: []
+ignore_init_mismatch: false
+freeze_param: []
+num_iters_per_epoch: 5000
+batch_size: 2
+valid_batch_size: null
+batch_bins: 1000000
+valid_batch_bins: null
+train_shape_file:
+- exp/enh_stats_16k/train/speech_mix_shape
+- exp/enh_stats_16k/train/speech_ref1_shape
+- exp/enh_stats_16k/train/noise_ref1_shape
+valid_shape_file:
+- exp/enh_stats_16k/valid/speech_mix_shape
+- exp/enh_stats_16k/valid/speech_ref1_shape
+- exp/enh_stats_16k/valid/noise_ref1_shape
+batch_type: folded
+valid_batch_type: null
+fold_length:
+- 80000
+- 80000
+- 80000
+sort_in_batch: descending
+shuffle_within_batch: false
+sort_batch: descending
+multiple_iterator: false
+chunk_length: 48000
+chunk_shift_ratio: 0.5
+num_cache_chunks: 1024
+chunk_excluded_key_prefixes: []
+train_data_path_and_name_and_type:
+-   - dump/raw/tr_synthetic/wav.scp
+    - speech_mix
+    - sound
+-   - dump/raw/tr_synthetic/spk1.scp
+    - speech_ref1
+    - sound
+-   - dump/raw/tr_synthetic/noise1.scp
+    - noise_ref1
+    - sound
+valid_data_path_and_name_and_type:
+-   - dump/raw/cv_synthetic/wav.scp
+    - speech_mix
+    - sound
+-   - dump/raw/cv_synthetic/spk1.scp
+    - speech_ref1
+    - sound
+-   - dump/raw/cv_synthetic/noise1.scp
+    - noise_ref1
+    - sound
+allow_variable_data_keys: false
+max_cache_size: 0.0
+max_cache_fd: 32
+valid_max_cache_size: null
+exclude_weight_decay: false
+exclude_weight_decay_conf: {}
+optim: adam
+optim_conf:
+    lr: 0.001
+    eps: 1.0e-08
+    weight_decay: 0
+scheduler: reducelronplateau
+scheduler_conf:
+    mode: min
+    factor: 0.7
+    patience: 1
+init: xavier_uniform
+model_conf:
+    stft_consistency: false
+    loss_type: mask_mse
+    mask_type: null
+    extract_feats_in_collect_stats: false
+criterions:
+-   name: mr_l1_tfd
+    conf:
+        window_sz:
+        - 256
+        - 512
+        - 768
+        - 1024
+        hop_sz: null
+        eps: 1.0e-08
+        time_domain_weight: 0.5
+    wrapper: fixed_order
+    wrapper_conf:
+        weight: 1.0
+-   name: si_snr
+    conf:
+        eps: 1.0e-07
+    wrapper: fixed_order
+    wrapper_conf:
+        weight: 0.0
+speech_volume_normalize: null
+rir_scp: null
+rir_apply_prob: 1.0
+noise_scp: null
+noise_apply_prob: 1.0
+noise_db_range: '13_15'
+short_noise_thres: 0.5
+use_reverberant_ref: false
+num_spk: 1
+num_noise_type: 1
+sample_rate: 8000
+force_single_channel: false
+channel_reordering: false
+categories: []
+dynamic_mixing: false
+utt2spk: null
+dynamic_mixing_gain_db: 0.0
+encoder: same
+encoder_conf: {}
+separator: tfgridnet
+separator_conf:
+    n_srcs: 1
+    n_fft: 512
+    stride: 256
+    window: hann
+    n_imics: 1
+    n_layers: 4
+    lstm_hidden_units: 128
+    attn_n_head: 4
+    attn_approx_qk_dim: 512
+    emb_dim: 32
+    emb_ks: 4
+    emb_hs: 4
+    activation: prelu
+    eps: 1.0e-05
+decoder: same
+decoder_conf: {}
+mask_module: multi_mask
+mask_module_conf: {}
+preprocessor: null
+preprocessor_conf: {}
+required:
+- output_dir
+version: '202308'
+distributed: false

exp/enh_train_enh_tfgrid_raw/images/backward_time.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/clip.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/forward_time.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/gpu_max_cached_mem_GB.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/grad_norm.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/iter_time.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/l1_timedomain+magspec_loss.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/loss.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/loss_scale.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/optim0_lr0.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/optim_step_time.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/si_snr_loss.png ADDED Viewed

exp/enh_train_enh_tfgrid_raw/images/train_time.png ADDED Viewed

meta.yaml ADDED Viewed

	@@ -0,0 +1,8 @@

+espnet: '202308'
+files:
+  model_file: exp/enh_train_enh_tfgrid_raw/33epoch.pth
+python: 3.10.10 (main, Mar 21 2023, 18:45:11) [GCC 11.2.0]
+timestamp: 1711033647.373215
+torch: 2.1.0+cu118
+yaml_files:
+  train_config: exp/enh_train_enh_tfgrid_raw/config.yaml