qingzhengwang committed on
Commit
c597a56
·
1 Parent(s): c7a5ae2

Add model files

Browse files
exp/diar_stats_8k/train/feats_lengths_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:488ffa7ae62201b12edef41fc97c4787f5a6be32bb03725f551f376e0abb3301
3
+ size 778
exp/diar_stats_8k/train/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:398b81c5d3e1ee8674d9776150f59b1ecd02b61958485048f4589ce879e1de8a
3
+ size 946
exp/diar_stats_8k/train/speech_shape ADDED
The diff for this file is too large to render. See raw diff
 
exp/diar_stats_8k/train/spk_labels_shape ADDED
The diff for this file is too large to render. See raw diff
 
exp/diar_train_diar_raw/500epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1c456775d4e4ae3d9d9a2dbb5b02d956a6d003e94e7f41230de1463bdf1818f
3
+ size 8834948
exp/diar_train_diar_raw/RESULTS.md ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_diar_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Thu Dec 19 22:03:53 EST 2024`
5
+ - python version: `3.11.10 (main, Oct 3 2024, 07:29:13) [GCC 11.2.0]`
6
+ - espnet version: `espnet 202409`
7
+ - pytorch version: `pytorch 2.4.0`
8
+ - Git hash: `c12b3d59ca4fd8847edf274e56a1716474d2a30e`
9
+ - Commit date: `Thu Dec 19 21:58:26 2024 -0500`
10
+
11
+ ## diar_train_diar_raw
12
+ ### DER
13
+ diarized_test
14
+ |threshold_median_collar|DER|
15
+ |---|---|
16
+ |result_th0.3_med11_collar0.0|71.73|
17
+ |result_th0.3_med1_collar0.0|74.62|
18
+ |result_th0.4_med11_collar0.0|70.10|
19
+ |result_th0.4_med1_collar0.0|71.98|
20
+ |result_th0.5_med11_collar0.0|70.57|
21
+ |result_th0.5_med1_collar0.0|72.44|
22
+ |result_th0.6_med11_collar0.0|72.64|
23
+ |result_th0.6_med1_collar0.0|74.63|
24
+ |result_th0.7_med11_collar0.0|76.52|
25
+ |result_th0.7_med1_collar0.0|78.41|
26
+ ## diar_train_diar_raw
27
+ ### DER
28
+ diarized_dev
29
+ |threshold_median_collar|DER|
30
+ |---|---|
31
+ |result_th0.3_med11_collar0.0|75.88|
32
+ |result_th0.3_med1_collar0.0|78.21|
33
+ |result_th0.4_med11_collar0.0|71.45|
34
+ |result_th0.4_med1_collar0.0|73.32|
35
+ |result_th0.5_med11_collar0.0|70.53|
36
+ |result_th0.5_med1_collar0.0|72.34|
37
+ |result_th0.6_med11_collar0.0|72.03|
38
+ |result_th0.6_med1_collar0.0|73.96|
39
+ |result_th0.7_med11_collar0.0|76.66|
40
+ |result_th0.7_med1_collar0.0|78.33|
exp/diar_train_diar_raw/config.yaml ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_diar.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/diar_train_diar_raw
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 0
12
+ num_att_plot: 3
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: null
16
+ dist_rank: null
17
+ local_rank: 0
18
+ dist_master_addr: null
19
+ dist_master_port: null
20
+ dist_launcher: null
21
+ multiprocessing_distributed: false
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ cudnn_enabled: true
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ use_tf32: false
30
+ collect_stats: false
31
+ write_collected_feats: false
32
+ max_epoch: 500
33
+ patience: null
34
+ val_scheduler_criterion:
35
+ - valid
36
+ - loss
37
+ early_stopping_criterion:
38
+ - valid
39
+ - loss
40
+ - min
41
+ best_model_criterion:
42
+ - - valid
43
+ - acc
44
+ - max
45
+ keep_nbest_models: 10
46
+ nbest_averaging_interval: 0
47
+ grad_clip: 5
48
+ grad_clip_type: 2.0
49
+ grad_noise: false
50
+ accum_grad: 2
51
+ no_forward_run: false
52
+ resume: true
53
+ train_dtype: float32
54
+ use_amp: false
55
+ log_interval: null
56
+ use_matplotlib: true
57
+ use_tensorboard: true
58
+ create_graph_in_tensorboard: false
59
+ use_wandb: false
60
+ wandb_project: null
61
+ wandb_id: null
62
+ wandb_entity: null
63
+ wandb_name: null
64
+ wandb_model_log_interval: -1
65
+ detect_anomaly: false
66
+ use_adapter: false
67
+ adapter: lora
68
+ save_strategy: all
69
+ adapter_conf: {}
70
+ pretrain_path: null
71
+ init_param: []
72
+ ignore_init_mismatch: false
73
+ freeze_param: []
74
+ num_iters_per_epoch: null
75
+ batch_size: 64
76
+ valid_batch_size: 16
77
+ batch_bins: 1000000
78
+ valid_batch_bins: null
79
+ category_sample_size: 10
80
+ train_shape_file:
81
+ - exp/diar_stats_8k/train/speech_shape
82
+ - exp/diar_stats_8k/train/spk_labels_shape
83
+ valid_shape_file:
84
+ - exp/diar_stats_8k/valid/speech_shape
85
+ - exp/diar_stats_8k/valid/spk_labels_shape
86
+ batch_type: unsorted
87
+ valid_batch_type: unsorted
88
+ fold_length:
89
+ - 80000
90
+ - 800
91
+ sort_in_batch: descending
92
+ shuffle_within_batch: false
93
+ sort_batch: descending
94
+ multiple_iterator: false
95
+ chunk_length: 500
96
+ chunk_shift_ratio: 0.5
97
+ num_cache_chunks: 1024
98
+ chunk_excluded_key_prefixes: []
99
+ chunk_default_fs: null
100
+ chunk_max_abs_length: null
101
+ chunk_discard_short_samples: true
102
+ train_data_path_and_name_and_type:
103
+ - - dump/raw/train/wav.scp
104
+ - speech
105
+ - sound
106
+ - - dump/raw/train/espnet_rttm
107
+ - spk_labels
108
+ - rttm
109
+ valid_data_path_and_name_and_type:
110
+ - - dump/raw/dev/wav.scp
111
+ - speech
112
+ - sound
113
+ - - dump/raw/dev/espnet_rttm
114
+ - spk_labels
115
+ - rttm
116
+ multi_task_dataset: false
117
+ allow_variable_data_keys: false
118
+ max_cache_size: 0.0
119
+ max_cache_fd: 32
120
+ allow_multi_rates: false
121
+ valid_max_cache_size: null
122
+ exclude_weight_decay: false
123
+ exclude_weight_decay_conf: {}
124
+ optim: adam
125
+ optim_conf:
126
+ lr: 0.0002
127
+ scheduler: warmuplr
128
+ scheduler_conf:
129
+ warmup_steps: 100000
130
+ num_spk: 4
131
+ init: xavier_uniform
132
+ input_size: 322
133
+ model_conf:
134
+ diar_weight: 1.0
135
+ attractor_weight: 1.0
136
+ context_size: 7
137
+ subsampling: 10
138
+ use_preprocessor: true
139
+ frontend: default
140
+ frontend_conf:
141
+ fs: 8k
142
+ n_fft: 200
143
+ win_length: 200
144
+ hop_length: 128
145
+ n_mels: 23
146
+ specaug: specaug
147
+ specaug_conf:
148
+ apply_time_warp: false
149
+ apply_freq_mask: true
150
+ freq_mask_width_range:
151
+ - 0
152
+ - 30
153
+ num_freq_mask: 2
154
+ apply_time_mask: true
155
+ time_mask_width_range:
156
+ - 0
157
+ - 40
158
+ num_time_mask: 2
159
+ normalize: global_mvn
160
+ normalize_conf:
161
+ stats_file: exp/diar_stats_8k/train/feats_stats.npz
162
+ encoder: transformer
163
+ encoder_conf:
164
+ input_layer: linear
165
+ num_blocks: 4
166
+ linear_units: 512
167
+ dropout_rate: 0.1
168
+ output_size: 256
169
+ attention_heads: 4
170
+ attention_dropout_rate: 0.1
171
+ decoder: linear
172
+ decoder_conf: {}
173
+ label_aggregator: label_aggregator
174
+ label_aggregator_conf: {}
175
+ attractor: null
176
+ attractor_conf: {}
177
+ required:
178
+ - output_dir
179
+ version: '202409'
180
+ distributed: false
exp/diar_train_diar_raw/images/acc.png ADDED
exp/diar_train_diar_raw/images/backward_time.png ADDED
exp/diar_train_diar_raw/images/cf.png ADDED
exp/diar_train_diar_raw/images/clip.png ADDED
exp/diar_train_diar_raw/images/der.png ADDED
exp/diar_train_diar_raw/images/fa.png ADDED
exp/diar_train_diar_raw/images/forward_time.png ADDED
exp/diar_train_diar_raw/images/gpu_max_cached_mem_GB.png ADDED
exp/diar_train_diar_raw/images/grad_norm.png ADDED
exp/diar_train_diar_raw/images/iter_time.png ADDED
exp/diar_train_diar_raw/images/loss.png ADDED
exp/diar_train_diar_raw/images/loss_att.png ADDED
exp/diar_train_diar_raw/images/loss_pit.png ADDED
exp/diar_train_diar_raw/images/loss_scale.png ADDED
exp/diar_train_diar_raw/images/mi.png ADDED
exp/diar_train_diar_raw/images/optim0_lr0.png ADDED
exp/diar_train_diar_raw/images/optim_step_time.png ADDED
exp/diar_train_diar_raw/images/sad_fr.png ADDED
exp/diar_train_diar_raw/images/sad_mr.png ADDED
exp/diar_train_diar_raw/images/train_time.png ADDED