Yosuke Kashiwagi committed on
Commit
92a91e8
1 Parent(s): 3fb58dc

add up to 9 epochs.

Browse files
Files changed (30) hide show
  1. exp/bestrq_stats_raw_en/train/feats_lengths_stats.npz +0 -0
  2. exp/bestrq_stats_raw_en/train/feats_stats.npz +0 -0
  3. exp/bestrq_stats_raw_en/valid/feats_lengths_stats.npz +0 -0
  4. exp/bestrq_stats_raw_en/valid/feats_stats.npz +0 -0
  5. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/1epoch.pth +3 -0
  6. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/2epoch.pth +3 -0
  7. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/3epoch.pth +3 -0
  8. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/4epoch.pth +3 -0
  9. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/5epoch.pth +3 -0
  10. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/6epoch.pth +3 -0
  11. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/7epoch.pth +3 -0
  12. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/8epoch.pth +3 -0
  13. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/9epoch.pth +3 -0
  14. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/config.yaml +162 -0
  15. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/backward_time.png +0 -0
  16. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/forward_time.png +0 -0
  17. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/gpu_max_cached_mem_GB.png +0 -0
  18. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/iter_time.png +0 -0
  19. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/label_coverage.png +0 -0
  20. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/loss.png +0 -0
  21. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_acc.png +0 -0
  22. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_loss.png +0 -0
  23. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim0_lr0.png +0 -0
  24. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim_step_time.png +0 -0
  25. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/prediction_coverage.png +0 -0
  26. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/train_time.png +0 -0
  27. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_acc.png +0 -0
  28. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_loss.png +0 -0
  29. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/latest.pth +1 -0
  30. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/valid.masked_acc.best.pth +1 -0
exp/bestrq_stats_raw_en/train/feats_lengths_stats.npz ADDED
Binary file (778 Bytes). View file
 
exp/bestrq_stats_raw_en/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/bestrq_stats_raw_en/valid/feats_lengths_stats.npz ADDED
Binary file (778 Bytes). View file
 
exp/bestrq_stats_raw_en/valid/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/1epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0695cc3c45eb5939faf60b4d16ce9887668df054a37fcfd0cbfcd4e189e364d5
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/2epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:550e25732071e5b9c7f5806ebc6d89c88e45b241b12607ef0752caf9e59b9eec
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/3epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e5cb83fe0945168adfade85b039b3c38f3de6be93ff40a4a24af30c487f0743
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/4epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68bb0a19604a91a4506c52ae3213c6c6efea4214f4f4c193f63cfe10102f90c1
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/5epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0eac0949065e62fc1520768bd235a5f9c123b92c11838cab89554e8798a013d
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/6epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6004732a67b5dc0e9ae2f658c49f94d4b1963b8e3df4ad9c687ff515a77391ee
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/7epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf71204536e931dec0b2c97a9315c3e835e7ff4eaa2b004be7c8e5edbee0a873
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/8epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5deb80b4b3c4c64c5627cc718e0a41f2c43d82eecd5f5911041b1e855610300
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/9epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a5ec6f4e976e444c72a1177eb3793cf391c87dfcd322ef5fc2108cb45f4268a
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/config.yaml ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 4
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 44969
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: false
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 500
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - masked_acc
39
+ - max
40
+ keep_nbest_models: 300
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 8
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: true
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ use_wandb: false
54
+ wandb_project: null
55
+ wandb_id: null
56
+ wandb_entity: null
57
+ wandb_name: null
58
+ wandb_model_log_interval: -1
59
+ detect_anomaly: false
60
+ pretrain_path: null
61
+ init_param: []
62
+ ignore_init_mismatch: false
63
+ freeze_param: []
64
+ num_iters_per_epoch: null
65
+ batch_size: 256
66
+ valid_batch_size: null
67
+ batch_bins: 1000000
68
+ valid_batch_bins: null
69
+ train_shape_file:
70
+ - exp/bestrq_stats_raw_en/train/speech_shape
71
+ valid_shape_file:
72
+ - exp/bestrq_stats_raw_en/valid/speech_shape
73
+ batch_type: folded
74
+ valid_batch_type: null
75
+ fold_length:
76
+ - 80000
77
+ sort_in_batch: descending
78
+ sort_batch: descending
79
+ multiple_iterator: false
80
+ chunk_length: 500
81
+ chunk_shift_ratio: 0.5
82
+ num_cache_chunks: 1024
83
+ train_data_path_and_name_and_type:
84
+ - - dump/raw/train_60k/wav.scp
85
+ - speech
86
+ - sound
87
+ valid_data_path_and_name_and_type:
88
+ - - dump/raw/dev/wav.scp
89
+ - speech
90
+ - sound
91
+ allow_variable_data_keys: false
92
+ max_cache_size: 0.0
93
+ max_cache_fd: 32
94
+ valid_max_cache_size: null
95
+ optim: adam
96
+ optim_conf:
97
+ lr: 0.0001
98
+ scheduler: warmuplr
99
+ scheduler_conf:
100
+ warmup_steps: 30000
101
+ init: xavier_uniform
102
+ input_size: null
103
+ model_conf:
104
+ lsm_weight: 0.0
105
+ length_normalized_loss: false
106
+ vector_size: 16
107
+ codebook_size: 8192
108
+ temporal_reduction: 4
109
+ mask_prob: 0.01
110
+ mask_length: 40
111
+ unmasked_region_weight: 0
112
+ apply_l2_normalization: true
113
+ codebook_and_matrix_init_file: data/local/codebook_and_matrix_seed20220404.pth
114
+ frame_chunk_size: 3200
115
+ use_preprocessor: true
116
+ token_type: null
117
+ cleaner: null
118
+ speech_volume_normalize: null
119
+ rir_scp: null
120
+ rir_apply_prob: 1.0
121
+ noise_scp: null
122
+ noise_apply_prob: 1.0
123
+ noise_db_range: '13_15'
124
+ frontend: default
125
+ frontend_conf:
126
+ fs: 16k
127
+ n_fft: 512
128
+ win_length: 400
129
+ hop_length: 160
130
+ frontend_conf: null
131
+ apply_stft: true
132
+ specaug: null
133
+ specaug_conf: {}
134
+ normalize: global_mvn
135
+ normalize_conf:
136
+ stats_file: exp/bestrq_stats_raw_en/train/feats_stats.npz
137
+ preencoder: null
138
+ preencoder_conf: {}
139
+ encoder: conformer
140
+ encoder_conf:
141
+ output_size: 512
142
+ attention_heads: 8
143
+ linear_units: 2048
144
+ num_blocks: 17
145
+ dropout_rate: 0.1
146
+ positional_dropout_rate: 0.1
147
+ attention_dropout_rate: 0.1
148
+ input_layer: conv2d
149
+ normalize_before: true
150
+ macaron_style: true
151
+ rel_pos_type: latest
152
+ pos_enc_layer_type: rel_pos
153
+ selfattention_layer_type: rel_selfattn
154
+ activation_type: swish
155
+ use_cnn_module: true
156
+ cnn_module_kernel: 31
157
+ postencoder: null
158
+ postencoder_conf: {}
159
+ required:
160
+ - output_dir
161
+ version: 0.10.7a1
162
+ distributed: true
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/backward_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/forward_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/gpu_max_cached_mem_GB.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/iter_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/label_coverage.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/loss.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_acc.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_loss.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim0_lr0.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim_step_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/prediction_coverage.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/train_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_acc.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_loss.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/latest.pth ADDED
@@ -0,0 +1 @@
 
 
1
+ 9epoch.pth
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/valid.masked_acc.best.pth ADDED
@@ -0,0 +1 @@
 
 
1
+ 9epoch.pth