Yosuke Kashiwagi committed on
Commit
603c5f7
1 Parent(s): 71180cb

Add 20-22 epochs

Browse files
Files changed (24) hide show
  1. exp/bestrq_stats_raw_en/train/feats_lengths_stats.npz +0 -0
  2. exp/bestrq_stats_raw_en/train/feats_stats.npz +0 -0
  3. exp/bestrq_stats_raw_en/valid/feats_lengths_stats.npz +0 -0
  4. exp/bestrq_stats_raw_en/valid/feats_stats.npz +0 -0
  5. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/20epoch.pth +3 -0
  6. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/21epoch.pth +3 -0
  7. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/22epoch.pth +3 -0
  8. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/config.yaml +162 -0
  9. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/backward_time.png +0 -0
  10. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/forward_time.png +0 -0
  11. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/gpu_max_cached_mem_GB.png +0 -0
  12. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/iter_time.png +0 -0
  13. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/label_coverage.png +0 -0
  14. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/loss.png +0 -0
  15. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/masked_acc.png +0 -0
  16. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/masked_loss.png +0 -0
  17. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/optim0_lr0.png +0 -0
  18. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/optim_step_time.png +0 -0
  19. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/prediction_coverage.png +0 -0
  20. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/train_time.png +0 -0
  21. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/unmasked_acc.png +0 -0
  22. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/unmasked_loss.png +0 -0
  23. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/latest.pth +1 -0
  24. exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/valid.masked_acc.best.pth +1 -0
exp/bestrq_stats_raw_en/train/feats_lengths_stats.npz ADDED
Binary file (778 Bytes). View file
 
exp/bestrq_stats_raw_en/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/bestrq_stats_raw_en/valid/feats_lengths_stats.npz ADDED
Binary file (778 Bytes). View file
 
exp/bestrq_stats_raw_en/valid/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/20epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5514dbcdb61ad10d2a731fbe23ba46097fb2da054258ba044caac84300349ff
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/21epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90d63175c7266c595e8da32741cd67a4dc14b414afda707fd3ea9adf7b16e61b
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/22epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db284b5ccc8b6188474125cedf65848830c69e6e273180aae89e0a401525f675
3
+ size 477318768
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/config.yaml ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 4
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 54869
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: false
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 500
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - masked_acc
39
+ - max
40
+ keep_nbest_models: 300
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 8
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: true
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ use_wandb: false
54
+ wandb_project: null
55
+ wandb_id: null
56
+ wandb_entity: null
57
+ wandb_name: null
58
+ wandb_model_log_interval: -1
59
+ detect_anomaly: false
60
+ pretrain_path: null
61
+ init_param: []
62
+ ignore_init_mismatch: false
63
+ freeze_param: []
64
+ num_iters_per_epoch: null
65
+ batch_size: 256
66
+ valid_batch_size: null
67
+ batch_bins: 1000000
68
+ valid_batch_bins: null
69
+ train_shape_file:
70
+ - exp/bestrq_stats_raw_en/train/speech_shape
71
+ valid_shape_file:
72
+ - exp/bestrq_stats_raw_en/valid/speech_shape
73
+ batch_type: folded
74
+ valid_batch_type: null
75
+ fold_length:
76
+ - 80000
77
+ sort_in_batch: descending
78
+ sort_batch: descending
79
+ multiple_iterator: false
80
+ chunk_length: 500
81
+ chunk_shift_ratio: 0.5
82
+ num_cache_chunks: 1024
83
+ train_data_path_and_name_and_type:
84
+ - - dump/raw/train_6k/wav.scp
85
+ - speech
86
+ - sound
87
+ valid_data_path_and_name_and_type:
88
+ - - dump/raw/dev/wav.scp
89
+ - speech
90
+ - sound
91
+ allow_variable_data_keys: false
92
+ max_cache_size: 0.0
93
+ max_cache_fd: 32
94
+ valid_max_cache_size: null
95
+ optim: adam
96
+ optim_conf:
97
+ lr: 0.0005
98
+ scheduler: warmuplr
99
+ scheduler_conf:
100
+ warmup_steps: 30000
101
+ init: xavier_uniform
102
+ input_size: null
103
+ model_conf:
104
+ lsm_weight: 0.0
105
+ length_normalized_loss: false
106
+ vector_size: 16
107
+ codebook_size: 8192
108
+ temporal_reduction: 4
109
+ mask_prob: 0.01
110
+ mask_length: 40
111
+ unmasked_region_weight: 0
112
+ apply_l2_normalization: true
113
+ codebook_and_matrix_init_file: data/local/codebook_and_matrix_seed20220404.pth
114
+ frame_chunk_size: 3200
115
+ use_preprocessor: true
116
+ token_type: null
117
+ cleaner: null
118
+ speech_volume_normalize: null
119
+ rir_scp: null
120
+ rir_apply_prob: 1.0
121
+ noise_scp: null
122
+ noise_apply_prob: 1.0
123
+ noise_db_range: '13_15'
124
+ frontend: default
125
+ frontend_conf:
126
+ fs: 16k
127
+ n_fft: 512
128
+ win_length: 400
129
+ hop_length: 160
130
+ frontend_conf: null
131
+ apply_stft: true
132
+ specaug: null
133
+ specaug_conf: {}
134
+ normalize: global_mvn
135
+ normalize_conf:
136
+ stats_file: exp/bestrq_stats_raw_en/train/feats_stats.npz
137
+ preencoder: null
138
+ preencoder_conf: {}
139
+ encoder: conformer
140
+ encoder_conf:
141
+ output_size: 512
142
+ attention_heads: 8
143
+ linear_units: 2048
144
+ num_blocks: 17
145
+ dropout_rate: 0.1
146
+ positional_dropout_rate: 0.1
147
+ attention_dropout_rate: 0.1
148
+ input_layer: conv2d
149
+ normalize_before: true
150
+ macaron_style: true
151
+ rel_pos_type: latest
152
+ pos_enc_layer_type: rel_pos
153
+ selfattention_layer_type: rel_selfattn
154
+ activation_type: swish
155
+ use_cnn_module: true
156
+ cnn_module_kernel: 31
157
+ postencoder: null
158
+ postencoder_conf: {}
159
+ required:
160
+ - output_dir
161
+ version: 0.10.7a1
162
+ distributed: true
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/backward_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/forward_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/gpu_max_cached_mem_GB.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/iter_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/label_coverage.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/loss.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/masked_acc.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/masked_loss.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/optim0_lr0.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/optim_step_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/prediction_coverage.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/train_time.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/unmasked_acc.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/images/unmasked_loss.png ADDED
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/latest.pth ADDED
@@ -0,0 +1 @@
 
 
1
+ 22epoch.pth
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr5e-4_seed20220404_chunk3k_raw_en/valid.masked_acc.best.pth ADDED
@@ -0,0 +1 @@
 
 
1
+ 21epoch.pth