youngsheen committed on
Commit
f9499bf
1 Parent(s): 528f777

upload ckpt

Browse files
vq_audio_log/simvq_262k/1second/config.yaml ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # lightning.pytorch==2.2.5
2
+ seed_everything: 0
3
+ trainer:
4
+ accelerator: gpu
5
+ strategy: ddp_find_unused_parameters_true
6
+ devices: 2
7
+ num_nodes: 1
8
+ precision: 16-mixed
9
+ logger:
10
+ class_path: lightning.pytorch.loggers.TensorBoardLogger
11
+ init_args:
12
+ save_dir: vq_audio_log/simvq_262k
13
+ name: null
14
+ version: 1second
15
+ log_graph: false
16
+ default_hp_metric: true
17
+ prefix: ''
18
+ sub_dir: null
19
+ comment: ''
20
+ purge_step: null
21
+ max_queue: 10
22
+ flush_secs: 120
23
+ filename_suffix: ''
24
+ callbacks:
25
+ - class_path: lightning.pytorch.callbacks.ModelCheckpoint
26
+ init_args:
27
+ dirpath: vq_audio_log/simvq_262k
28
+ filename: null
29
+ monitor: null
30
+ verbose: false
31
+ save_last: null
32
+ save_top_k: -1
33
+ save_weights_only: false
34
+ mode: min
35
+ auto_insert_metric_name: true
36
+ every_n_train_steps: null
37
+ train_time_interval: null
38
+ every_n_epochs: null
39
+ save_on_train_epoch_end: null
40
+ enable_version_counter: true
41
+ - class_path: lightning.pytorch.callbacks.LearningRateMonitor
42
+ init_args:
43
+ logging_interval: step
44
+ log_momentum: false
45
+ log_weight_decay: false
46
+ fast_dev_run: false
47
+ max_epochs: 50
48
+ min_epochs: null
49
+ max_steps: -1
50
+ min_steps: null
51
+ max_time: null
52
+ limit_train_batches: null
53
+ limit_val_batches: null
54
+ limit_test_batches: null
55
+ limit_predict_batches: null
56
+ overfit_batches: 0.0
57
+ val_check_interval: null
58
+ check_val_every_n_epoch: 1
59
+ num_sanity_val_steps: 0
60
+ log_every_n_steps: 100
61
+ enable_checkpointing: null
62
+ enable_progress_bar: null
63
+ enable_model_summary: null
64
+ accumulate_grad_batches: 1
65
+ gradient_clip_val: null
66
+ gradient_clip_algorithm: null
67
+ deterministic: null
68
+ benchmark: null
69
+ inference_mode: true
70
+ use_distributed_sampler: true
71
+ profiler: null
72
+ detect_anomaly: false
73
+ barebones: false
74
+ plugins: null
75
+ sync_batchnorm: false
76
+ reload_dataloaders_every_n_epochs: 0
77
+ default_root_dir: null
78
+ ckpt_path: null
79
+ model:
80
+ class_path: taming.models.vq_audio.VQModel
81
+ init_args:
82
+ ddconfig:
83
+ causal: true
84
+ dimension: 512
85
+ lossconfig:
86
+ target: taming.modules.losses.stft.VQSTFTWithDiscriminator
87
+ params:
88
+ disc_conditional: false
89
+ disc_in_channels: 1
90
+ disc_start: 0
91
+ codebook_enlarge_ratio: 0
92
+ codebook_enlarge_steps: 2000
93
+ sample_rate: 24000
94
+ commit_weight: 1000.0
95
+ gen_loss_weight: 1.0
96
+ mel_loss_coeff: 45.0
97
+ mrd_loss_coeff: 1.0
98
+ quantconfig:
99
+ target: taming.modules.vqvae.quantize.SimVQ1D
100
+ params:
101
+ n_e: 262144
102
+ e_dim: 512
103
+ beta: 0.25
104
+ legacy: false
105
+ sample_rate: 24000
106
+ target_bandwidths: null
107
+ audio_normalize: false
108
+ segment: None
109
+ ckpt_path: null
110
+ ignore_keys: []
111
+ colorize_nlabels: null
112
+ monitor: null
113
+ learning_rate: 0.0001
114
+ warmup_epochs: 1.0
115
+ scheduler_type: None
116
+ min_learning_rate: 0
117
+ use_ema: true
118
+ stage: null
119
+ data:
120
+ class_path: main.PadDataModuleFromConfig
121
+ init_args:
122
+ batch_size: 64
123
+ train:
124
+ target: taming.data.libritts.LibriTTSTrain
125
+ params:
126
+ config:
127
+ sample_rate: 24000
128
+ channels: 1
129
+ clip_seconds: 1
130
+ validation:
131
+ target: taming.data.libritts.LibriTTSDev
132
+ params:
133
+ config:
134
+ sample_rate: 24000
135
+ channels: 1
136
+ clip_seconds: 1
137
+ test:
138
+ target: taming.data.libritts.LibriTTSTest
139
+ params:
140
+ config:
141
+ sample_rate: 24000
142
+ channels: 1
143
+ clip_seconds: -1
144
+ wrap: false
145
+ num_workers: 8
vq_audio_log/simvq_262k/epoch=49-step=138600.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0626979f252eceb2f4e87264649a2aaf72ae5c9e300aec508695005b43f04617
3
+ size 1857494478
vq_log/simvq_262k/epoch=49-step=250250.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dff3d7d4b27b1a222fdb1b5453f336b681d0ab5c79d07245aa156a170ebb997
3
+ size 728546835
vq_log/simvq_262k/size128/config.yaml ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # lightning.pytorch==2.2.5
2
+ seed_everything: 0
3
+ trainer:
4
+ accelerator: gpu
5
+ strategy: ddp_find_unused_parameters_true
6
+ devices: 4
7
+ num_nodes: 1
8
+ precision: 16-mixed
9
+ logger:
10
+ class_path: lightning.pytorch.loggers.TensorBoardLogger
11
+ init_args:
12
+ save_dir: vq_log/simvq_262k
13
+ name: null
14
+ version: size128
15
+ log_graph: false
16
+ default_hp_metric: true
17
+ prefix: ''
18
+ sub_dir: null
19
+ comment: ''
20
+ purge_step: null
21
+ max_queue: 10
22
+ flush_secs: 120
23
+ filename_suffix: ''
24
+ callbacks:
25
+ - class_path: lightning.pytorch.callbacks.ModelCheckpoint
26
+ init_args:
27
+ dirpath: vq_log/simvq_262k
28
+ filename: null
29
+ monitor: null
30
+ verbose: false
31
+ save_last: null
32
+ save_top_k: -1
33
+ save_weights_only: false
34
+ mode: min
35
+ auto_insert_metric_name: true
36
+ every_n_train_steps: null
37
+ train_time_interval: null
38
+ every_n_epochs: null
39
+ save_on_train_epoch_end: null
40
+ enable_version_counter: true
41
+ - class_path: lightning.pytorch.callbacks.LearningRateMonitor
42
+ init_args:
43
+ logging_interval: step
44
+ log_momentum: false
45
+ log_weight_decay: false
46
+ fast_dev_run: false
47
+ max_epochs: 50
48
+ min_epochs: null
49
+ max_steps: -1
50
+ min_steps: null
51
+ max_time: null
52
+ limit_train_batches: null
53
+ limit_val_batches: null
54
+ limit_test_batches: null
55
+ limit_predict_batches: null
56
+ overfit_batches: 0.0
57
+ val_check_interval: null
58
+ check_val_every_n_epoch: 1
59
+ num_sanity_val_steps: 0
60
+ log_every_n_steps: 100
61
+ enable_checkpointing: null
62
+ enable_progress_bar: null
63
+ enable_model_summary: null
64
+ accumulate_grad_batches: 1
65
+ gradient_clip_val: null
66
+ gradient_clip_algorithm: null
67
+ deterministic: null
68
+ benchmark: null
69
+ inference_mode: true
70
+ use_distributed_sampler: true
71
+ profiler: null
72
+ detect_anomaly: false
73
+ barebones: false
74
+ plugins: null
75
+ sync_batchnorm: false
76
+ reload_dataloaders_every_n_epochs: 0
77
+ default_root_dir: null
78
+ ckpt_path: null
79
+ model:
80
+ class_path: taming.models.vq.VQModel
81
+ init_args:
82
+ ddconfig:
83
+ double_z: false
84
+ z_channels: 128
85
+ resolution: 128
86
+ in_channels: 3
87
+ out_ch: 3
88
+ ch: 128
89
+ ch_mult:
90
+ - 1
91
+ - 2
92
+ - 2
93
+ - 4
94
+ num_res_blocks: 2
95
+ lossconfig:
96
+ target: taming.modules.losses.vqperceptual.VQLPIPSWithDiscriminator
97
+ params:
98
+ disc_conditional: false
99
+ disc_in_channels: 3
100
+ disc_start: 0
101
+ disc_weight: 0.8
102
+ gen_loss_weight: 0.1
103
+ codebook_weight: 0.1
104
+ commit_weight: 1.0
105
+ codebook_enlarge_ratio: 0
106
+ codebook_enlarge_steps: 2000
107
+ quantconfig:
108
+ target: taming.modules.vqvae.quantize.SimVQ
109
+ params:
110
+ n_e: 262144
111
+ e_dim: 128
112
+ beta: 0.25
113
+ legacy: false
114
+ ckpt_path: null
115
+ ignore_keys: []
116
+ image_key: image
117
+ colorize_nlabels: null
118
+ monitor: null
119
+ learning_rate: 0.0001
120
+ warmup_epochs: 1.0
121
+ scheduler_type: None
122
+ min_learning_rate: 0
123
+ use_ema: true
124
+ stage: null
125
+ data:
126
+ class_path: main.DataModuleFromConfig
127
+ init_args:
128
+ batch_size: 64
129
+ train:
130
+ target: taming.data.imagenet.ImageNetTrain
131
+ params:
132
+ config:
133
+ size: 128
134
+ subset: null
135
+ validation:
136
+ target: taming.data.imagenet.ImageNetValidation
137
+ params:
138
+ config:
139
+ size: 128
140
+ subset: null
141
+ test:
142
+ target: taming.data.imagenet.ImageNetValidation
143
+ params:
144
+ config:
145
+ size: 128
146
+ subset: null
147
+ wrap: false
148
+ num_workers: 8