# VQGAN_CLIP / taming-transformers / configs / drin_transformer.yaml
# akhaliq3
# New message for the combined commit
# 833ef7e
# Model section: taming.models.cond_transformer.Net2NetTransformer with three
# nested sub-configs (transformer_config, first_stage_config,
# cond_stage_config). Each `target`/`params` pair presumably names a class and
# its constructor arguments — confirm against the code that loads this file.
model:
  base_learning_rate: 4.5e-06
  target: taming.models.cond_transformer.Net2NetTransformer
  params:
    # Name of the conditioning input. Presumably a field of each sample
    # produced by the datasets under `data` — verify against those classes.
    cond_stage_key: depth

    transformer_config:
      target: taming.modules.transformer.mingpt.GPT
      params:
        # Same value as `n_embed` (1024) in both stage configs below.
        # NOTE(review): presumably these must stay in sync — confirm.
        vocab_size: 1024
        block_size: 512
        n_layer: 24
        n_head: 16
        n_embd: 1024

    # First stage: a VQModel restored from `ckpt_path`, configured for
    # 3-channel input and output.
    first_stage_config:
      target: taming.models.vqgan.VQModel
      params:
        # Relative path; how it is resolved depends on the loader — TODO confirm.
        ckpt_path: logs/2020-09-23T17-56-33_imagenet_vqgan/checkpoints/last.ckpt
        embed_dim: 256
        n_embed: 1024
        ddconfig:
          double_z: false
          z_channels: 256
          resolution: 256
          in_channels: 3
          out_ch: 3
          ch: 128
          ch_mult:
            - 1
            - 1
            - 2
            - 2
            - 4
          num_res_blocks: 2
          attn_resolutions:
            - 16
          dropout: 0.0
        # NOTE(review): DummyLoss presumably disables the stage's own loss
        # because the stage is loaded from a checkpoint — confirm.
        lossconfig:
          target: taming.modules.losses.DummyLoss

    # Conditioning stage: identical settings to first_stage_config except for
    # `ckpt_path` and the single-channel input/output
    # (`in_channels: 1`, `out_ch: 1`).
    cond_stage_config:
      target: taming.models.vqgan.VQModel
      params:
        # Relative path; how it is resolved depends on the loader — TODO confirm.
        ckpt_path: logs/2020-11-03T15-34-24_imagenetdepth_vqgan/checkpoints/last.ckpt
        embed_dim: 256
        n_embed: 1024
        ddconfig:
          double_z: false
          z_channels: 256
          resolution: 256
          in_channels: 1
          out_ch: 1
          ch: 128
          ch_mult:
            - 1
            - 1
            - 2
            - 2
            - 4
          num_res_blocks: 2
          attn_resolutions:
            - 16
          dropout: 0.0
        lossconfig:
          target: taming.modules.losses.DummyLoss
# Data section: main.DataModuleFromConfig with one training and one validation
# dataset. Both use `size: 256`, the same value as `resolution: 256` in the
# model's ddconfig entries.
data:
  target: main.DataModuleFromConfig
  params:
    batch_size: 2
    num_workers: 8
    train:
      target: taming.data.imagenet.RINTrainWithDepth
      params:
        size: 256
    validation:
      target: taming.data.imagenet.RINValidationWithDepth
      params:
        size: 256