basso4 committed on
Commit
c38c888
‒
1 Parent(s): 8a9194a

Update configs/test_vitonhd.yaml

Browse files
Files changed (1) hide show
  1. configs/test_vitonhd.yaml +92 -89
configs/test_vitonhd.yaml CHANGED
@@ -1,90 +1,93 @@
1
- model:
2
- base_learning_rate: 3e-05
3
- target: ldm.models.diffusion.control.ControlLDM
4
- params:
5
- linear_start: 0.00085
6
- linear_end: 0.0120
7
- log_every_t: 200
8
- timesteps: 1000
9
- image_size: 64
10
- channels: 4
11
- u_cond_percent: 0.2
12
- scale_factor: 0.18215
13
- use_ema: False
14
-
15
- control_stage_config:
16
- target: ldm.models.diffusion.control.ControlNet
17
- params:
18
- use_checkpoint: True
19
- in_channels: 9
20
- hint_channels: 6
21
- model_channels: 320
22
- attention_resolutions: [ 4, 2, 1 ]
23
- num_res_blocks: 2
24
- channel_mult: [ 1, 2, 4, 4 ]
25
- num_head_channels: 64
26
- transformer_depth: 1
27
- context_dim: 768
28
-
29
- unet_config:
30
- target: ldm.models.diffusion.control.ControlledUnetModel
31
- params:
32
- image_size: 32 # unused
33
- in_channels: 9
34
- out_channels: 4
35
- model_channels: 320
36
- attention_resolutions: [ 4, 2, 1 ]
37
- num_res_blocks: 2
38
- channel_mult: [ 1, 2, 4, 4 ]
39
- num_heads: 8
40
- use_spatial_transformer: True
41
- transformer_depth: 1
42
- context_dim: 768
43
- use_checkpoint: True
44
- legacy: False
45
- add_conv_in_front_of_unet: False
46
-
47
- first_stage_config:
48
- target: ldm.models.autoencoder.AutoencoderKL
49
- params:
50
- embed_dim: 4
51
- monitor: val/rec_loss
52
- ddconfig:
53
- double_z: true
54
- z_channels: 4
55
- resolution: 256
56
- in_channels: 3
57
- out_ch: 3
58
- ch: 128
59
- ch_mult:
60
- - 1
61
- - 2
62
- - 4
63
- - 4
64
- num_res_blocks: 2
65
- attn_resolutions: []
66
- dropout: 0.0
67
- lossconfig:
68
- target: torch.nn.Identity
69
-
70
- cond_stage_config:
71
- target: ldm.modules.encoders.modules.FrozenCLIPImageEmbedder
72
-
73
- data:
74
- target: test.DataModuleFromConfig
75
- params:
76
- batch_size: 1
77
- wrap: False
78
- test:
79
- target: ldm.data.image_vitonhd.OpenImageDataset
80
- params:
81
- state: test
82
- dataset_dir: datasets/vitonhd
83
- type: unpaired
84
-
85
- lightning:
86
- trainer:
87
- num_nodes: 1
88
- profiler: "simple"
89
- accelerator: 'ddp'
 
 
 
90
  gpus: "0,1"
 
1
+ model:
2
+ base_learning_rate: 3e-05
3
+ target: ldm.models.diffusion.control.ControlLDM
4
+ params:
5
+ linear_start: 0.00085
6
+ linear_end: 0.0120
7
+ log_every_t: 200
8
+ timesteps: 1000
9
+ image_size: 64
10
+ channels: 4
11
+ u_cond_percent: 0.2
12
+ scale_factor: 0.18215
13
+ use_ema: False
14
+
15
+ control_stage_config:
16
+ target: ldm.models.diffusion.control.ControlNet
17
+ params:
18
+ use_checkpoint: True
19
+ in_channels: 9
20
+ hint_channels: 6
21
+ model_channels: 320
22
+ attention_resolutions: [ 4, 2, 1 ]
23
+ num_res_blocks: 2
24
+ channel_mult: [ 1, 2, 4, 4 ]
25
+ num_head_channels: 64
26
+ transformer_depth: 1
27
+ context_dim: 768
28
+
29
+ unet_config:
30
+ target: ldm.models.diffusion.control.ControlledUnetModel
31
+ params:
32
+ image_size: 32 # unused
33
+ in_channels: 9
34
+ out_channels: 4
35
+ model_channels: 320
36
+ attention_resolutions: [ 4, 2, 1 ]
37
+ num_res_blocks: 2
38
+ channel_mult: [ 1, 2, 4, 4 ]
39
+ num_heads: 8
40
+ use_spatial_transformer: True
41
+ transformer_depth: 1
42
+ context_dim: 768
43
+ use_checkpoint: True
44
+ legacy: False
45
+ add_conv_in_front_of_unet: False
46
+
47
+ first_stage_config:
48
+ target: ldm.models.autoencoder.AutoencoderKL
49
+ params:
50
+ embed_dim: 4
51
+ monitor: val/rec_loss
52
+ ddconfig:
53
+ double_z: true
54
+ z_channels: 4
55
+ resolution: 256
56
+ in_channels: 3
57
+ out_ch: 3
58
+ ch: 128
59
+ ch_mult:
60
+ - 1
61
+ - 2
62
+ - 4
63
+ - 4
64
+ num_res_blocks: 2
65
+ attn_resolutions: []
66
+ dropout: 0.0
67
+ lossconfig:
68
+ target: torch.nn.Identity
69
+
70
+ cond_stage_config:
71
+ target: ldm.modules.encoders.modules.FrozenCLIPImageEmbedder
72
+
73
+ condi_stage_config:
74
+ target: ldm.modules.encoders.modules.FrozenCLIPTextEmbedder
75
+
76
+ data:
77
+ target: test.DataModuleFromConfig
78
+ params:
79
+ batch_size: 1
80
+ wrap: False
81
+ test:
82
+ target: ldm.data.image_vitonhd.OpenImageDataset
83
+ params:
84
+ state: test
85
+ dataset_dir: D:\Capstone_Project\datasets\vitonhd
86
+ type: unpaired
87
+
88
+ lightning:
89
+ trainer:
90
+ num_nodes: 1
91
+ profiler: "simple"
92
+ accelerator: 'ddp'
93
  gpus: "0,1"