Mariam-Elz committed on
Commit
a5fbc19
·
verified ·
1 Parent(s): c25a471

Upload imagedream/configs/sd_v2_base_ipmv_chin8_zero_snr.yaml with huggingface_hub

Browse files
imagedream/configs/sd_v2_base_ipmv_chin8_zero_snr.yaml ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ target: imagedream.ldm.interface.LatentDiffusionInterface
3
+ params:
4
+ linear_start: 0.00085
5
+ linear_end: 0.0120
6
+ timesteps: 1000
7
+ scale_factor: 0.18215
8
+ parameterization: "eps"
9
+ zero_snr: true
10
+
11
+ unet_config:
12
+ target: imagedream.ldm.modules.diffusionmodules.openaimodel.MultiViewUNetModelStage2
13
+ params:
14
+ image_size: 32 # unused
15
+ in_channels: 8
16
+ out_channels: 4
17
+ model_channels: 320
18
+ attention_resolutions: [ 4, 2, 1 ]
19
+ num_res_blocks: 2
20
+ channel_mult: [ 1, 2, 4, 4 ]
21
+ num_head_channels: 64 # need to fix for flash-attn
22
+ use_spatial_transformer: True
23
+ use_linear_in_transformer: True
24
+ transformer_depth: 1
25
+ context_dim: 1024
26
+ use_checkpoint: False
27
+ legacy: False
28
+ camera_dim: 16
29
+ with_ip: True
30
+ ip_dim: 16 # ip token length
31
+ ip_mode: "local_resample"
32
+
33
+ vae_config:
34
+ target: imagedream.ldm.models.autoencoder.AutoencoderKL
35
+ params:
36
+ embed_dim: 4
37
+ monitor: val/rec_loss
38
+ ddconfig:
39
+ #attn_type: "vanilla-xformers"
40
+ double_z: true
41
+ z_channels: 4
42
+ resolution: 256
43
+ in_channels: 3
44
+ out_ch: 3
45
+ ch: 128
46
+ ch_mult:
47
+ - 1
48
+ - 2
49
+ - 4
50
+ - 4
51
+ num_res_blocks: 2
52
+ attn_resolutions: []
53
+ dropout: 0.0
54
+ lossconfig:
55
+ target: torch.nn.Identity
56
+
57
+ clip_config:
58
+ target: imagedream.ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
59
+ params:
60
+ freeze: True
61
+ layer: "penultimate"
62
+ ip_mode: "local_resample"