mlchen committed on
Commit
d02f4df
·
verified ·
1 Parent(s): ee6d50c

Upload 2 files

Browse files
nddiffusion/nd_mv_ema.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfaf4c662a542abdf662f7555e1210fc042cebcca50e3e97e44a60658e60731b
3
+ size 4272144515
nddiffusion/txtcond_mvsd-4-objaverse_finetune_wovae.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # normal depth model
2
+ # finetune from objaverse
3
+ model:
4
+ target: core.extern.ldm_nddiffusion.interface.LatentDiffusionInterface
5
+ params:
6
+ linear_start: 0.00085
7
+ linear_end: 0.0120
8
+ timesteps: 1000
9
+ scale_factor: 0.18215
10
+ parameterization: "eps"
11
+
12
+ unet_config:
13
+ target: core.extern.ldm_nddiffusion.modules.diffusionmodules.openaimodel_v2_1.MultiViewUNetModel
14
+ params:
15
+ use_fp16: False
16
+ image_size: 32 # unused
17
+ in_channels: 4
18
+ out_channels: 4
19
+ model_channels: 320
20
+ # use_checkpoint: True # leads to an error; must be turned off
21
+ use_checkpoint: False
22
+ attention_resolutions: [ 4, 2, 1 ]
23
+ num_res_blocks: 2
24
+ channel_mult: [ 1, 2, 4, 4 ]
25
+ num_heads: 8
26
+ use_spatial_transformer: True
27
+ transformer_depth: 1
28
+ context_dim: 768
29
+ legacy: False
30
+ camera_dim: 16
31
+
32
+ first_stage_config:
33
+ target: core.extern.ldm_nddiffusion.models.autoencoder.AutoencoderKL
34
+ params:
35
+ embed_dim: 4
36
+ monitor: val/rec_loss
37
+ ddconfig:
38
+ double_z: true
39
+ z_channels: 4
40
+ resolution: 256
41
+ in_channels: 4
42
+ out_ch: 4
43
+ ch: 128
44
+ ch_mult:
45
+ - 1
46
+ - 2
47
+ - 4
48
+ - 4
49
+ num_res_blocks: 2
50
+ attn_resolutions: []
51
+ dropout: 0.0
52
+ lossconfig:
53
+ target: torch.nn.Identity
54
+ cond_stage_config:
55
+ target: core.extern.ldm_nddiffusion.modules.encoders.modules.FrozenCLIPEmbedder
56
+ params:
57
+ version: 'F:/huggingface/openai/clip-vit-large-patch14'