patrickbdevaney committed on
Commit
e54b8f5
1 Parent(s): f9275f8

Upload 2 files

Browse files
Files changed (2) hide show
  1. config.yaml +96 -0
  2. model.safetensors +3 -0
config.yaml ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ cond_image_size: 512
2
+ isosurface_resolution: 160
3
+ radius: 0.87
4
+
5
+ camera_embedder_cls: sf3d.models.camera.LinearCameraEmbedder
6
+ camera_embedder:
7
+ in_channels: 25
8
+ out_channels: 768
9
+ conditions:
10
+ - c2w_cond
11
+ - intrinsic_normed_cond
12
+
13
+ image_tokenizer_cls: sf3d.models.tokenizers.image.DINOV2SingleImageTokenizer
14
+ image_tokenizer:
15
+ pretrained_model_name_or_path: "facebook/dinov2-large"
16
+ width: 512
17
+ height: 512
18
+ modulation_cond_dim: 768
19
+
20
+ tokenizer_cls: sf3d.models.tokenizers.triplane.TriplaneLearnablePositionalEmbedding
21
+ tokenizer:
22
+ plane_size: 96
23
+ num_channels: 1024
24
+
25
+ backbone_cls: sf3d.models.transformers.backbone.TwoStreamInterleaveTransformer
26
+ backbone:
27
+ num_attention_heads: 16
28
+ attention_head_dim: 64
29
+ raw_triplane_channels: 1024
30
+ triplane_channels: 1024
31
+ raw_image_channels: 1024 # DINO features
32
+ num_latents: 1792
33
+ num_blocks: 4
34
+ num_basic_blocks: 3
35
+
36
+ post_processor_cls: sf3d.models.network.PixelShuffleUpsampleNetwork
37
+ post_processor:
38
+ in_channels: 1024
39
+ out_channels: 40
40
+ scale_factor: 4
41
+ conv_layers: 4
42
+
43
+
44
+ decoder_cls: sf3d.models.network.MaterialMLP
45
+ decoder:
46
+ in_channels: 120
47
+ n_neurons: 64
48
+ activation: silu
49
+ heads:
50
+ - name: density
51
+ out_channels: 1
52
+ out_bias: -1.0
53
+ n_hidden_layers: 2
54
+ output_activation: trunc_exp
55
+ - name: features
56
+ out_channels: 3
57
+ n_hidden_layers: 3
58
+ output_activation: sigmoid
59
+ - name: perturb_normal
60
+ out_channels: 3
61
+ n_hidden_layers: 3
62
+ output_activation: normalize_channel_last
63
+ - name: vertex_offset
64
+ out_channels: 3
65
+ n_hidden_layers: 2
66
+
67
+ image_estimator_cls: sf3d.models.image_estimator.clip_based_estimator.ClipBasedHeadEstimator
68
+ image_estimator:
69
+ distribution: beta
70
+ distribution_eval: mode
71
+ heads:
72
+ - name: roughness
73
+ out_channels: 1
74
+ n_hidden_layers: 3
75
+ output_activation: linear
76
+ add_to_decoder_features: true
77
+ output_bias: 1.0
78
+ shape: [-1, 1, 1]
79
+ - name: metallic
80
+ out_channels: 1
81
+ n_hidden_layers: 3
82
+ output_activation: linear
83
+ add_to_decoder_features: true
84
+ output_bias: 1.0
85
+ shape: [-1, 1, 1]
86
+
87
+ global_estimator_cls: sf3d.models.global_estimator.multi_head_estimator.MultiHeadEstimator
88
+ global_estimator:
89
+ triplane_features: 1024
90
+ heads:
91
+ - name: sg_amplitudes
92
+ out_channels: 24
93
+ n_hidden_layers: 3
94
+ output_activation: softplus
95
+ output_bias: 1.0
96
+ shape: [-1, 24, 1]
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3416e1cf654e7d4f5e75f116cec2c3f0a14501a77d30c2f6068bbda178de388
3
+ size 4024289892