bubbliiiing committed on
Commit
f625293
·
1 Parent(s): 821abd1

Update config

Browse files
Files changed (2) hide show
  1. transformer/config.json +2 -0
  2. vae/config.json +40 -25
transformer/config.json CHANGED
@@ -8,9 +8,11 @@
8
  "clip_channels": null,
9
  "dropout": 0.0,
10
  "enable_clip_in_inpaint": false,
 
11
  "flip_sin_to_cos": true,
12
  "freq_shift": 0,
13
  "in_channels": 33,
 
14
  "norm_elementwise_affine": true,
15
  "norm_eps": 1e-05,
16
  "num_attention_heads": 48,
 
8
  "clip_channels": null,
9
  "dropout": 0.0,
10
  "enable_clip_in_inpaint": false,
11
+ "enable_text_attention_mask": false,
12
  "flip_sin_to_cos": true,
13
  "freq_shift": 0,
14
  "in_channels": 33,
15
+ "mmdit_layers": 48,
16
  "norm_elementwise_affine": true,
17
  "norm_eps": 1e-05,
18
  "num_attention_heads": 48,
vae/config.json CHANGED
@@ -1,43 +1,58 @@
1
  {
2
- "_class_name": "AutoencoderKL",
3
- "_diffusers_version": "0.31.0.dev0",
4
  "act_fn": "silu",
5
  "block_out_channels": [
6
- 128,
7
- 256,
8
- 512,
9
- 512
 
 
 
 
 
 
 
 
 
10
  ],
11
  "down_block_types": [
12
- "SpatialDownBlock3D",
13
- "SpatialTemporalDownBlock3D",
14
- "SpatialTemporalDownBlock3D",
15
- "SpatialTemporalDownBlock3D"
16
  ],
17
  "force_upcast": true,
18
  "in_channels": 3,
19
  "latent_channels": 16,
20
  "layers_per_block": 2,
 
 
 
 
 
 
21
  "norm_num_groups": 32,
 
22
  "out_channels": 3,
23
  "sample_size": 256,
24
  "scaling_factor": 0.7125,
25
- "slice_mag_vae": false,
26
  "slice_compression_vae": false,
27
- "cache_compression_vae": false,
28
- "cache_mag_vae": true,
29
- "use_tiling": false,
30
- "use_tiling_encoder": false,
31
- "use_tiling_decoder": false,
32
- "mini_batch_encoder": 4,
33
- "mini_batch_decoder": 1,
34
  "spatial_group_norm": true,
35
- "mid_block_attention_type": "spatial",
 
36
  "up_block_types": [
37
- "SpatialUpBlock3D",
38
- "SpatialTemporalUpBlock3D",
39
- "SpatialTemporalUpBlock3D",
40
- "SpatialTemporalUpBlock3D"
41
- ]
42
- }
 
 
 
 
 
43
 
 
1
  {
2
+ "_class_name": "AutoencoderKLMagvit",
3
+ "_diffusers_version": "0.30.1",
4
  "act_fn": "silu",
5
  "block_out_channels": [
6
+ 128,
7
+ 256,
8
+ 512,
9
+ 512
10
+ ],
11
+ "cache_compression_vae": false,
12
+ "cache_mag_vae": true,
13
+ "ch": 128,
14
+ "ch_mult": [
15
+ 1,
16
+ 2,
17
+ 4,
18
+ 4
19
  ],
20
  "down_block_types": [
21
+ "SpatialDownBlock3D",
22
+ "SpatialTemporalDownBlock3D",
23
+ "SpatialTemporalDownBlock3D",
24
+ "SpatialTemporalDownBlock3D"
25
  ],
26
  "force_upcast": true,
27
  "in_channels": 3,
28
  "latent_channels": 16,
29
  "layers_per_block": 2,
30
+ "mid_block_attention_type": "spatial",
31
+ "mid_block_num_attention_heads": 1,
32
+ "mid_block_type": "MidBlock3D",
33
+ "mid_block_use_attention": true,
34
+ "mini_batch_decoder": 1,
35
+ "mini_batch_encoder": 4,
36
  "norm_num_groups": 32,
37
+ "num_attention_heads": 1,
38
  "out_channels": 3,
39
  "sample_size": 256,
40
  "scaling_factor": 0.7125,
 
41
  "slice_compression_vae": false,
42
+ "slice_mag_vae": false,
 
 
 
 
 
 
43
  "spatial_group_norm": true,
44
+ "tile_overlap_factor": 0.25,
45
+ "tile_sample_min_size": 384,
46
  "up_block_types": [
47
+ "SpatialUpBlock3D",
48
+ "SpatialTemporalUpBlock3D",
49
+ "SpatialTemporalUpBlock3D",
50
+ "SpatialTemporalUpBlock3D"
51
+ ],
52
+ "upcast_vae": false,
53
+ "use_gc_blocks": null,
54
+ "use_tiling": false,
55
+ "use_tiling_decoder": false,
56
+ "use_tiling_encoder": false
57
+ }
58