dn6 HF staff committed on
Commit
c6453e5
1 Parent(s): e3aee2f

update diffusers weights

Browse files
decoder/config.json CHANGED
@@ -1,74 +1,83 @@
1
  {
2
- "_class_name": "StableCascadeUnet",
3
- "_diffusers_version": "0.26.0.dev0",
4
- "_name_or_path": "StableCascade/decoder",
5
- "block_repeat": [
 
 
 
 
 
6
  [
7
- 1,
8
- 1,
9
- 1,
10
- 1
11
  ],
12
  [
13
- 3,
14
- 3,
15
- 2,
16
- 2
17
- ]
18
- ],
19
- "blocks": [
20
  [
21
- 2,
22
- 6,
23
- 28,
24
- 6
25
  ],
26
  [
27
- 6,
28
- 28,
29
- 6,
30
- 2
31
  ]
32
  ],
33
- "c_clip_img": null,
34
- "c_clip_seq": 4,
35
- "c_clip_text": null,
36
- "c_clip_text_pooled": 1280,
37
- "c_cond": 1280,
38
- "c_effnet": 16,
39
- "c_hidden": [
40
- 320,
41
- 640,
42
- 1280,
43
- 1280
 
 
 
 
 
44
  ],
45
- "c_in": 4,
46
- "c_out": 4,
47
- "c_pixels": 3,
48
- "c_r": 64,
49
  "dropout": [
50
  0,
51
  0,
52
  0.1,
53
  0.1
54
  ],
 
 
55
  "kernel_size": 3,
56
- "level_config": [
57
- "CT",
58
- "CT",
59
- "CTA",
60
- "CTA"
61
- ],
62
- "nhead": [
63
- -1,
64
- -1,
65
  20,
66
  20
67
  ],
 
68
  "patch_size": 2,
 
69
  "self_attn": true,
70
  "switch_level": null,
71
- "t_conds": [
72
  "sca"
 
 
 
 
 
 
 
 
 
 
 
 
 
73
  ]
74
  }
 
1
  {
2
+ "_class_name": "StableCascadeUNet",
3
+ "_diffusers_version": "0.27.0.dev0",
4
+ "block_out_channels": [
5
+ 320,
6
+ 640,
7
+ 1280,
8
+ 1280
9
+ ],
10
+ "block_types_per_layer": [
11
  [
12
+ "SDCascadeResBlock",
13
+ "SDCascadeTimestepBlock"
 
 
14
  ],
15
  [
16
+ "SDCascadeResBlock",
17
+ "SDCascadeTimestepBlock"
18
+ ],
 
 
 
 
19
  [
20
+ "SDCascadeResBlock",
21
+ "SDCascadeTimestepBlock",
22
+ "SDCascadeAttnBlock"
 
23
  ],
24
  [
25
+ "SDCascadeResBlock",
26
+ "SDCascadeTimestepBlock",
27
+ "SDCascadeAttnBlock"
 
28
  ]
29
  ],
30
+ "clip_image_in_channels": null,
31
+ "clip_seq": 4,
32
+ "clip_text_in_channels": null,
33
+ "clip_text_pooled_in_channels": 1280,
34
+ "conditioning_dim": 1280,
35
+ "down_blocks_repeat_mappers": [
36
+ 1,
37
+ 1,
38
+ 1,
39
+ 1
40
+ ],
41
+ "down_num_layers_per_block": [
42
+ 2,
43
+ 6,
44
+ 28,
45
+ 6
46
  ],
 
 
 
 
47
  "dropout": [
48
  0,
49
  0,
50
  0.1,
51
  0.1
52
  ],
53
+ "effnet_in_channels": 16,
54
+ "in_channels": 4,
55
  "kernel_size": 3,
56
+ "num_attention_heads": [
57
+ 0,
58
+ 0,
 
 
 
 
 
 
59
  20,
60
  20
61
  ],
62
+ "out_channels": 4,
63
  "patch_size": 2,
64
+ "pixel_mapper_in_channels": 3,
65
  "self_attn": true,
66
  "switch_level": null,
67
+ "timestep_conditioning_type": [
68
  "sca"
69
+ ],
70
+ "timestep_ratio_embedding_dim": 64,
71
+ "up_blocks_repeat_mappers": [
72
+ 3,
73
+ 3,
74
+ 2,
75
+ 2
76
+ ],
77
+ "up_num_layers_per_block": [
78
+ 6,
79
+ 28,
80
+ 6,
81
+ 2
82
  ]
83
  }
decoder/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f9575dfa6c2535ad65733d6257d17a7b1e1b54b7eafb251ce9556595f3bc0c9
3
- size 3126071088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91e8b7d97350689a234bee74e53325e54191ac4146f599cff9551227566a46cb
3
+ size 6251952232
model_index.json CHANGED
@@ -1,10 +1,9 @@
1
  {
2
  "_class_name": "StableCascadeDecoderPipeline",
3
- "_diffusers_version": "0.26.0.dev0",
4
- "_name_or_path": "StableCascade/",
5
  "decoder": [
6
- "stable_cascade",
7
- "StableCascadeUnet"
8
  ],
9
  "latent_dim_scale": 10.67,
10
  "scheduler": [
 
1
  {
2
  "_class_name": "StableCascadeDecoderPipeline",
3
+ "_diffusers_version": "0.27.0.dev0",
 
4
  "decoder": [
5
+ "diffusers",
6
+ "StableCascadeUNet"
7
  ],
8
  "latent_dim_scale": 10.67,
9
  "scheduler": [
scheduler/scheduler_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "DDPMWuerstchenScheduler",
3
- "_diffusers_version": "0.26.0.dev0",
4
  "s": 0.008,
5
  "scaler": 1.0
6
  }
 
1
  {
2
  "_class_name": "DDPMWuerstchenScheduler",
3
+ "_diffusers_version": "0.27.0.dev0",
4
  "s": 0.008,
5
  "scaler": 1.0
6
  }
text_encoder/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "StableCascade/text_encoder",
3
  "architectures": [
4
  "CLIPTextModelWithProjection"
5
  ],
@@ -19,7 +19,7 @@
19
  "num_hidden_layers": 32,
20
  "pad_token_id": 1,
21
  "projection_dim": 1280,
22
- "torch_dtype": "bfloat16",
23
- "transformers_version": "4.38.0.dev0",
24
  "vocab_size": 49408
25
  }
 
1
  {
2
+ "_name_or_path": "laion/CLIP-ViT-bigG-14-laion2B-39B-b160k",
3
  "architectures": [
4
  "CLIPTextModelWithProjection"
5
  ],
 
19
  "num_hidden_layers": 32,
20
  "pad_token_id": 1,
21
  "projection_dim": 1280,
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.35.2",
24
  "vocab_size": 49408
25
  }
text_encoder/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:260e0127aca3c89db813637ae659ebb822cb07af71fedc16cbd980e9518dfdcd
3
- size 1389382688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa5b2e6f4c2efc2d82e4b8312faec1a5540eabfc6415126c9a05c8436a530ef4
3
+ size 2778702264
tokenizer/special_tokens_map.json CHANGED
@@ -9,21 +9,15 @@
9
  "eos_token": {
10
  "content": "<|endoftext|>",
11
  "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "<|endoftext|>",
18
- "lstrip": false,
19
- "normalized": false,
20
  "rstrip": false,
21
  "single_word": false
22
  },
 
23
  "unk_token": {
24
  "content": "<|endoftext|>",
25
  "lstrip": false,
26
- "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
29
  }
 
9
  "eos_token": {
10
  "content": "<|endoftext|>",
11
  "lstrip": false,
12
+ "normalized": true,
 
 
 
 
 
 
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": "<|endoftext|>",
17
  "unk_token": {
18
  "content": "<|endoftext|>",
19
  "lstrip": false,
20
+ "normalized": true,
21
  "rstrip": false,
22
  "single_word": false
23
  }
tokenizer/tokenizer.json CHANGED
@@ -1,14 +1,7 @@
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
- "padding": {
5
- "strategy": "BatchLongest",
6
- "direction": "Right",
7
- "pad_to_multiple_of": null,
8
- "pad_id": 49407,
9
- "pad_type_id": 0,
10
- "pad_token": "<|endoftext|>"
11
- },
12
  "added_tokens": [
13
  {
14
  "id": 49406,
@@ -25,7 +18,7 @@
25
  "single_word": false,
26
  "lstrip": false,
27
  "rstrip": false,
28
- "normalized": false,
29
  "special": true
30
  }
31
  ],
 
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 49406,
 
18
  "single_word": false,
19
  "lstrip": false,
20
  "rstrip": false,
21
+ "normalized": true,
22
  "special": true
23
  }
24
  ],
tokenizer/tokenizer_config.json CHANGED
@@ -12,7 +12,7 @@
12
  "49407": {
13
  "content": "<|endoftext|>",
14
  "lstrip": false,
15
- "normalized": false,
16
  "rstrip": false,
17
  "single_word": false,
18
  "special": true
 
12
  "49407": {
13
  "content": "<|endoftext|>",
14
  "lstrip": false,
15
+ "normalized": true,
16
  "rstrip": false,
17
  "single_word": false,
18
  "special": true
vqgan/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "PaellaVQModel",
3
- "_diffusers_version": "0.26.0.dev0",
4
- "_name_or_path": "StableCascade/vqgan",
5
  "bottleneck_blocks": 12,
6
  "embed_dim": 384,
7
  "in_channels": 3,
 
1
  {
2
  "_class_name": "PaellaVQModel",
3
+ "_diffusers_version": "0.27.0.dev0",
4
+ "_name_or_path": "warp-ai/wuerstchen",
5
  "bottleneck_blocks": 12,
6
  "embed_dim": 384,
7
  "in_channels": 3,
vqgan/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ac32fab5177329dac907b2480c8c00aeefc712dfd92c2d52263a9c64b426b26
3
- size 36825828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052db8852c0d8b117e6d2a59ae3e0c7d7aaae3d00f247e392ef8e9837e11d6c4
3
+ size 73639568