idle Stoev committed on
Commit
2febc40
1 Parent(s): e6e4a31

Config Variation3

Browse files
scheduler/scheduler_config.json CHANGED
@@ -9,8 +9,11 @@
9
  "dynamic_thresholding_ratio": 0.995,
10
  "num_train_timesteps": 1000,
11
  "prediction_type": "v_prediction",
 
 
12
  "set_alpha_to_one": false,
13
  "steps_offset": 1,
14
- "skip_prk_steps": true,
 
15
  "trained_betas": null
16
- }
 
9
  "dynamic_thresholding_ratio": 0.995,
10
  "num_train_timesteps": 1000,
11
  "prediction_type": "v_prediction",
12
+ "rescale_betas_zero_snr": false,
13
+ "sample_max_value": 1.0,
14
  "set_alpha_to_one": false,
15
  "steps_offset": 1,
16
+ "thresholding": false,
17
+ "timestep_spacing": "leading",
18
  "trained_betas": null
19
+ }
text_encoder/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
-
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
@@ -19,7 +19,7 @@
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
- "torch_dtype": "float32",
23
  "transformers_version": "4.31.0",
24
  "vocab_size": 49408
25
- }
 
1
  {
2
+ "_name_or_path": "hf-models/stable-diffusion-v2-768x768/text_encoder",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
 
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
+ "torch_dtype": "float16",
23
  "transformers_version": "4.31.0",
24
  "vocab_size": 49408
25
+ }
unet/config.json CHANGED
@@ -2,6 +2,9 @@
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.19.0.dev0",
4
  "act_fn": "silu",
 
 
 
5
  "attention_head_dim": [
6
  5,
7
  10,
@@ -15,7 +18,12 @@
15
  1280
16
  ],
17
  "center_input_sample": false,
 
 
 
 
18
  "cross_attention_dim": 1024,
 
19
  "down_block_types": [
20
  "CrossAttnDownBlock2D",
21
  "CrossAttnDownBlock2D",
@@ -24,24 +32,38 @@
24
  ],
25
  "downsample_padding": 1,
26
  "dual_cross_attention": false,
 
 
27
  "flip_sin_to_cos": true,
28
  "freq_shift": 0,
29
  "in_channels": 4,
30
  "layers_per_block": 2,
 
31
  "mid_block_scale_factor": 1,
 
32
  "norm_eps": 1e-05,
33
  "norm_num_groups": 32,
34
  "num_attention_heads": null,
35
  "num_class_embeds": null,
36
  "only_cross_attention": false,
37
  "out_channels": 4,
38
- "sample_size": 64,
 
 
 
 
 
 
 
 
 
 
39
  "up_block_types": [
40
  "UpBlock2D",
41
  "CrossAttnUpBlock2D",
42
  "CrossAttnUpBlock2D",
43
  "CrossAttnUpBlock2D"
44
  ],
45
- "upcast_attention": false,
46
  "use_linear_projection": true
47
  }
 
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.19.0.dev0",
4
  "act_fn": "silu",
5
+ "addition_embed_type": null,
6
+ "addition_embed_type_num_heads": 64,
7
+ "addition_time_embed_dim": null,
8
  "attention_head_dim": [
9
  5,
10
  10,
 
18
  1280
19
  ],
20
  "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
  "cross_attention_dim": 1024,
26
+ "cross_attention_norm": null,
27
  "down_block_types": [
28
  "CrossAttnDownBlock2D",
29
  "CrossAttnDownBlock2D",
 
32
  ],
33
  "downsample_padding": 1,
34
  "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
  "flip_sin_to_cos": true,
38
  "freq_shift": 0,
39
  "in_channels": 4,
40
  "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
  "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
  "norm_eps": 1e-05,
45
  "norm_num_groups": 32,
46
  "num_attention_heads": null,
47
  "num_class_embeds": null,
48
  "only_cross_attention": false,
49
  "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": null,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "sample_size": 96,
55
+ "time_cond_proj_dim": null,
56
+ "time_embedding_act_fn": null,
57
+ "time_embedding_dim": null,
58
+ "time_embedding_type": "positional",
59
+ "timestep_post_act": null,
60
+ "transformer_layers_per_block": 1,
61
  "up_block_types": [
62
  "UpBlock2D",
63
  "CrossAttnUpBlock2D",
64
  "CrossAttnUpBlock2D",
65
  "CrossAttnUpBlock2D"
66
  ],
67
+ "upcast_attention": null,
68
  "use_linear_projection": true
69
  }
vae/config.json CHANGED
@@ -14,12 +14,14 @@
14
  "DownEncoderBlock2D",
15
  "DownEncoderBlock2D"
16
  ],
 
17
  "in_channels": 3,
18
  "latent_channels": 4,
19
  "layers_per_block": 2,
20
  "norm_num_groups": 32,
21
  "out_channels": 3,
22
- "sample_size": 256,
 
23
  "up_block_types": [
24
  "UpDecoderBlock2D",
25
  "UpDecoderBlock2D",
 
14
  "DownEncoderBlock2D",
15
  "DownEncoderBlock2D"
16
  ],
17
+ "force_upcast": true,
18
  "in_channels": 3,
19
  "latent_channels": 4,
20
  "layers_per_block": 2,
21
  "norm_num_groups": 32,
22
  "out_channels": 3,
23
+ "sample_size": 768,
24
+ "scaling_factor": 0.18215,
25
  "up_block_types": [
26
  "UpDecoderBlock2D",
27
  "UpDecoderBlock2D",