Redamancy2299 committed on
Commit
463b3d1
1 Parent(s): de35056

End of training

Browse files
README.md CHANGED
@@ -1,7 +1,7 @@
1
 
2
  ---
3
  license: creativeml-openrail-m
4
- base_model: stabilityai/stable-diffusion-2-1
5
  instance_prompt: A photo of a young people sleeping in front of a computer
6
  tags:
7
  - stable-diffusion
@@ -14,7 +14,7 @@ inference: true
14
 
15
  # DreamBooth - Redamancy2299/dreambooth3
16
 
17
- This is a dreambooth model derived from stabilityai/stable-diffusion-2-1. The weights were trained on A photo of a young people sleeping in front of a computer using [DreamBooth](https://dreambooth.github.io/).
18
  You can find some example images in the following.
19
 
20
 
 
1
 
2
  ---
3
  license: creativeml-openrail-m
4
+ base_model: runwayml/stable-diffusion-v1-5
5
  instance_prompt: A photo of a young people sleeping in front of a computer
6
  tags:
7
  - stable-diffusion
 
14
 
15
  # DreamBooth - Redamancy2299/dreambooth3
16
 
17
+ This is a dreambooth model derived from runwayml/stable-diffusion-v1-5. The weights were trained on A photo of a young people sleeping in front of a computer using [DreamBooth](https://dreambooth.github.io/).
18
  You can find some example images in the following.
19
 
20
 
checkpoint-1000/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:002c3be28b266a209dd625d666a9528aecf9ecc001db16db9159214bbcfda262
3
- size 2415
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:467d70c372986fdb0f281af6b509dd0f673c561deb93f131c5ffd6ef017c02ea
3
+ size 6876576717
checkpoint-1000/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e92869e782c712cbb71e67c788edb27a0ff14cd8ef8f839bf4ba78b00510609b
3
- size 21643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b09391c45649863318512756079e9064acdb106650db0e85db0de5f65d3bcd5a
3
+ size 21579
checkpoint-1000/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5df0168a751b1257361283b5aa0c288d7c712011edfd861c618859611a2278ec
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f810fc7b695697c440d8985f6042b4ba23a9e1027604c265718b518ca29f1b2b
3
  size 559
checkpoint-1000/scheduler.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2feff11e6c29b4fe174532267a1630de084a913d877000d37d8703b6bc266c91
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b4458f3e731799ca4080dc0c7a998ebe457637ef809e2a7d885d4c4b35a4b6b
3
  size 559
checkpoint-1000/unet/config.json CHANGED
@@ -1,16 +1,11 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.0.dev0",
4
- "_name_or_path": "stabilityai/stable-diffusion-2-1",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
- "attention_head_dim": [
9
- 5,
10
- 10,
11
- 20,
12
- 20
13
- ],
14
  "block_out_channels": [
15
  320,
16
  640,
@@ -22,7 +17,7 @@
22
  "class_embeddings_concat": false,
23
  "conv_in_kernel": 3,
24
  "conv_out_kernel": 3,
25
- "cross_attention_dim": 1024,
26
  "cross_attention_norm": null,
27
  "down_block_types": [
28
  "CrossAttnDownBlock2D",
@@ -50,7 +45,7 @@
50
  "resnet_out_scale_factor": 1.0,
51
  "resnet_skip_time_act": false,
52
  "resnet_time_scale_shift": "default",
53
- "sample_size": 96,
54
  "time_cond_proj_dim": null,
55
  "time_embedding_act_fn": null,
56
  "time_embedding_dim": null,
@@ -62,6 +57,6 @@
62
  "CrossAttnUpBlock2D",
63
  "CrossAttnUpBlock2D"
64
  ],
65
- "upcast_attention": true,
66
- "use_linear_projection": true
67
  }
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.0.dev0",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
+ "attention_head_dim": 8,
 
 
 
 
 
9
  "block_out_channels": [
10
  320,
11
  640,
 
17
  "class_embeddings_concat": false,
18
  "conv_in_kernel": 3,
19
  "conv_out_kernel": 3,
20
+ "cross_attention_dim": 768,
21
  "cross_attention_norm": null,
22
  "down_block_types": [
23
  "CrossAttnDownBlock2D",
 
45
  "resnet_out_scale_factor": 1.0,
46
  "resnet_skip_time_act": false,
47
  "resnet_time_scale_shift": "default",
48
+ "sample_size": 64,
49
  "time_cond_proj_dim": null,
50
  "time_embedding_act_fn": null,
51
  "time_embedding_dim": null,
 
57
  "CrossAttnUpBlock2D",
58
  "CrossAttnUpBlock2D"
59
  ],
60
+ "upcast_attention": false,
61
+ "use_linear_projection": false
62
  }
checkpoint-1000/unet/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d084337c1357e767608807670329217d8428d9124efab1918d4ddccfb164569
3
- size 3463923045
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff1c1c724c6f73368145be3a8eedef640ae8e5af79584267db611ec66a9bf973
3
+ size 3438364325
checkpoint-500/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:002c3be28b266a209dd625d666a9528aecf9ecc001db16db9159214bbcfda262
3
- size 2415
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74dd9e2a6bd6b7109cd26b5fce21e1b3d760953d517b69322a21ce4a520e23df
3
+ size 6876576717
checkpoint-500/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bf686bd09360de7abfbe45f4951106016a688dd79434d5e1c3126fb3bcb46f9
3
- size 21643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d55a4a192962d4fd34ba2c53ae6cf68a99bce6cdf0bbd56db810b762434da2e0
3
+ size 21579
checkpoint-500/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5df0168a751b1257361283b5aa0c288d7c712011edfd861c618859611a2278ec
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fa4c7be44c959599b8b43bb9bc3371e9e4e5bbc5758b3ab5afcccfda3e72e67
3
  size 559
checkpoint-500/scheduler.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15a30dc11a3915848233b4ac47aad41354fafd77728ae6dda8b77276573819da
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1b68fa02ba9e4f1df8cd74f282e78b2376e92078578c752eb37e7ed170bc5b0
3
  size 559
checkpoint-500/unet/config.json CHANGED
@@ -1,16 +1,11 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.0.dev0",
4
- "_name_or_path": "stabilityai/stable-diffusion-2-1",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
- "attention_head_dim": [
9
- 5,
10
- 10,
11
- 20,
12
- 20
13
- ],
14
  "block_out_channels": [
15
  320,
16
  640,
@@ -22,7 +17,7 @@
22
  "class_embeddings_concat": false,
23
  "conv_in_kernel": 3,
24
  "conv_out_kernel": 3,
25
- "cross_attention_dim": 1024,
26
  "cross_attention_norm": null,
27
  "down_block_types": [
28
  "CrossAttnDownBlock2D",
@@ -50,7 +45,7 @@
50
  "resnet_out_scale_factor": 1.0,
51
  "resnet_skip_time_act": false,
52
  "resnet_time_scale_shift": "default",
53
- "sample_size": 96,
54
  "time_cond_proj_dim": null,
55
  "time_embedding_act_fn": null,
56
  "time_embedding_dim": null,
@@ -62,6 +57,6 @@
62
  "CrossAttnUpBlock2D",
63
  "CrossAttnUpBlock2D"
64
  ],
65
- "upcast_attention": true,
66
- "use_linear_projection": true
67
  }
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.0.dev0",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
+ "attention_head_dim": 8,
 
 
 
 
 
9
  "block_out_channels": [
10
  320,
11
  640,
 
17
  "class_embeddings_concat": false,
18
  "conv_in_kernel": 3,
19
  "conv_out_kernel": 3,
20
+ "cross_attention_dim": 768,
21
  "cross_attention_norm": null,
22
  "down_block_types": [
23
  "CrossAttnDownBlock2D",
 
45
  "resnet_out_scale_factor": 1.0,
46
  "resnet_skip_time_act": false,
47
  "resnet_time_scale_shift": "default",
48
+ "sample_size": 64,
49
  "time_cond_proj_dim": null,
50
  "time_embedding_act_fn": null,
51
  "time_embedding_dim": null,
 
57
  "CrossAttnUpBlock2D",
58
  "CrossAttnUpBlock2D"
59
  ],
60
+ "upcast_attention": false,
61
+ "use_linear_projection": false
62
  }
checkpoint-500/unet/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d084337c1357e767608807670329217d8428d9124efab1918d4ddccfb164569
3
- size 3463923045
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e919a5097988aef2b20f32bbda8ca55dffc78804ae1b5dfe68dd590b69970f6e
3
+ size 3438364325
logs/dreambooth/1688740699.9952476/events.out.tfevents.1688740699.szth-acg-bcc04f1143.szth.baidu.com.36729.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56192fa15ef9c966f07671b5160b889a3a4daab96db084e5eacbd54d1f6e9a1e
3
+ size 2719
logs/dreambooth/1688740699.9970224/hparams.yml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ class_data_dir: null
10
+ class_labels_conditioning: null
11
+ class_prompt: null
12
+ dataloader_num_workers: 0
13
+ enable_xformers_memory_efficient_attention: false
14
+ gradient_accumulation_steps: 1
15
+ gradient_checkpointing: false
16
+ hub_model_id: null
17
+ hub_token: null
18
+ instance_data_dir: ./sleep2
19
+ instance_prompt: A photo of a young people sleeping in front of a computer
20
+ learning_rate: 1.0e-06
21
+ local_rank: 0
22
+ logging_dir: logs
23
+ lr_num_cycles: 1
24
+ lr_power: 1.0
25
+ lr_scheduler: constant
26
+ lr_warmup_steps: 0
27
+ max_grad_norm: 1.0
28
+ max_train_steps: 1200
29
+ mixed_precision: null
30
+ num_class_images: 100
31
+ num_train_epochs: 1200
32
+ num_validation_images: 4
33
+ offset_noise: false
34
+ output_dir: sd_output/dreambooth3
35
+ pre_compute_text_embeddings: false
36
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
37
+ prior_generation_precision: null
38
+ prior_loss_weight: 1.0
39
+ push_to_hub: true
40
+ report_to: tensorboard
41
+ resolution: 512
42
+ resume_from_checkpoint: null
43
+ revision: null
44
+ sample_batch_size: 4
45
+ scale_lr: false
46
+ seed: null
47
+ set_grads_to_none: false
48
+ skip_save_text_encoder: false
49
+ text_encoder_use_attention_mask: false
50
+ tokenizer_max_length: null
51
+ tokenizer_name: null
52
+ train_batch_size: 1
53
+ train_text_encoder: false
54
+ use_8bit_adam: false
55
+ validation_images: null
56
+ validation_prompt: null
57
+ validation_steps: 100
58
+ with_prior_preservation: false
logs/dreambooth/events.out.tfevents.1688740699.szth-acg-bcc04f1143.szth.baidu.com.36729.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3656699a6b7050548c114cf642d1167cae214be73732ee9de8a015e1fa5b8b25
3
+ size 100634
model_index.json CHANGED
@@ -5,14 +5,14 @@
5
  "transformers",
6
  "CLIPImageProcessor"
7
  ],
8
- "requires_safety_checker": false,
9
  "safety_checker": [
10
- null,
11
- null
12
  ],
13
  "scheduler": [
14
  "diffusers",
15
- "DDIMScheduler"
16
  ],
17
  "text_encoder": [
18
  "transformers",
 
5
  "transformers",
6
  "CLIPImageProcessor"
7
  ],
8
+ "requires_safety_checker": true,
9
  "safety_checker": [
10
+ "stable_diffusion",
11
+ "StableDiffusionSafetyChecker"
12
  ],
13
  "scheduler": [
14
  "diffusers",
15
+ "PNDMScheduler"
16
  ],
17
  "text_encoder": [
18
  "transformers",
safety_checker/config.json ADDED
@@ -0,0 +1,181 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_commit_hash": "c9ab35ff5f2c362e9e22fbafe278077e196057f0",
3
+ "_name_or_path": "/home/fuhongtao/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/c9ab35ff5f2c362e9e22fbafe278077e196057f0/safety_checker",
4
+ "architectures": [
5
+ "StableDiffusionSafetyChecker"
6
+ ],
7
+ "initializer_factor": 1.0,
8
+ "logit_scale_init_value": 2.6592,
9
+ "model_type": "clip",
10
+ "projection_dim": 768,
11
+ "text_config": {
12
+ "_name_or_path": "",
13
+ "add_cross_attention": false,
14
+ "architectures": null,
15
+ "attention_dropout": 0.0,
16
+ "bad_words_ids": null,
17
+ "begin_suppress_tokens": null,
18
+ "bos_token_id": 0,
19
+ "chunk_size_feed_forward": 0,
20
+ "cross_attention_hidden_size": null,
21
+ "decoder_start_token_id": null,
22
+ "diversity_penalty": 0.0,
23
+ "do_sample": false,
24
+ "dropout": 0.0,
25
+ "early_stopping": false,
26
+ "encoder_no_repeat_ngram_size": 0,
27
+ "eos_token_id": 2,
28
+ "exponential_decay_length_penalty": null,
29
+ "finetuning_task": null,
30
+ "forced_bos_token_id": null,
31
+ "forced_eos_token_id": null,
32
+ "hidden_act": "quick_gelu",
33
+ "hidden_size": 768,
34
+ "id2label": {
35
+ "0": "LABEL_0",
36
+ "1": "LABEL_1"
37
+ },
38
+ "initializer_factor": 1.0,
39
+ "initializer_range": 0.02,
40
+ "intermediate_size": 3072,
41
+ "is_decoder": false,
42
+ "is_encoder_decoder": false,
43
+ "label2id": {
44
+ "LABEL_0": 0,
45
+ "LABEL_1": 1
46
+ },
47
+ "layer_norm_eps": 1e-05,
48
+ "length_penalty": 1.0,
49
+ "max_length": 20,
50
+ "max_position_embeddings": 77,
51
+ "min_length": 0,
52
+ "model_type": "clip_text_model",
53
+ "no_repeat_ngram_size": 0,
54
+ "num_attention_heads": 12,
55
+ "num_beam_groups": 1,
56
+ "num_beams": 1,
57
+ "num_hidden_layers": 12,
58
+ "num_return_sequences": 1,
59
+ "output_attentions": false,
60
+ "output_hidden_states": false,
61
+ "output_scores": false,
62
+ "pad_token_id": 1,
63
+ "prefix": null,
64
+ "problem_type": null,
65
+ "projection_dim": 512,
66
+ "pruned_heads": {},
67
+ "remove_invalid_values": false,
68
+ "repetition_penalty": 1.0,
69
+ "return_dict": true,
70
+ "return_dict_in_generate": false,
71
+ "sep_token_id": null,
72
+ "suppress_tokens": null,
73
+ "task_specific_params": null,
74
+ "temperature": 1.0,
75
+ "tf_legacy_loss": false,
76
+ "tie_encoder_decoder": false,
77
+ "tie_word_embeddings": true,
78
+ "tokenizer_class": null,
79
+ "top_k": 50,
80
+ "top_p": 1.0,
81
+ "torch_dtype": null,
82
+ "torchscript": false,
83
+ "transformers_version": "4.26.0",
84
+ "typical_p": 1.0,
85
+ "use_bfloat16": false,
86
+ "vocab_size": 49408
87
+ },
88
+ "text_config_dict": {
89
+ "hidden_size": 768,
90
+ "intermediate_size": 3072,
91
+ "num_attention_heads": 12,
92
+ "num_hidden_layers": 12
93
+ },
94
+ "torch_dtype": "float32",
95
+ "transformers_version": null,
96
+ "vision_config": {
97
+ "_name_or_path": "",
98
+ "add_cross_attention": false,
99
+ "architectures": null,
100
+ "attention_dropout": 0.0,
101
+ "bad_words_ids": null,
102
+ "begin_suppress_tokens": null,
103
+ "bos_token_id": null,
104
+ "chunk_size_feed_forward": 0,
105
+ "cross_attention_hidden_size": null,
106
+ "decoder_start_token_id": null,
107
+ "diversity_penalty": 0.0,
108
+ "do_sample": false,
109
+ "dropout": 0.0,
110
+ "early_stopping": false,
111
+ "encoder_no_repeat_ngram_size": 0,
112
+ "eos_token_id": null,
113
+ "exponential_decay_length_penalty": null,
114
+ "finetuning_task": null,
115
+ "forced_bos_token_id": null,
116
+ "forced_eos_token_id": null,
117
+ "hidden_act": "quick_gelu",
118
+ "hidden_size": 1024,
119
+ "id2label": {
120
+ "0": "LABEL_0",
121
+ "1": "LABEL_1"
122
+ },
123
+ "image_size": 224,
124
+ "initializer_factor": 1.0,
125
+ "initializer_range": 0.02,
126
+ "intermediate_size": 4096,
127
+ "is_decoder": false,
128
+ "is_encoder_decoder": false,
129
+ "label2id": {
130
+ "LABEL_0": 0,
131
+ "LABEL_1": 1
132
+ },
133
+ "layer_norm_eps": 1e-05,
134
+ "length_penalty": 1.0,
135
+ "max_length": 20,
136
+ "min_length": 0,
137
+ "model_type": "clip_vision_model",
138
+ "no_repeat_ngram_size": 0,
139
+ "num_attention_heads": 16,
140
+ "num_beam_groups": 1,
141
+ "num_beams": 1,
142
+ "num_channels": 3,
143
+ "num_hidden_layers": 24,
144
+ "num_return_sequences": 1,
145
+ "output_attentions": false,
146
+ "output_hidden_states": false,
147
+ "output_scores": false,
148
+ "pad_token_id": null,
149
+ "patch_size": 14,
150
+ "prefix": null,
151
+ "problem_type": null,
152
+ "projection_dim": 512,
153
+ "pruned_heads": {},
154
+ "remove_invalid_values": false,
155
+ "repetition_penalty": 1.0,
156
+ "return_dict": true,
157
+ "return_dict_in_generate": false,
158
+ "sep_token_id": null,
159
+ "suppress_tokens": null,
160
+ "task_specific_params": null,
161
+ "temperature": 1.0,
162
+ "tf_legacy_loss": false,
163
+ "tie_encoder_decoder": false,
164
+ "tie_word_embeddings": true,
165
+ "tokenizer_class": null,
166
+ "top_k": 50,
167
+ "top_p": 1.0,
168
+ "torch_dtype": null,
169
+ "torchscript": false,
170
+ "transformers_version": "4.26.0",
171
+ "typical_p": 1.0,
172
+ "use_bfloat16": false
173
+ },
174
+ "vision_config_dict": {
175
+ "hidden_size": 1024,
176
+ "intermediate_size": 4096,
177
+ "num_attention_heads": 16,
178
+ "num_hidden_layers": 24,
179
+ "patch_size": 14
180
+ }
181
+ }
safety_checker/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:193490b58ef62739077262e833bf091c66c29488058681ac25cf7df3d8190974
3
+ size 1216061799
scheduler/scheduler_config.json CHANGED
@@ -1,20 +1,14 @@
1
  {
2
- "_class_name": "DDIMScheduler",
3
  "_diffusers_version": "0.18.0.dev0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
6
  "beta_start": 0.00085,
7
  "clip_sample": false,
8
- "clip_sample_range": 1.0,
9
- "dynamic_thresholding_ratio": 0.995,
10
  "num_train_timesteps": 1000,
11
- "prediction_type": "v_prediction",
12
- "rescale_betas_zero_snr": false,
13
- "sample_max_value": 1.0,
14
  "set_alpha_to_one": false,
15
  "skip_prk_steps": true,
16
  "steps_offset": 1,
17
- "thresholding": false,
18
- "timestep_spacing": "leading",
19
  "trained_betas": null
20
  }
 
1
  {
2
+ "_class_name": "PNDMScheduler",
3
  "_diffusers_version": "0.18.0.dev0",
4
  "beta_end": 0.012,
5
  "beta_schedule": "scaled_linear",
6
  "beta_start": 0.00085,
7
  "clip_sample": false,
 
 
8
  "num_train_timesteps": 1000,
9
+ "prediction_type": "epsilon",
 
 
10
  "set_alpha_to_one": false,
11
  "skip_prk_steps": true,
12
  "steps_offset": 1,
 
 
13
  "trained_betas": null
14
  }
text_encoder/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "stabilityai/stable-diffusion-2-1",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
@@ -7,18 +7,18 @@
7
  "bos_token_id": 0,
8
  "dropout": 0.0,
9
  "eos_token_id": 2,
10
- "hidden_act": "gelu",
11
- "hidden_size": 1024,
12
  "initializer_factor": 1.0,
13
  "initializer_range": 0.02,
14
- "intermediate_size": 4096,
15
  "layer_norm_eps": 1e-05,
16
  "max_position_embeddings": 77,
17
  "model_type": "clip_text_model",
18
- "num_attention_heads": 16,
19
- "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
- "projection_dim": 512,
22
  "torch_dtype": "float16",
23
  "transformers_version": "4.26.0",
24
  "vocab_size": 49408
 
1
  {
2
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
3
  "architectures": [
4
  "CLIPTextModel"
5
  ],
 
7
  "bos_token_id": 0,
8
  "dropout": 0.0,
9
  "eos_token_id": 2,
10
+ "hidden_act": "quick_gelu",
11
+ "hidden_size": 768,
12
  "initializer_factor": 1.0,
13
  "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
  "layer_norm_eps": 1e-05,
16
  "max_position_embeddings": 77,
17
  "model_type": "clip_text_model",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 12,
20
  "pad_token_id": 1,
21
+ "projection_dim": 768,
22
  "torch_dtype": "float16",
23
  "transformers_version": "4.26.0",
24
  "vocab_size": 49408
text_encoder/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f988248177fc727cf066267b3ccb62e7a74b7e3c5b3efa8a701d563e0f0ea037
3
- size 680901463
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a4311d3fc7b70396637a703ba65b7db30041ba536f569ae8f548312641a0fd6
3
+ size 246187063
tokenizer/special_tokens_map.json CHANGED
@@ -13,7 +13,7 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": "!",
17
  "unk_token": {
18
  "content": "<|endoftext|>",
19
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": "<|endoftext|>",
17
  "unk_token": {
18
  "content": "<|endoftext|>",
19
  "lstrip": false,
tokenizer/tokenizer_config.json CHANGED
@@ -19,7 +19,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 77,
22
- "name_or_path": "/home/fuhongtao/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/5cae40e6a2745ae2b01ad92ae5043f95f23644d6/tokenizer",
23
  "pad_token": "<|endoftext|>",
24
  "special_tokens_map_file": "./special_tokens_map.json",
25
  "tokenizer_class": "CLIPTokenizer",
 
19
  },
20
  "errors": "replace",
21
  "model_max_length": 77,
22
+ "name_or_path": "/home/fuhongtao/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/c9ab35ff5f2c362e9e22fbafe278077e196057f0/tokenizer",
23
  "pad_token": "<|endoftext|>",
24
  "special_tokens_map_file": "./special_tokens_map.json",
25
  "tokenizer_class": "CLIPTokenizer",
unet/config.json CHANGED
@@ -1,16 +1,11 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.0.dev0",
4
- "_name_or_path": "stabilityai/stable-diffusion-2-1",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
- "attention_head_dim": [
9
- 5,
10
- 10,
11
- 20,
12
- 20
13
- ],
14
  "block_out_channels": [
15
  320,
16
  640,
@@ -22,7 +17,7 @@
22
  "class_embeddings_concat": false,
23
  "conv_in_kernel": 3,
24
  "conv_out_kernel": 3,
25
- "cross_attention_dim": 1024,
26
  "cross_attention_norm": null,
27
  "down_block_types": [
28
  "CrossAttnDownBlock2D",
@@ -50,7 +45,7 @@
50
  "resnet_out_scale_factor": 1.0,
51
  "resnet_skip_time_act": false,
52
  "resnet_time_scale_shift": "default",
53
- "sample_size": 96,
54
  "time_cond_proj_dim": null,
55
  "time_embedding_act_fn": null,
56
  "time_embedding_dim": null,
@@ -62,6 +57,6 @@
62
  "CrossAttnUpBlock2D",
63
  "CrossAttnUpBlock2D"
64
  ],
65
- "upcast_attention": true,
66
- "use_linear_projection": true
67
  }
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.18.0.dev0",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
  "act_fn": "silu",
6
  "addition_embed_type": null,
7
  "addition_embed_type_num_heads": 64,
8
+ "attention_head_dim": 8,
 
 
 
 
 
9
  "block_out_channels": [
10
  320,
11
  640,
 
17
  "class_embeddings_concat": false,
18
  "conv_in_kernel": 3,
19
  "conv_out_kernel": 3,
20
+ "cross_attention_dim": 768,
21
  "cross_attention_norm": null,
22
  "down_block_types": [
23
  "CrossAttnDownBlock2D",
 
45
  "resnet_out_scale_factor": 1.0,
46
  "resnet_skip_time_act": false,
47
  "resnet_time_scale_shift": "default",
48
+ "sample_size": 64,
49
  "time_cond_proj_dim": null,
50
  "time_embedding_act_fn": null,
51
  "time_embedding_dim": null,
 
57
  "CrossAttnUpBlock2D",
58
  "CrossAttnUpBlock2D"
59
  ],
60
+ "upcast_attention": false,
61
+ "use_linear_projection": false
62
  }
unet/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d084337c1357e767608807670329217d8428d9124efab1918d4ddccfb164569
3
- size 3463923045
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:613f375f225cc505f63ded1498d15a67b333b831f2fe695d8bf3ba22958b924d
3
+ size 3438364325
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.18.0.dev0",
4
- "_name_or_path": "/home/fuhongtao/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/5cae40e6a2745ae2b01ad92ae5043f95f23644d6/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
@@ -20,7 +20,7 @@
20
  "layers_per_block": 2,
21
  "norm_num_groups": 32,
22
  "out_channels": 3,
23
- "sample_size": 768,
24
  "scaling_factor": 0.18215,
25
  "up_block_types": [
26
  "UpDecoderBlock2D",
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.18.0.dev0",
4
+ "_name_or_path": "/home/fuhongtao/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/c9ab35ff5f2c362e9e22fbafe278077e196057f0/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
20
  "layers_per_block": 2,
21
  "norm_num_groups": 32,
22
  "out_channels": 3,
23
+ "sample_size": 512,
24
  "scaling_factor": 0.18215,
25
  "up_block_types": [
26
  "UpDecoderBlock2D",
vae/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b7010872555f03f3c7c94b3e510546755d6df0be9f06495b6bb01cc5d368779
3
  size 334707473
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c5cef2a0f410dea412810e1e7dc92b2f6797785c8c0447008ff6e07b99e20f3
3
  size 334707473