briannlongzhao committed on
Commit
71abb4d
1 Parent(s): d2eb9ef

End of training

Browse files
README.md CHANGED
@@ -2,21 +2,16 @@
2
  ---
3
  license: creativeml-openrail-m
4
  base_model: stabilityai/stable-diffusion-2-1
5
- instance_prompt: a photo of <new1> stinkhorn mushroom
6
  tags:
7
  - stable-diffusion
8
  - stable-diffusion-diffusers
9
  - text-to-image
10
  - diffusers
11
- - custom-diffusion
12
  inference: true
13
  ---
14
 
15
- # Custom Diffusion - briannlongzhao/99
 
16
 
17
- These are Custom Diffusion adaptation weights for stabilityai/stable-diffusion-2-1. The weights were trained on the prompt "a photo of <new1> stinkhorn mushroom" using [Custom Diffusion](https://www.cs.cmu.edu/~custom-diffusion). You can find some example images below.
18
 
19
-
20
-
21
-
22
- For more details on the training, please follow [this link](https://github.com/huggingface/diffusers/blob/main/examples/custom_diffusion).
 
2
  ---
3
  license: creativeml-openrail-m
4
  base_model: stabilityai/stable-diffusion-2-1
 
5
  tags:
6
  - stable-diffusion
7
  - stable-diffusion-diffusers
8
  - text-to-image
9
  - diffusers
10
+ - textual_inversion
11
  inference: true
12
  ---
13
 
14
+ # Textual inversion text2image fine-tuning - briannlongzhao/99
15
+ These are textual inversion adaptation weights for stabilityai/stable-diffusion-2-1. You can find some example images below.
16
 
 
17
 
 
 
 
 
learned_embeds.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfbfb8bb4c74efaa013a0af3b41aae3040318bca3e2e58325d647a3408d60455
3
  size 4216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e756ce5ec8ef051503618f937b61e41dd5477bd43a511bb6e7c0e739c4cad73
3
  size 4216
logs/textual_inversion/1706461845.9829762/events.out.tfevents.1706461846.node-0.2749.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b2d66762b1757ad154e96323e7ceb8c504343ab66d78aa5f2636c282bc13a17
3
+ size 2535
logs/textual_inversion/1706461846.9282053/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ class_name: stinkhorn mushroom
10
+ dataloader_num_workers: 0
11
+ enable_xformers_memory_efficient_attention: true
12
+ gradient_accumulation_steps: 4
13
+ gradient_checkpointing: false
14
+ hub_model_id: null
15
+ hub_token: null
16
+ idx: 99
17
+ initializer_token: stinkhorn mushroom
18
+ learnable_property: object
19
+ learning_rate: 0.008
20
+ local_rank: -1
21
+ logging_dir: logs
22
+ lr_num_cycles: 1
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_train_steps: 35
26
+ mixed_precision: fp16
27
+ no_safe_serialization: false
28
+ num_train_epochs: 5
29
+ num_validation_images: 4
30
+ num_vectors: 1
31
+ output_dir: /mnt/default/textual_inversion_models_medium/99
32
+ placeholder_token: <stinkhorn mushroom>
33
+ pretrained_model_name_or_path: stabilityai/stable-diffusion-2-1
34
+ push_to_hub: true
35
+ repeats: 1
36
+ report_to: tensorboard
37
+ resolution: 512
38
+ resume_from_checkpoint: null
39
+ revision: null
40
+ save_as_full_pipeline: false
41
+ save_steps: 500
42
+ scale_lr: true
43
+ seed: null
44
+ tokenizer_name: null
45
+ train_batch_size: 4
46
+ train_data_dir: /mnt/default/imagenet/images/train_medium/n13040303
47
+ validation_epochs: null
48
+ validation_prompt: null
49
+ validation_steps: 100
50
+ wnid: n13040303
logs/textual_inversion/1706473799.1283302/events.out.tfevents.1706473799.node-0.2616.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0386b5566d33bd887a967ef95f9c602411ce769a7f3157a8e221c6f0af594d2
3
+ size 2535
logs/textual_inversion/1706473800.080144/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ class_name: stinkhorn mushroom
10
+ dataloader_num_workers: 0
11
+ enable_xformers_memory_efficient_attention: true
12
+ gradient_accumulation_steps: 4
13
+ gradient_checkpointing: false
14
+ hub_model_id: null
15
+ hub_token: null
16
+ idx: 99
17
+ initializer_token: stinkhorn mushroom
18
+ learnable_property: object
19
+ learning_rate: 0.008
20
+ local_rank: -1
21
+ logging_dir: logs
22
+ lr_num_cycles: 1
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_train_steps: 35
26
+ mixed_precision: fp16
27
+ no_safe_serialization: false
28
+ num_train_epochs: 5
29
+ num_validation_images: 4
30
+ num_vectors: 1
31
+ output_dir: /mnt/default/textual_inversion_models_medium/99
32
+ placeholder_token: <stinkhorn mushroom>
33
+ pretrained_model_name_or_path: stabilityai/stable-diffusion-2-1
34
+ push_to_hub: true
35
+ repeats: 1
36
+ report_to: tensorboard
37
+ resolution: 512
38
+ resume_from_checkpoint: null
39
+ revision: null
40
+ save_as_full_pipeline: false
41
+ save_steps: 500
42
+ scale_lr: true
43
+ seed: null
44
+ tokenizer_name: null
45
+ train_batch_size: 4
46
+ train_data_dir: /mnt/default/imagenet/images/train_medium/n13040303
47
+ validation_epochs: null
48
+ validation_prompt: null
49
+ validation_steps: 100
50
+ wnid: n13040303
logs/textual_inversion/events.out.tfevents.1706461845.node-0.2749.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c3ddbf7566080b0fe259663160db3e170b6e6a27089ad1cce17ae3bdc136d3e
3
+ size 6472
logs/textual_inversion/events.out.tfevents.1706473798.node-0.2616.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26d53aca38489fddcca598ef891cab9a67a47c6ebba615766b6963e32a9ac8ff
3
+ size 10326
text_encoder/config.json CHANGED
@@ -19,7 +19,7 @@
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
- "torch_dtype": "float16",
23
  "transformers_version": "4.28.1",
24
- "vocab_size": 49408
25
  }
 
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
+ "torch_dtype": "float32",
23
  "transformers_version": "4.28.1",
24
+ "vocab_size": 49409
25
  }
text_encoder/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:681c555376658c81dc273f2d737a2aeb23ddb6d1d8e5b3a7064636d359a22668
3
- size 680821096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4cb3f5fb87dbdd0ba9e6788db03b6be81a72b08a3b403a13617c2a61ce14a40
3
+ size 1361601112
unet/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b83750631fa02da5069e880248a847db4c0a079e9b9c29f1f4b12dccf484861
3
- size 3463726504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3a4d7978884c5e4ef00b62641b1b544b257be2f6715d984188610ad6475ad2
3
+ size 1731904736
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.25.1",
4
- "_name_or_path": "/home/aiscuser/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/5cae40e6a2745ae2b01ad92ae5043f95f23644d6/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.25.1",
4
+ "_name_or_path": "stabilityai/stable-diffusion-2-1",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
vae/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aa1f43011b553a4cba7f37456465cdbd48aab7b54b9348b890e8058ea7683ec
3
- size 334643268
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e4c08995484ee61270175e9e7a072b66a6e4eeb5f0c266667fe1f45b90daf9a
3
+ size 167335342