briannlongzhao committed on
Commit
3d289f8
1 Parent(s): cdf539f

End of training

Browse files
README.md CHANGED
@@ -2,21 +2,16 @@
2
  ---
3
  license: creativeml-openrail-m
4
  base_model: stabilityai/stable-diffusion-2-1
5
- instance_prompt: a photo of <new1> Shih Tzu
6
  tags:
7
  - stable-diffusion
8
  - stable-diffusion-diffusers
9
  - text-to-image
10
  - diffusers
11
- - custom-diffusion
12
  inference: true
13
  ---
14
 
15
- # Custom Diffusion - briannlongzhao/14
 
16
 
17
- These are Custom Diffusion adaption weights for stabilityai/stable-diffusion-2-1. The weights were trained on a photo of <new1> Shih Tzu using [Custom Diffusion](https://www.cs.cmu.edu/~custom-diffusion). You can find some example images in the following.
18
 
19
-
20
-
21
-
22
- For more details on the training, please follow [this link](https://github.com/huggingface/diffusers/blob/main/examples/custom_diffusion).
 
2
  ---
3
  license: creativeml-openrail-m
4
  base_model: stabilityai/stable-diffusion-2-1
 
5
  tags:
6
  - stable-diffusion
7
  - stable-diffusion-diffusers
8
  - text-to-image
9
  - diffusers
10
+ - textual_inversion
11
  inference: true
12
  ---
13
 
14
+ # Textual inversion text2image fine-tuning - briannlongzhao/14
15
+ These are textual inversion adaptation weights for stabilityai/stable-diffusion-2-1. You can find some example images below.
16
 
 
17
 
 
 
 
 
learned_embeds.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6317c92aeafd2cad5a9774d5e42a3afb9d5aad4f433921a068a044a0993499cc
3
  size 4208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ee640b6dd0f4dd9122b4dea0c34159db5e5504984e793cd5c2bdc71b2612cd6
3
  size 4208
logs/textual_inversion/1706453945.1587198/events.out.tfevents.1706453945.node-0.2597.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36f4fc9c6912a327687d5585dc907f7a97507650aea2a82a481ffa67e0364bf2
3
+ size 2505
logs/textual_inversion/1706453945.6462321/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ center_crop: false
7
+ checkpointing_steps: 500
8
+ checkpoints_total_limit: null
9
+ class_name: Shih Tzu
10
+ dataloader_num_workers: 0
11
+ enable_xformers_memory_efficient_attention: true
12
+ gradient_accumulation_steps: 4
13
+ gradient_checkpointing: false
14
+ hub_model_id: null
15
+ hub_token: null
16
+ idx: 14
17
+ initializer_token: Shih Tzu
18
+ learnable_property: object
19
+ learning_rate: 0.008
20
+ local_rank: -1
21
+ logging_dir: logs
22
+ lr_num_cycles: 1
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_train_steps: 35
26
+ mixed_precision: fp16
27
+ no_safe_serialization: false
28
+ num_train_epochs: 5
29
+ num_validation_images: 4
30
+ num_vectors: 1
31
+ output_dir: /mnt/default/textual_inversion_models_medium/14
32
+ placeholder_token: <Shih Tzu>
33
+ pretrained_model_name_or_path: stabilityai/stable-diffusion-2-1
34
+ push_to_hub: true
35
+ repeats: 1
36
+ report_to: tensorboard
37
+ resolution: 512
38
+ resume_from_checkpoint: null
39
+ revision: null
40
+ save_as_full_pipeline: false
41
+ save_steps: 500
42
+ scale_lr: true
43
+ seed: null
44
+ tokenizer_name: null
45
+ train_batch_size: 4
46
+ train_data_dir: /mnt/default/imagenet/images/train_medium/n02086240
47
+ validation_epochs: null
48
+ validation_prompt: null
49
+ validation_steps: 100
50
+ wnid: n02086240
logs/textual_inversion/events.out.tfevents.1706453945.node-0.2597.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a5b99987e8132c87545299a3916c0be15a619d023a86c6b96870ebc819747a
3
+ size 10326
text_encoder/config.json CHANGED
@@ -19,7 +19,7 @@
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
- "torch_dtype": "float16",
23
  "transformers_version": "4.28.1",
24
- "vocab_size": 49408
25
  }
 
19
  "num_hidden_layers": 23,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
+ "torch_dtype": "float32",
23
  "transformers_version": "4.28.1",
24
+ "vocab_size": 49409
25
  }
text_encoder/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:681c555376658c81dc273f2d737a2aeb23ddb6d1d8e5b3a7064636d359a22668
3
- size 680821096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d393b1231bb022451bdd777a3908894dac11974f02b0866893f3f9a3a86cea5a
3
+ size 1361601112
unet/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2ba315dea0b83dc692127b58c62536158fd154be1b29a7091869f0c3cc439bf
3
- size 3463726504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3a4d7978884c5e4ef00b62641b1b544b257be2f6715d984188610ad6475ad2
3
+ size 1731904736
vae/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.25.1",
4
- "_name_or_path": "/home/aiscuser/.cache/huggingface/hub/models--stabilityai--stable-diffusion-2-1/snapshots/5cae40e6a2745ae2b01ad92ae5043f95f23644d6/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
  "_diffusers_version": "0.25.1",
4
+ "_name_or_path": "stabilityai/stable-diffusion-2-1",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  128,
vae/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aa1f43011b553a4cba7f37456465cdbd48aab7b54b9348b890e8058ea7683ec
3
- size 334643268
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e4c08995484ee61270175e9e7a072b66a6e4eeb5f0c266667fe1f45b90daf9a
3
+ size 167335342