iamkaikai committed on
Commit
481a43e
1 Parent(s): 01b3a4e

End of training

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. 10epoch-h/.gitattributes +36 -0
  2. 10epoch-h/README.md +46 -0
  3. 10epoch-h/feature_extractor/preprocessor_config.json +28 -0
  4. 10epoch-h/logs/text2image-fine-tune/1699306835.1319811/events.out.tfevents.1699306835.DESKTOP-TNN0PMP.8128.1 +3 -0
  5. 10epoch-h/logs/text2image-fine-tune/1699306835.1339812/hparams.yml +50 -0
  6. 10epoch-h/logs/text2image-fine-tune/1699312817.2914586/events.out.tfevents.1699312817.DESKTOP-TNN0PMP.10224.1 +3 -0
  7. 10epoch-h/logs/text2image-fine-tune/1699312817.2934585/hparams.yml +50 -0
  8. 10epoch-h/logs/text2image-fine-tune/1699314601.5908923/events.out.tfevents.1699314601.DESKTOP-TNN0PMP.2164.1 +3 -0
  9. 10epoch-h/logs/text2image-fine-tune/1699314601.5918913/hparams.yml +50 -0
  10. 10epoch-h/logs/text2image-fine-tune/1699412326.680156/events.out.tfevents.1699412326.DESKTOP-TNN0PMP.18100.1 +3 -0
  11. 10epoch-h/logs/text2image-fine-tune/1699412326.6821554/hparams.yml +50 -0
  12. 10epoch-h/logs/text2image-fine-tune/1699452581.0122697/events.out.tfevents.1699452581.DESKTOP-TNN0PMP.12764.1 +3 -0
  13. 10epoch-h/logs/text2image-fine-tune/1699452581.0132704/hparams.yml +50 -0
  14. 10epoch-h/logs/text2image-fine-tune/1699558210.3350325/events.out.tfevents.1699558210.DESKTOP-TNN0PMP.12724.1 +3 -0
  15. 10epoch-h/logs/text2image-fine-tune/1699558210.3370333/hparams.yml +50 -0
  16. 10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699306835.DESKTOP-TNN0PMP.8128.0 +3 -0
  17. 10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699312817.DESKTOP-TNN0PMP.10224.0 +3 -0
  18. 10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699314601.DESKTOP-TNN0PMP.2164.0 +3 -0
  19. 10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699412326.DESKTOP-TNN0PMP.18100.0 +3 -0
  20. 10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699452581.DESKTOP-TNN0PMP.12764.0 +3 -0
  21. 10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699558210.DESKTOP-TNN0PMP.12724.0 +3 -0
  22. 10epoch-h/model_index.json +34 -0
  23. 10epoch-h/safety_checker/config.json +28 -0
  24. 10epoch-h/safety_checker/model.safetensors +3 -0
  25. 10epoch-h/scheduler/scheduler_config.json +15 -0
  26. 10epoch-h/text_encoder/config.json +25 -0
  27. 10epoch-h/text_encoder/model.safetensors +3 -0
  28. 10epoch-h/tokenizer/merges.txt +0 -0
  29. 10epoch-h/tokenizer/special_tokens_map.json +24 -0
  30. 10epoch-h/tokenizer/tokenizer_config.json +33 -0
  31. 10epoch-h/tokenizer/vocab.json +0 -0
  32. 10epoch-h/unet/config.json +67 -0
  33. 10epoch-h/unet/diffusion_pytorch_model.safetensors +3 -0
  34. 10epoch-h/vae/config.json +32 -0
  35. 10epoch-h/vae/diffusion_pytorch_model.safetensors +3 -0
  36. 10epoch-h/val_imgs_grid.png +3 -0
  37. README.md +2 -2
  38. checkpoint-4620000/optimizer.bin +3 -0
  39. checkpoint-4620000/random_states_0.pkl +3 -0
  40. checkpoint-4620000/scaler.pt +3 -0
  41. checkpoint-4620000/scheduler.bin +3 -0
  42. checkpoint-4620000/unet/config.json +67 -0
  43. checkpoint-4620000/unet/diffusion_pytorch_model.safetensors +3 -0
  44. checkpoint-4640000/optimizer.bin +3 -0
  45. checkpoint-4640000/random_states_0.pkl +3 -0
  46. checkpoint-4640000/scaler.pt +3 -0
  47. checkpoint-4640000/scheduler.bin +3 -0
  48. checkpoint-4640000/unet/config.json +67 -0
  49. checkpoint-4640000/unet/diffusion_pytorch_model.safetensors +3 -0
  50. checkpoint-4660000/optimizer.bin +3 -0
10epoch-h/.gitattributes ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ val_imgs_grid.png filter=lfs diff=lfs merge=lfs -text
10epoch-h/README.md ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ license: creativeml-openrail-m
4
+ base_model: runwayml/stable-diffusion-v1-5
5
+ datasets:
6
+ - iamkaikai/amazing_logos_v4
7
+ tags:
8
+ - stable-diffusion
9
+ - stable-diffusion-diffusers
10
+ - text-to-image
11
+ - diffusers
12
+ inference: true
13
+ ---
14
+
15
+ # Text-to-image finetuning - iamkaikai/amazing-logos-v5
16
+
17
+ This pipeline was finetuned from **runwayml/stable-diffusion-v1-5** on the **iamkaikai/amazing_logos_v4** dataset. Below are some example images generated with the finetuned pipeline using the following prompts: ['Simple elegant logo for Mandarin Oriental, Fan Hong kong Lines Paper, Hospitality, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges, black and white', 'Simple elegant logo for AltVest Investments, alternative investments financial services, Finance, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for PeckCerativeHorz2.jpg, peck horizontal trends branding bold photography analysis packaging vertical products circle discovery identity color creative exhibition direction P graphics julian research, , successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', "Simple elegant logo for Johns Creek Shirts, printing T's art Apparel screen tshirt summer T t shirts, Apparel, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges", 'Simple elegant logo for MGD, Human Circle MGD dots Resources SRP 3D brown, Human Resources, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for Indooroopilly Uniting Church, abstract initials people swirl letter I letter U letter C giving community soft friendly purple blue red, Religious, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for Hacker, Douglas, & Company, accountant Hollywood law H filmstrip attorney HDC film, law, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for Windmill unused #5, windmill property 
community shapes quilt blades houses colorful carlsbad homes circle whimsical estate housing real, housing development, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for The Duck Store, track track and field sports athletics tree logo badge, Sports Apparel, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for InGenious Fitness, G Ball Green Blue, Fitness, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for KickCharge Creative, seating safety man driver person figure hardhat S initial sign, Transportation, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for Chickasaw Nation, water drop laundry, Commercial Laundry Services, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for NBA Properties, Inc., basketball sports branding team entertainment philadelphia star patriotic, Sports Entertainment, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for North Asheville Tailgate Market Veggie Sub Mark, culinary cheese Initials combo organic serif vegetable radish Farmers eggplant inspirations2023 tailgate food market submark asheville farm kale modern unique sanserif veggie , farmers market, culinary, food, retail, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges', 'Simple elegant logo for A. 
Diethelm, A Circle Line Switzerland Triangle, Painting Tools and Supplies, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges, black and white', 'Simple elegant logo for Grupo Altair Publicidad, Circle Lines Venezuela, Publishing, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges, black and white']:
18
+
19
+ ![val_imgs_grid](./val_imgs_grid.png)
20
+
21
+
22
+ ## Pipeline usage
23
+
24
+ You can use the pipeline like so:
25
+
26
+ ```python
27
+ from diffusers import DiffusionPipeline
28
+ import torch
29
+
30
+ pipeline = DiffusionPipeline.from_pretrained("iamkaikai/amazing-logos-v5", torch_dtype=torch.float16)
31
+ prompt = "Simple elegant logo for Mandarin Oriental, Fan Hong kong Lines Paper, Hospitality, successful vibe, minimalist, thought-provoking, abstract, recognizable, relatable, sharp, vector art, even edges, black and white"
32
+ image = pipeline(prompt).images[0]
33
+ image.save("my_image.png")
34
+ ```
35
+
36
+ ## Training info
37
+
38
+ These are the key hyperparameters used during training:
39
+
40
+ * Epochs: 10
41
+ * Learning rate: 1e-07
42
+ * Batch size: 1
43
+ * Gradient accumulation steps: 1
44
+ * Image resolution: 512
45
+ * Mixed-precision: fp16
46
+
10epoch-h/feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "feature_extractor_type": "CLIPFeatureExtractor",
12
+ "image_mean": [
13
+ 0.48145466,
14
+ 0.4578275,
15
+ 0.40821073
16
+ ],
17
+ "image_processor_type": "CLIPImageProcessor",
18
+ "image_std": [
19
+ 0.26862954,
20
+ 0.26130258,
21
+ 0.27577711
22
+ ],
23
+ "resample": 3,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "shortest_edge": 224
27
+ }
28
+ }
10epoch-h/logs/text2image-fine-tune/1699306835.1319811/events.out.tfevents.1699306835.DESKTOP-TNN0PMP.8128.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46cc3218caa95c24dcbbce7406b302ca38ea6a40634bfc0821830dee83201cf2
3
+ size 2414
10epoch-h/logs/text2image-fine-tune/1699306835.1339812/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: true
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 10000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: iamkaikai/amazing_logos_v4
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: amazing-logos-v5
18
+ hub_token: null
19
+ image_column: image
20
+ input_perturbation: 0
21
+ learning_rate: 1.0e-07
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 400000
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 3972510
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ non_ema_revision: null
32
+ num_train_epochs: 10
33
+ output_dir: amazing-logos-v5
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
36
+ push_to_hub: true
37
+ random_flip: false
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: checkpoint-3240000
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 6666
44
+ snr_gamma: null
45
+ tracker_project_name: text2image-fine-tune
46
+ train_batch_size: 1
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ use_ema: false
50
+ validation_epochs: 1
10epoch-h/logs/text2image-fine-tune/1699312817.2914586/events.out.tfevents.1699312817.DESKTOP-TNN0PMP.10224.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3ab3986a45e371e166029e85700caf99be1bafdad50a4ca1a01760b9d709314
3
+ size 2414
10epoch-h/logs/text2image-fine-tune/1699312817.2934585/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: true
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 10000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: iamkaikai/amazing_logos_v4
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: amazing-logos-v5
18
+ hub_token: null
19
+ image_column: image
20
+ input_perturbation: 0
21
+ learning_rate: 1.0e-07
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 400000
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 3972510
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ non_ema_revision: null
32
+ num_train_epochs: 10
33
+ output_dir: amazing-logos-v5
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
36
+ push_to_hub: true
37
+ random_flip: false
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: checkpoint-3240000
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 6666
44
+ snr_gamma: null
45
+ tracker_project_name: text2image-fine-tune
46
+ train_batch_size: 1
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ use_ema: false
50
+ validation_epochs: 1
10epoch-h/logs/text2image-fine-tune/1699314601.5908923/events.out.tfevents.1699314601.DESKTOP-TNN0PMP.2164.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5a8200fb531b1404a6c88caa9516db413e527fd724f6cc1264a8d0b2aafaa5f
3
+ size 2414
10epoch-h/logs/text2image-fine-tune/1699314601.5918913/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: true
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 20000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: iamkaikai/amazing_logos_v4
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: amazing-logos-v5
18
+ hub_token: null
19
+ image_column: image
20
+ input_perturbation: 0
21
+ learning_rate: 1.0e-07
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 400000
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 3972510
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ non_ema_revision: null
32
+ num_train_epochs: 10
33
+ output_dir: amazing-logos-v5
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
36
+ push_to_hub: true
37
+ random_flip: false
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: checkpoint-3250000
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 6666
44
+ snr_gamma: null
45
+ tracker_project_name: text2image-fine-tune
46
+ train_batch_size: 1
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ use_ema: false
50
+ validation_epochs: 1
10epoch-h/logs/text2image-fine-tune/1699412326.680156/events.out.tfevents.1699412326.DESKTOP-TNN0PMP.18100.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba028b8220a8188a2b0ef94153b18aa7b28720363c8052aa89162ed586ddf112
3
+ size 2414
10epoch-h/logs/text2image-fine-tune/1699412326.6821554/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: true
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 20000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: iamkaikai/amazing_logos_v4
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: amazing-logos-v5
18
+ hub_token: null
19
+ image_column: image
20
+ input_perturbation: 0
21
+ learning_rate: 1.0e-07
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 400000
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 3972510
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ non_ema_revision: null
32
+ num_train_epochs: 10
33
+ output_dir: amazing-logos-v5
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
36
+ push_to_hub: true
37
+ random_flip: false
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: checkpoint-3540000
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 6666
44
+ snr_gamma: null
45
+ tracker_project_name: text2image-fine-tune
46
+ train_batch_size: 1
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ use_ema: false
50
+ validation_epochs: 1
10epoch-h/logs/text2image-fine-tune/1699452581.0122697/events.out.tfevents.1699452581.DESKTOP-TNN0PMP.12764.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdb4a8da4193d1c78d0577c314b1d8a14131ebb0e0ccca0bac3dc8dbc8931103
3
+ size 2414
10epoch-h/logs/text2image-fine-tune/1699452581.0132704/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: true
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 20000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: iamkaikai/amazing_logos_v4
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: amazing-logos-v5
18
+ hub_token: null
19
+ image_column: image
20
+ input_perturbation: 0
21
+ learning_rate: 1.0e-07
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 400000
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 3972510
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ non_ema_revision: null
32
+ num_train_epochs: 10
33
+ output_dir: amazing-logos-v5
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
36
+ push_to_hub: true
37
+ random_flip: false
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: checkpoint-3560000
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 6666
44
+ snr_gamma: null
45
+ tracker_project_name: text2image-fine-tune
46
+ train_batch_size: 1
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ use_ema: false
50
+ validation_epochs: 1
10epoch-h/logs/text2image-fine-tune/1699558210.3350325/events.out.tfevents.1699558210.DESKTOP-TNN0PMP.12724.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e90272b18da5b394bfb18694370af0c6aa7600806b1a84f952c78a68aea4b474
3
+ size 2414
10epoch-h/logs/text2image-fine-tune/1699558210.3370333/hparams.yml ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: true
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 20000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: iamkaikai/amazing_logos_v4
14
+ enable_xformers_memory_efficient_attention: false
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: amazing-logos-v5
18
+ hub_token: null
19
+ image_column: image
20
+ input_perturbation: 0
21
+ learning_rate: 1.0e-07
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: cosine
25
+ lr_warmup_steps: 400000
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 3972510
29
+ mixed_precision: fp16
30
+ noise_offset: 0
31
+ non_ema_revision: null
32
+ num_train_epochs: 10
33
+ output_dir: amazing-logos-v5
34
+ prediction_type: null
35
+ pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
36
+ push_to_hub: true
37
+ random_flip: false
38
+ report_to: tensorboard
39
+ resolution: 512
40
+ resume_from_checkpoint: checkpoint-3740000
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 6666
44
+ snr_gamma: null
45
+ tracker_project_name: text2image-fine-tune
46
+ train_batch_size: 1
47
+ train_data_dir: null
48
+ use_8bit_adam: false
49
+ use_ema: false
50
+ validation_epochs: 1
10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699306835.DESKTOP-TNN0PMP.8128.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71bba50968bcf32f0624de77b0872430d4712b48e16517c38dd20300583d5279
3
+ size 990610
10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699312817.DESKTOP-TNN0PMP.10224.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a945b0775debaded0e081ccae4f745b9cc49617bc470774096d49ca32b0ace2a
3
+ size 295225
10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699314601.DESKTOP-TNN0PMP.2164.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8150acd8eea3a8e16cb305f3dddb84c095b22d35be5bd433d8a1fb9c20a503ee
3
+ size 15295549
10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699412326.DESKTOP-TNN0PMP.18100.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:796213a23182deed80394e67dc42c2c2e4a032ae2d50f09665eb105dda654691
3
+ size 1563442
10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699452581.DESKTOP-TNN0PMP.12764.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20e0cf4c5f1d887b92da1f9d281193b87e81c9580683ec1f13fa922362db7f29
3
+ size 9379396
10epoch-h/logs/text2image-fine-tune/events.out.tfevents.1699558210.DESKTOP-TNN0PMP.12724.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14d095d7d1c5036780affc30fb5c83ef50109364393014cc48183efe946310da
3
+ size 18673753
10epoch-h/model_index.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "StableDiffusionPipeline",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
+ "feature_extractor": [
6
+ "transformers",
7
+ "CLIPImageProcessor"
8
+ ],
9
+ "requires_safety_checker": true,
10
+ "safety_checker": [
11
+ "stable_diffusion",
12
+ "StableDiffusionSafetyChecker"
13
+ ],
14
+ "scheduler": [
15
+ "diffusers",
16
+ "PNDMScheduler"
17
+ ],
18
+ "text_encoder": [
19
+ "transformers",
20
+ "CLIPTextModel"
21
+ ],
22
+ "tokenizer": [
23
+ "transformers",
24
+ "CLIPTokenizer"
25
+ ],
26
+ "unet": [
27
+ "diffusers",
28
+ "UNet2DConditionModel"
29
+ ],
30
+ "vae": [
31
+ "diffusers",
32
+ "AutoencoderKL"
33
+ ]
34
+ }
10epoch-h/safety_checker/config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "C:\\Users\\Kyle\\.cache\\huggingface\\hub\\models--runwayml--stable-diffusion-v1-5\\snapshots\\1d0c4ebf6ff58a5caecab40fa1406526bca4b5b9\\safety_checker",
3
+ "architectures": [
4
+ "StableDiffusionSafetyChecker"
5
+ ],
6
+ "initializer_factor": 1.0,
7
+ "logit_scale_init_value": 2.6592,
8
+ "model_type": "clip",
9
+ "projection_dim": 768,
10
+ "text_config": {
11
+ "dropout": 0.0,
12
+ "hidden_size": 768,
13
+ "intermediate_size": 3072,
14
+ "model_type": "clip_text_model",
15
+ "num_attention_heads": 12
16
+ },
17
+ "torch_dtype": "float32",
18
+ "transformers_version": "4.32.1",
19
+ "vision_config": {
20
+ "dropout": 0.0,
21
+ "hidden_size": 1024,
22
+ "intermediate_size": 4096,
23
+ "model_type": "clip_vision_model",
24
+ "num_attention_heads": 16,
25
+ "num_hidden_layers": 24,
26
+ "patch_size": 14
27
+ }
28
+ }
10epoch-h/safety_checker/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb351a5ded815c3ff744968ad9c6b218d071b9d313d04f35e813b84b4c0ffde8
3
+ size 1215979664
10epoch-h/scheduler/scheduler_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "PNDMScheduler",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "beta_end": 0.012,
5
+ "beta_schedule": "scaled_linear",
6
+ "beta_start": 0.00085,
7
+ "clip_sample": false,
8
+ "num_train_timesteps": 1000,
9
+ "prediction_type": "epsilon",
10
+ "set_alpha_to_one": false,
11
+ "skip_prk_steps": true,
12
+ "steps_offset": 1,
13
+ "timestep_spacing": "leading",
14
+ "trained_betas": null
15
+ }
10epoch-h/text_encoder/config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
3
+ "architectures": [
4
+ "CLIPTextModel"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 0,
8
+ "dropout": 0.0,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "quick_gelu",
11
+ "hidden_size": 768,
12
+ "initializer_factor": 1.0,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 77,
17
+ "model_type": "clip_text_model",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 12,
20
+ "pad_token_id": 1,
21
+ "projection_dim": 768,
22
+ "torch_dtype": "float16",
23
+ "transformers_version": "4.32.1",
24
+ "vocab_size": 49408
25
+ }
10epoch-h/text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660c6f5b1abae9dc498ac2d21e1347d2abdb0cf6c0c0c8576cd796491d9a6cdd
3
+ size 246144152
10epoch-h/tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
10epoch-h/tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<|endoftext|>",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
10epoch-h/tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": {
4
+ "__type": "AddedToken",
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "clean_up_tokenization_spaces": true,
12
+ "do_lower_case": true,
13
+ "eos_token": {
14
+ "__type": "AddedToken",
15
+ "content": "<|endoftext|>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "errors": "replace",
22
+ "model_max_length": 77,
23
+ "pad_token": "<|endoftext|>",
24
+ "tokenizer_class": "CLIPTokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<|endoftext|>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }
10epoch-h/tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
10epoch-h/unet/config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "amazing-logos-v5\\checkpoint-3740000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "attention_type": "default",
11
+ "block_out_channels": [
12
+ 320,
13
+ 640,
14
+ 1280,
15
+ 1280
16
+ ],
17
+ "center_input_sample": false,
18
+ "class_embed_type": null,
19
+ "class_embeddings_concat": false,
20
+ "conv_in_kernel": 3,
21
+ "conv_out_kernel": 3,
22
+ "cross_attention_dim": 768,
23
+ "cross_attention_norm": null,
24
+ "down_block_types": [
25
+ "CrossAttnDownBlock2D",
26
+ "CrossAttnDownBlock2D",
27
+ "CrossAttnDownBlock2D",
28
+ "DownBlock2D"
29
+ ],
30
+ "downsample_padding": 1,
31
+ "dropout": 0.0,
32
+ "dual_cross_attention": false,
33
+ "encoder_hid_dim": null,
34
+ "encoder_hid_dim_type": null,
35
+ "flip_sin_to_cos": true,
36
+ "freq_shift": 0,
37
+ "in_channels": 4,
38
+ "layers_per_block": 2,
39
+ "mid_block_only_cross_attention": null,
40
+ "mid_block_scale_factor": 1,
41
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
42
+ "norm_eps": 1e-05,
43
+ "norm_num_groups": 32,
44
+ "num_attention_heads": null,
45
+ "num_class_embeds": null,
46
+ "only_cross_attention": false,
47
+ "out_channels": 4,
48
+ "projection_class_embeddings_input_dim": null,
49
+ "resnet_out_scale_factor": 1.0,
50
+ "resnet_skip_time_act": false,
51
+ "resnet_time_scale_shift": "default",
52
+ "sample_size": 64,
53
+ "time_cond_proj_dim": null,
54
+ "time_embedding_act_fn": null,
55
+ "time_embedding_dim": null,
56
+ "time_embedding_type": "positional",
57
+ "timestep_post_act": null,
58
+ "transformer_layers_per_block": 1,
59
+ "up_block_types": [
60
+ "UpBlock2D",
61
+ "CrossAttnUpBlock2D",
62
+ "CrossAttnUpBlock2D",
63
+ "CrossAttnUpBlock2D"
64
+ ],
65
+ "upcast_attention": false,
66
+ "use_linear_projection": false
67
+ }
10epoch-h/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34b80faa14958ed4e0ceed392e49796d6147b27995c6bca47f89d7a43314f108
3
+ size 3438167536
10epoch-h/vae/config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "runwayml/stable-diffusion-v1-5",
5
+ "act_fn": "silu",
6
+ "block_out_channels": [
7
+ 128,
8
+ 256,
9
+ 512,
10
+ 512
11
+ ],
12
+ "down_block_types": [
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D",
16
+ "DownEncoderBlock2D"
17
+ ],
18
+ "force_upcast": true,
19
+ "in_channels": 3,
20
+ "latent_channels": 4,
21
+ "layers_per_block": 2,
22
+ "norm_num_groups": 32,
23
+ "out_channels": 3,
24
+ "sample_size": 512,
25
+ "scaling_factor": 0.18215,
26
+ "up_block_types": [
27
+ "UpDecoderBlock2D",
28
+ "UpDecoderBlock2D",
29
+ "UpDecoderBlock2D",
30
+ "UpDecoderBlock2D"
31
+ ]
32
+ }
10epoch-h/vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fbcf0ebe55a0984f5a5e00d8c4521d52359af7229bb4d81890039d2aa16dd7c
3
+ size 167335342
10epoch-h/val_imgs_grid.png ADDED

Git LFS Details

  • SHA256: 72404ab2b11666f9dcd2a6882c2528b87ac6ec130e7afc51cfd3b4e52263088a
  • Pointer size: 132 Bytes
  • Size of remote file: 6.56 MB
README.md CHANGED
@@ -37,8 +37,8 @@ image.save("my_image.png")
37
 
38
  These are the key hyperparameters used during training:
39
 
40
- * Epochs: 10
41
- * Learning rate: 1e-07
42
  * Batch size: 1
43
  * Gradient accumulation steps: 1
44
  * Image resolution: 512
 
37
 
38
  These are the key hyperparameters used during training:
39
 
40
+ * Epochs: 12
41
+ * Learning rate: 1e-08
42
  * Batch size: 1
43
  * Gradient accumulation steps: 1
44
  * Image resolution: 512
checkpoint-4620000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffc66c28eb8985e2319ae509d5606a38aaea7363cb61d84a2c422cfaa8315c9b
3
+ size 6876750164
checkpoint-4620000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8a88b232795abf7aeb2bd310729f02ec5e051f8c22f194022722c496d48a739
3
+ size 14408
checkpoint-4620000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6a9841372e72ae25fb5e71f2bc73568788f589d92b4e739d5ab70c7100ff30
3
+ size 988
checkpoint-4620000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccbd9000c530a76a010d797bea98d42b3ce8845bc67db605bb84713bb907c3a4
3
+ size 1000
checkpoint-4620000/unet/config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "amazing-logos-v5\\checkpoint-4560000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "attention_type": "default",
11
+ "block_out_channels": [
12
+ 320,
13
+ 640,
14
+ 1280,
15
+ 1280
16
+ ],
17
+ "center_input_sample": false,
18
+ "class_embed_type": null,
19
+ "class_embeddings_concat": false,
20
+ "conv_in_kernel": 3,
21
+ "conv_out_kernel": 3,
22
+ "cross_attention_dim": 768,
23
+ "cross_attention_norm": null,
24
+ "down_block_types": [
25
+ "CrossAttnDownBlock2D",
26
+ "CrossAttnDownBlock2D",
27
+ "CrossAttnDownBlock2D",
28
+ "DownBlock2D"
29
+ ],
30
+ "downsample_padding": 1,
31
+ "dropout": 0.0,
32
+ "dual_cross_attention": false,
33
+ "encoder_hid_dim": null,
34
+ "encoder_hid_dim_type": null,
35
+ "flip_sin_to_cos": true,
36
+ "freq_shift": 0,
37
+ "in_channels": 4,
38
+ "layers_per_block": 2,
39
+ "mid_block_only_cross_attention": null,
40
+ "mid_block_scale_factor": 1,
41
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
42
+ "norm_eps": 1e-05,
43
+ "norm_num_groups": 32,
44
+ "num_attention_heads": null,
45
+ "num_class_embeds": null,
46
+ "only_cross_attention": false,
47
+ "out_channels": 4,
48
+ "projection_class_embeddings_input_dim": null,
49
+ "resnet_out_scale_factor": 1.0,
50
+ "resnet_skip_time_act": false,
51
+ "resnet_time_scale_shift": "default",
52
+ "sample_size": 64,
53
+ "time_cond_proj_dim": null,
54
+ "time_embedding_act_fn": null,
55
+ "time_embedding_dim": null,
56
+ "time_embedding_type": "positional",
57
+ "timestep_post_act": null,
58
+ "transformer_layers_per_block": 1,
59
+ "up_block_types": [
60
+ "UpBlock2D",
61
+ "CrossAttnUpBlock2D",
62
+ "CrossAttnUpBlock2D",
63
+ "CrossAttnUpBlock2D"
64
+ ],
65
+ "upcast_attention": false,
66
+ "use_linear_projection": false
67
+ }
checkpoint-4620000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9639b65078b9265bb3f8d7d1205147817e17b60d8ede0f73ddcb58f9e8ad189
3
+ size 3438167536
checkpoint-4640000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb22b44fbafad45a8dbd1f668e3f6e17403c0d9889b1c25d1808184098fc567f
3
+ size 6876750164
checkpoint-4640000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b0c05bd1c756e5a8a02c92d9f8ccd614e4c42cc03beac5dd95eae6933cc2afb
3
+ size 14408
checkpoint-4640000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c1bb8cddda47fca5c0408c6bd99418448a32025bad6181574466273ba91e228
3
+ size 988
checkpoint-4640000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d01dc69b3ba6d183e0fab9f067e457d2187898ce4a44f66912f58dd528a2e074
3
+ size 1000
checkpoint-4640000/unet/config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "amazing-logos-v5\\checkpoint-4560000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "attention_type": "default",
11
+ "block_out_channels": [
12
+ 320,
13
+ 640,
14
+ 1280,
15
+ 1280
16
+ ],
17
+ "center_input_sample": false,
18
+ "class_embed_type": null,
19
+ "class_embeddings_concat": false,
20
+ "conv_in_kernel": 3,
21
+ "conv_out_kernel": 3,
22
+ "cross_attention_dim": 768,
23
+ "cross_attention_norm": null,
24
+ "down_block_types": [
25
+ "CrossAttnDownBlock2D",
26
+ "CrossAttnDownBlock2D",
27
+ "CrossAttnDownBlock2D",
28
+ "DownBlock2D"
29
+ ],
30
+ "downsample_padding": 1,
31
+ "dropout": 0.0,
32
+ "dual_cross_attention": false,
33
+ "encoder_hid_dim": null,
34
+ "encoder_hid_dim_type": null,
35
+ "flip_sin_to_cos": true,
36
+ "freq_shift": 0,
37
+ "in_channels": 4,
38
+ "layers_per_block": 2,
39
+ "mid_block_only_cross_attention": null,
40
+ "mid_block_scale_factor": 1,
41
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
42
+ "norm_eps": 1e-05,
43
+ "norm_num_groups": 32,
44
+ "num_attention_heads": null,
45
+ "num_class_embeds": null,
46
+ "only_cross_attention": false,
47
+ "out_channels": 4,
48
+ "projection_class_embeddings_input_dim": null,
49
+ "resnet_out_scale_factor": 1.0,
50
+ "resnet_skip_time_act": false,
51
+ "resnet_time_scale_shift": "default",
52
+ "sample_size": 64,
53
+ "time_cond_proj_dim": null,
54
+ "time_embedding_act_fn": null,
55
+ "time_embedding_dim": null,
56
+ "time_embedding_type": "positional",
57
+ "timestep_post_act": null,
58
+ "transformer_layers_per_block": 1,
59
+ "up_block_types": [
60
+ "UpBlock2D",
61
+ "CrossAttnUpBlock2D",
62
+ "CrossAttnUpBlock2D",
63
+ "CrossAttnUpBlock2D"
64
+ ],
65
+ "upcast_attention": false,
66
+ "use_linear_projection": false
67
+ }
checkpoint-4640000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e92ff28cd2f656ccb1833cc092bbcf2fd7883caa06cab1c0d9b504a34b5cef90
3
+ size 3438167536
checkpoint-4660000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:771a2c1d37f97c94ffd4973b56adcb8e1689b18fa2e5c1f7aa3965f8b4e00300
3
+ size 6876750164