kyujinpy committed on
Commit
81a9e19
•
1 Parent(s): f559d47

Upload 2 files

Browse files
Files changed (2) hide show
  1. config.yaml +46 -0
  2. model_index.json +4 -12
config.yaml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ pretrained_model_path: ./checkpoints/kyujinpy/KO-stable-diffusion-disney
2
+ output_dir: outputs/bear_guitar
3
+ train_data:
4
+ video_path: data/bear_guitar.mp4
5
+ prompt: A bear is playing guitar
6
+ n_sample_frames: 14
7
+ width: 512
8
+ height: 512
9
+ sample_start_idx: 0
10
+ sample_frame_rate: 2
11
+ validation_data:
12
+ prompts:
13
+ - 잘생긴 왕자가 피아노를 연주하고 있습니다, 모던한 디즈니 스타일
14
+ - 엘프가 피아노를 연주하고 있습니다, 모던한 디즈니 스타일
15
+ - 빨간색 머리를 한 공주가 피아노를 연주하고 있습니다, 모던한 디즈니 스타일
16
+ video_length: 14
17
+ width: 512
18
+ height: 512
19
+ num_inference_steps: 20
20
+ guidance_scale: 12.5
21
+ use_inv_latent: true
22
+ num_inv_steps: 50
23
+ validation_steps: 100
24
+ trainable_modules:
25
+ - attn1.to_q
26
+ - attn2.to_q
27
+ - attn_temp
28
+ train_batch_size: 1
29
+ max_train_steps: 400
30
+ learning_rate: 3.0e-05
31
+ scale_lr: false
32
+ lr_scheduler: constant
33
+ lr_warmup_steps: 0
34
+ adam_beta1: 0.9
35
+ adam_beta2: 0.999
36
+ adam_weight_decay: 0.01
37
+ adam_epsilon: 1.0e-08
38
+ max_grad_norm: 1.0
39
+ gradient_accumulation_steps: 1
40
+ gradient_checkpointing: true
41
+ checkpointing_steps: 1000
42
+ resume_from_checkpoint: null
43
+ mixed_precision: fp16
44
+ use_8bit_adam: false
45
+ enable_xformers_memory_efficient_attention: true
46
+ seed: 33
model_index.json CHANGED
@@ -1,14 +1,6 @@
1
  {
2
- "_class_name": "StableDiffusionPipeline",
3
- "_diffusers_version": "0.6.0",
4
- "feature_extractor": [
5
- "transformers",
6
- "CLIPImageProcessor"
7
- ],
8
- "safety_checker": [
9
- "stable_diffusion",
10
- "StableDiffusionSafetyChecker"
11
- ],
12
  "scheduler": [
13
  "diffusers",
14
  "PNDMScheduler"
@@ -22,8 +14,8 @@
22
  "CLIPTokenizer"
23
  ],
24
  "unet": [
25
- "diffusers",
26
- "UNet2DConditionModel"
27
  ],
28
  "vae": [
29
  "diffusers",
 
1
  {
2
+ "_class_name": "TuneAVideoPipeline",
3
+ "_diffusers_version": "0.11.1",
 
 
 
 
 
 
 
 
4
  "scheduler": [
5
  "diffusers",
6
  "PNDMScheduler"
 
14
  "CLIPTokenizer"
15
  ],
16
  "unet": [
17
+ "models",
18
+ "UNet3DConditionModel"
19
  ],
20
  "vae": [
21
  "diffusers",