File size: 1,124 Bytes
bde9e93
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
# Filesystem locations (both are relative paths): the pretrained model and the
# output directory.
pretrained_model_path: './checkpoints/Bingsu/my-korean-stable-diffusion-v1-5'
# NOTE(review): this directory is named "bear_guitar" while
# train_data.video_path points at data/man-surfing.mp4 — confirm that this is
# the intended output location.
output_dir: 'outputs/bear_guitar'
# Training clip and the text prompt paired with it.
train_data:
  video_path: 'data/man-surfing.mp4'
  prompt: 'A man is surfing'
  # Frame sampling. Presumably 24 frames are taken starting at index 0 with a
  # stride of 2 — TODO confirm against the dataset loader.
  sample_start_idx: 0
  sample_frame_rate: 2
  n_sample_frames: 24
  # Same width/height values as validation_data.
  width: 512
  height: 512
# Settings for the validation samples.
validation_data:
  # Korean prompts. The previous values were mojibake (UTF-8 bytes that had
  # been decoded with a single-byte code page); they are restored here and
  # quoted so they always load as strings. Save this file as UTF-8.
  prompts:
  # "Mickey Mouse is surfing"
  - '미키마우스가 서핑을 타고 있습니다'
  # "A woman is surfing"
  - '한 여자가 서핑을 타고 있습니다'
  # "A man wearing white clothes is walking on the sea"
  - '흰색 옷을 입은 남자가 바다를 걷고 있습니다'
  # video_length equals train_data.n_sample_frames (24); width/height equal
  # the train_data values (512).
  video_length: 24
  width: 512
  height: 512
  num_inference_steps: 20
  guidance_scale: 12.5
  # NOTE(review): presumably enables starting validation sampling from
  # inverted latents computed with num_inv_steps steps — confirm in the
  # training script.
  use_inv_latent: true
  num_inv_steps: 50
# Step counts.
# NOTE(review): checkpointing_steps (1000) is larger than max_train_steps
# (400). If checkpoints are only written every checkpointing_steps steps, none
# would be written mid-run — confirm this is intended.
max_train_steps: 400
validation_steps: 100
checkpointing_steps: 1000
resume_from_checkpoint: null

# Module-name entries selecting what is trained. Presumably matched against
# model submodule names — TODO confirm in the training script.
trainable_modules:
- 'attn1.to_q'
- 'attn2.to_q'
- 'attn_temp'

# Batching.
train_batch_size: 1
gradient_accumulation_steps: 1

# Learning rate and optimizer settings. The exponent literals are kept in
# their "digit.digit e sign" form so YAML 1.1 loaders still read them as floats.
learning_rate: 3.0e-05
scale_lr: false
lr_scheduler: 'constant'
lr_warmup_steps: 0
adam_beta1: 0.9
adam_beta2: 0.999
adam_weight_decay: 0.01
adam_epsilon: 1.0e-08
max_grad_norm: 1.0
use_8bit_adam: false

# Precision and memory-related switches.
mixed_precision: 'fp16'
gradient_checkpointing: true
enable_xformers_memory_efficient_attention: true

# Random seed.
seed: 33