---
# Fine-tuning configuration: pretrained model location, one training video
# with its caption, validation prompts, and optimizer/runtime settings.
#
# NOTE(review): this file was restored from a copy whose newlines and
# indentation had been collapsed onto a single line. The nesting below is
# reconstructed from the key names (two width/height pairs imply two nested
# mappings) -- confirm it against the consuming training script.

# Path to the pretrained model weights and the directory for run outputs.
pretrained_model_path: "/data/stable-diffusion/stable-diffusion-v1-5"
output_dir: "./outputs/man-motor"

# Training clip and the text prompt paired with it.
train_data:
  video_path: "./data/motorbike"
  prompt: "a man is driving a motorbike in the forest"
  n_sample_frames: 8
  width: 512
  height: 512
  sample_start_idx: 0
  sample_frame_rate: 1

# Prompts and sampling settings used for validation.
validation_data:
  prompts:
    - "a Spider-Man is driving a motorbike in the forest"
  # Same value as train_data.n_sample_frames (8).
  video_length: 8
  width: 512
  height: 512
  num_inference_steps: 50
  guidance_scale: 12.5
  use_inv_latent: true
  num_inv_steps: 50

# Optimization schedule.
# Written with an explicit ".0": YAML 1.1 loaders (e.g. PyYAML) only resolve
# exponent notation as a float when the mantissa contains a dot, so a bare
# "3e-5" would be loaded as a string by those parsers.
learning_rate: 3.0e-5
train_batch_size: 1
max_train_steps: 500
# NOTE(review): checkpointing_steps (1000) is larger than max_train_steps
# (500). If checkpoints are only written every checkpointing_steps, no
# intermediate checkpoint will be produced -- confirm this is intended.
checkpointing_steps: 1000
# Equal to max_train_steps, so presumably validation runs once, at the final
# step -- verify against the training loop.
validation_steps: 500
# Module-name patterns selected for training; presumably matched against
# parameter/module names by the trainer -- TODO confirm.
trainable_modules:
  - "attn1.to_q"
  - "attn2.to_q"
  - "attn_temp"

# Reproducibility and runtime/memory options.
seed: 33
mixed_precision: fp16
use_8bit_adam: false
gradient_checkpointing: true
enable_xformers_memory_efficient_attention: true