Spaces:
Build error
Build error
File size: 783 Bytes
910e2ad |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 |
#!/bin/bash
# This script is used for batch extract the vae latents for video generation training
# Since the video latent extract is very slow, pre-extract the video vae latents will save the training time
GPUS=8 # The gpu number
MODEL_NAME=pyramid_flux # The model name, `pyramid_flux` or `pyramid_mmdit`
VAE_MODEL_PATH=/PATH/pyramid-flow-miniflux/causal_video_vae # The VAE CKPT dir.
ANNO_FILE=annotation/video_text.jsonl # The video annotation file path
WIDTH=640
HEIGHT=384
NUM_FRAMES=121
torchrun --nproc_per_node $GPUS \
tools/extract_video_vae_latents.py \
--batch_size 1 \
--model_dtype bf16 \
--model_path $VAE_MODEL_PATH \
--anno_file $ANNO_FILE \
--width $WIDTH \
--height $HEIGHT \
--num_frames $NUM_FRAMES |