# high_fidelity_video_background_music_generation_with_transformers/models_peft/nature_large/configuration.yml
# Training configuration for the "nature_large" run.
# NOTE(review): the code that consumes these keys is not visible here; comments
# describing intent are inferred from key names and should be confirmed.

# --- General run settings ---
log_level: INFO
num_epochs: 20
batch_size: 2
# presumably a checkpoint interval measured in training steps — TODO confirm
save_step: 1720
device: cuda

# --- Weights & Biases tracking ---
use_wandb: true
wandb_project_name: thesis_peft

# --- Optimization ---
gradient_clipping: 1.0
# beta1/beta2 look like Adam-style optimizer coefficients — verify against the trainer
beta1: 0.9
beta2: 0.95
weight_decay: 0.1
learning_rate: 1.0e-05
warmup_steps: 16

# --- Video feature extraction ---
# presumably frames per second sampled from each video — TODO confirm
video_extraction_framerate: 1

# --- Video encoder ---
encoder_input_dimension: 2048
encoder_dim_feedforward: 32768
encoder_heads: 64
encoder_layers: 24

# --- MusicGen backbone ---
musicgen_model_id: facebook/musicgen-stereo-large
use_peft: true

# --- Output and dataset ---
output_dir_name: nature_large
# Relative paths; the base directory they resolve against is not shown here.
dataset_video_folder: ../../datasets/nature2/videos_30sec
dataset_audio_folder: ../../datasets/nature2/audio_30sec
use_demucs_folder_structure: false
# presumably the fraction of samples held out for validation — TODO confirm
dataset_validation_split: 0.1
dataset_shuffling_seed: 42