---
# General runtime settings.
# NOTE(review): the consumer of these keys is not visible in this file; the
# per-key notes below are inferred from the key names — confirm against the code.

# Run mode; set to `sample` here.
mode: sample
# GPU indices to use (a list, even for a single device).
gpu_ids: [3]
batch_size: 1
num_workers: 4
# NOTE(review): -1 presumably means "no explicit limit" — confirm.
num_cpu_cores: -1
seed: 0
# Machine-specific absolute path; adjust per environment.
ckpt_dir: /root/lihui/StoryVisualization/save_ckpt_epoch5_new
run_name: ARLDM
# Task selection.
# `dataset` matches the name of one of the per-dataset sections in this file
# (pororo, flintstones, vistsis, vistdii).
dataset: pororo
task: visualization
# Training settings.
# Written with an explicit mantissa dot so that YAML 1.1 loaders (e.g. PyYAML),
# which require the dot to recognise a float, do not read it as a string.
init_lr: 1.0e-5
warmup_epochs: 1
max_epochs: 5
# NOTE(review): presumably the checkpoint to resume training from — confirm.
# Machine-specific absolute path; adjust per environment.
train_model_file: /root/lihui/StoryVisualization/save_ckpt_3last50/ARLDM/last.ckpt
# Canonical lowercase booleans (same value as `True`, unambiguous across loaders).
freeze_clip: true
freeze_blip: true
freeze_resnet: true
# Sampling / evaluation settings.
# Machine-specific absolute path; adjust per environment.
test_model_file: /root/lihui/StoryVisualization/save_ckpt_3last50/ARLDM/last.ckpt
# Canonical lowercase boolean (same value as `True`).
calculate_fid: true
scheduler: ddim
guidance_scale: 6
num_inference_steps: 250
# Machine-specific absolute path; adjust per environment.
sample_output_dir: /root/lihui/StoryVisualization/save_samples_128_epoch50
# Per-dataset settings: pororo.
# The keys below belong to this section; they must be indented under it,
# otherwise they collide with the same keys of the other dataset sections.
pororo:
  # Machine-specific absolute path; adjust per environment.
  hdf5_file: /root/lihui/StoryVisualization/pororo.h5
  max_length: 85
  new_tokens: ["pororo", "loopy", "eddy", "harry", "poby", "tongtong", "crong", "rody", "petty"]
  clip_embedding_tokens: 49416
  blip_embedding_tokens: 30530
# Per-dataset settings: flintstones.
# The keys below belong to this section; they must be indented under it,
# otherwise they collide with the same keys of the other dataset sections.
flintstones:
  # Placeholder path — replace with the real location of the HDF5 file.
  hdf5_file: /path/to/flintstones.h5
  max_length: 91
  new_tokens: ["fred", "barney", "wilma", "betty", "pebbles", "dino", "slate"]
  clip_embedding_tokens: 49412
  blip_embedding_tokens: 30525
# Per-dataset settings: vistsis.
# The keys below belong to this section; they must be indented under it,
# otherwise they collide with the same keys of the other dataset sections.
# No `new_tokens` entry is defined for this dataset.
vistsis:
  # Placeholder path — replace with the real location of the HDF5 file.
  hdf5_file: /path/to/vist.h5
  max_length: 100
  clip_embedding_tokens: 49408
  blip_embedding_tokens: 30524
# Per-dataset settings: vistdii.
# The keys below belong to this section; they must be indented under it,
# otherwise they collide with the same keys of the other dataset sections.
# No `new_tokens` entry is defined for this dataset.
vistdii:
  # Placeholder path — replace with the real location of the HDF5 file.
  hdf5_file: /path/to/vist.h5
  max_length: 65
  clip_embedding_tokens: 49408
  blip_embedding_tokens: 30524
# Hydra framework settings.
hydra:
  run:
    # Use the current directory as the run directory.
    dir: .
  # null disables the per-run Hydra config sub-directory.
  output_subdir: null
# NOTE(review): kept as top-level keys, as the `hydra/` prefix suggests.
# Hydra's documented way to disable its logging is through the defaults list
# (`override hydra/job_logging: disabled`) — confirm these keys take effect.
hydra/job_logging: disabled
hydra/hydra_logging: disabled