# Training configuration: BLIP-2 (arch: blip2) on the COCO retrieval task.

# Model selection and weight-loading flags.
model:
  arch: blip2
  model_type: coco
  # Start from pretrained weights, not from an already fine-tuned checkpoint.
  load_pretrained: true
  load_finetuned: false
  # NOTE(review): presumably leaves the ViT image encoder trainable --
  # confirm against the model loader.
  freeze_vit: false

# Dataset section; this file configures a single dataset, coco_retrieval.
datasets:
  coco_retrieval:
    # Visual processor, configured separately for the train and eval splits.
    # NOTE(review): train uses a "blip2_*" processor while eval uses a
    # "blip_*" one -- looks intentional, confirm against the registered
    # processor names.
    vis_processor:
      train:
        name: "blip2_image_train"
        image_size: 364
      eval:
        name: "blip_image_eval"
        image_size: 364
    # Text processor; both splits use the same processor name.
    text_processor:
      train:
        name: "blip_caption"
      eval:
        name: "blip_caption"
    build_info:
      images:
        # Absolute, machine-specific path; adjust to the local image directory.
        storage: '/export/share/datasets/vision/coco/images/'

# Run-level settings: task, optimisation, output, evaluation and device setup.
run:
  task: retrieval

  # Learning-rate schedule and optimisation hyper-parameters.
  lr_sched: "linear_warmup_cosine_lr"
  # Exponent-form floats carry an explicit ".0" so that YAML 1.1 loaders
  # (e.g. stock PyYAML) resolve them as floats rather than as strings.
  init_lr: 1.0e-5
  min_lr: 0
  warmup_lr: 1.0e-8
  warmup_steps: 1000
  weight_decay: 0.05
  max_epoch: 5
  batch_size_train: 14
  batch_size_eval: 16
  lr_layer_decay: 0.95
  num_workers: 4
  accum_grad_iters: 1

  seed: 42
  output_dir: "output/BLIP2/Retrieval_coco"

  amp: true
  resume_ckpt_path: null

  # evaluate: false together with train_splits selects a training run.
  # NOTE(review): validation uses the "test" split and no test_splits key is
  # visible here -- confirm this is intended.
  evaluate: false
  train_splits: ["train"]
  valid_splits: ["test"]

  k_test: 128

  # Device and distributed-run settings.
  device: "cuda"
  world_size: 1
  dist_url: "env://"
  distributed: true
  use_dist_eval_sampler: false