# Copyright (c) 2022, salesforce.com, inc. # All rights reserved. # SPDX-License-Identifier: BSD-3-Clause # For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause model: arch: clip model_type: ViT-L-14-336 datasets: flickr30k: # name of the dataset builder vis_processor: train: name: "clip_image_train" image_size: 336 eval: name: "clip_image_eval" image_size: 336 text_processor: train: name: "blip_caption" eval: name: "blip_caption" run: task: retrieval # dataloading num_workers: 4 batch_size_train: 32 batch_size_eval: 128 test_splits: ["test"] # distribution device: "cuda" world_size: 1 dist_url: "env://" distributed: True use_dist_eval_sampler: True # misc seed: 42 output_dir: "output/clip/Retrieval_Flickr" evaluate: True