# Copyright (c) 2022, salesforce.com, inc.
# All rights reserved.
# SPDX-License-Identifier: BSD-3-Clause
# For full license text, see the LICENSE file in the repo root or
# https://opensource.org/licenses/BSD-3-Clause

# Model settings for the "gpt_dialogue" architecture.
model:
  arch: gpt_dialogue

  # Disabled checkpoint URLs, kept for reference.
  # NOTE(review): both paths sit under BLIP/models; confirm they apply to this
  # architecture before re-enabling either one.
  # pretrained: "https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_caption_capfilt_large.pth"
  # pretrained: "https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_capfilt_large.pth"

  # 50257 tokens from the default gpt2 tokenizer + additional special tokens.
  len_tokenizer: 50264

  # 4224 = 2048 (i3d_rgb) + 2048 (i3d_flow) + 128 (vggish).
  len_video_ft: 4224

# Processor selection, listed separately for the train and eval entries.
# NOTE(review): the names are presumably identifiers resolved by the consuming
# framework; confirm they match the registered processors.
preprocess:
  vis_processor:
    train:
      name: "gpt_video_ft"
    eval:
      name: "gpt_video_ft"
  text_processor:
    train:
      name: "gpt_dialogue"
    eval:
      name: "gpt_dialogue"