# File: FAPM_demo/lavis/configs/models/gpt_dialogue_base.yaml
# Hugging Face file-viewer metadata: commit a43ef32 ("Upload 560 files"), 916 Bytes
# Copyright (c) 2022, salesforce.com, inc.
# All rights reserved.
# SPDX-License-Identifier: BSD-3-Clause
# For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause
# Model settings for the `gpt_dialogue` architecture.
model:
  # Architecture identifier (presumably looked up in the model registry by
  # the consuming framework; verify against the loader).
  arch: gpt_dialogue
  # Commented-out BLIP checkpoint URLs, kept for reference; no `pretrained`
  # key is active in this config.
  # pretrained: "https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_caption_capfilt_large.pth"
  # pretrained: "https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_capfilt_large.pth"

  # Tokenizer vocabulary size.
  len_tokenizer: 50264  # 50257 tokens from gpt2 default tokenizer + additional special tokens

  # Video feature length: 2048 + 2048 + 128 = 4224.
  len_video_ft: 4224  # i3d_rgb: 2048 i3d_flow: 2048 vggish: 128

# Processor names for visual and text inputs, one entry per split.
# NOTE(review): nesting was reconstructed from key order after the original
# indentation was lost; confirm `preprocess` belongs at the top level.
preprocess:
  vis_processor:
    train:
      name: "gpt_video_ft"
    eval:
      name: "gpt_video_ft"
  text_processor:
    train:
      name: "gpt_dialogue"
    eval:
      name: "gpt_dialogue"