Koala-video-llm / global_local /datasets /builders /video_caption_builder.py
Reuben Tan
initial commit
b2afdba
raw history blame
No virus
996 Bytes
import os
import logging
import warnings
from global_local.common.registry import registry
from global_local.datasets.builders.base_dataset_builder import BaseDatasetBuilder
from global_local.datasets.datasets.webvid_datasets import WebvidDataset
@registry.register_builder("webvid")
class WebvidBuilder(BaseDatasetBuilder):
    """Dataset builder registered under the name "webvid".

    Only a "train" split is produced; it is an instance of
    ``train_dataset_cls`` constructed from the video and annotation
    locations found in ``self.config.build_info``.
    """

    # Dataset class instantiated for the "train" split.
    train_dataset_cls = WebvidDataset

    # Maps a configuration name to the path of its YAML defaults file.
    DATASET_CONFIG_DICT = {"default": "configs/datasets/webvid/defaults.yaml"}

    def _download_ann(self):
        """Do nothing.

        NOTE(review): presumably a download hook expected by the base
        builder; annotations appear to be supplied locally -- confirm.
        """

    def _download_vis(self):
        """Do nothing.

        NOTE(review): presumably a download hook expected by the base
        builder; videos appear to be supplied locally -- confirm.
        """

    def build(self):
        """Create the training dataset and return it keyed by split name.

        Calls ``self.build_processors()`` first, then reads ``videos_dir``
        and ``anno_dir`` from ``self.config.build_info`` and passes them,
        together with the "train" visual and text processors, to
        ``train_dataset_cls``.

        Returns:
            dict: A single-entry mapping ``{"train": <dataset instance>}``.
        """
        self.build_processors()

        split_name = "train"
        info = self.config.build_info

        train_set = self.train_dataset_cls(
            vis_processor=self.vis_processors[split_name],
            text_processor=self.text_processors[split_name],
            vis_root=info.videos_dir,
            ann_root=info.anno_dir,
        )
        return {split_name: train_set}