File size: 891 Bytes
9d0a4ae
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
import pdb
import sys
import json
import torch
import numpy as np
from run_on_video.data_utils import ClipFeatureExtractor
import torch.nn.functional as F
import tqdm
import os

# Extract CLIP text features for every query of one dataset split and store
# each query's features in its own .npz file named after the query id.
dataset = 'charades'
split = 'test'

# Directory that receives the .npz files. An empty string means the current
# working directory; set this to the desired feature folder before running.
save_dir = ''

query_list = []
qid_list = []

# The metadata file is read as JSON Lines: one JSON object per line, each
# providing a 'query' and a 'qid' entry.
with open(f"data/{dataset}/metadata/{dataset}_{split}.jsonl", 'r', encoding='utf-8') as f:
    for line in f:
        if not line.strip():
            # Tolerate blank lines (e.g. a trailing newline at end of file)
            # instead of crashing inside json.loads.
            continue
        js = json.loads(line)
        query_list.append(js['query'])
        # qids are stringified because they are used as file names below.
        qid_list.append(str(js['qid']))

# Create the output directory up front so a bad path fails before the
# (expensive) model load and text encoding.
if save_dir:
    os.makedirs(save_dir, exist_ok=True)

# clip
feature_extractor = ClipFeatureExtractor(
    framerate=1 / 2, size=224, centercrop=True,
    model_name_or_path="ViT-B/32", device='cuda'
)
# NOTE(review): assumes encode_text returns one tensor-like entry per input
# query, in input order — confirm against ClipFeatureExtractor.
query_feats = feature_extractor.encode_text(query_list)

for qid, feat in tqdm.tqdm(zip(qid_list, query_feats), total=len(query_feats)):
    # np.savez appends the '.npz' suffix itself; os.path.join keeps an empty
    # save_dir from turning the target into a path under the filesystem root.
    np.savez(os.path.join(save_dir, qid), last_hidden_state=feat.cpu().numpy())