DenseLabelDev / vlm /datasets /evaluation /vqav2_llava_eval_dataset.py

Upload folder using huggingface_hub

032e687 verified 7 months ago

4.01 kB

	import os
	import os.path as osp
	import json
	from mmengine.dist import master_only
	from .base_eval_dataset import BaseEvalDataset

	from xtuner.registry import BUILDER
	from .m4c_evaluator import EvalAIAnswerProcessor
	from .utils import custom_data_process


	class VQAv2Dataset(BaseEvalDataset):
	    """Evaluation dataset built from a JSON-lines question file.

	    Each line of ``question_file`` is parsed as one JSON object from which
	    the keys ``question_id``, ``image``, ``text`` and ``category`` are read.
	    :meth:`evaluate` writes the raw predictions to ``answer_file`` and a
	    list of ``{'question_id', 'answer'}`` records, normalised with
	    ``EvalAIAnswerProcessor``, to ``prediction_file``; it computes no score.
	    """

	    # NOTE(review): the registered name is 'gqa' although this class is
	    # VQAv2Dataset. It looks like a copy-paste leftover, but downstream
	    # code may key on it, so it is kept as-is. Confirm before renaming.
	    METAINFO: dict = dict(name='gqa')

	    def __init__(
	        self,
	        question_file,
	        answer_file,
	        test_file,
	        prediction_file,
	        image_folder,
	        image_processor,
	        tier='val',
	        test_question_file=None,
	        pad_image_to_square=True,
	        metainfo=None,
	    ):
	        """Store the configuration and eagerly load the question list.

	        Args:
	            question_file: Path to the JSON-lines question file
	                (``~`` is expanded when the file is read).
	            answer_file: File name, joined onto ``work_dir`` in
	                :meth:`evaluate`, that receives the raw predictions.
	            test_file: Path to a JSON-lines file whose records carry a
	                ``question_id``; it defines which questions are exported.
	            prediction_file: File name, joined onto ``work_dir`` in
	                :meth:`evaluate`, that receives the final JSON list.
	            image_folder: Stored on the instance; presumably consumed by
	                ``custom_data_process`` (verify against that helper).
	            image_processor: Config handed to ``BUILDER.build``.
	            tier: Stored on the instance; not read inside this class.
	            test_question_file: Stored on the instance; not read inside
	                this class.
	            pad_image_to_square: Stored on the instance; presumably
	                consumed by ``custom_data_process`` (verify).
	            metainfo: Forwarded to ``BaseEvalDataset.__init__``.
	        """
	        super().__init__(metainfo)
	        self.image_folder = image_folder
	        self.data_file = question_file
	        self.answer_file = answer_file
	        self.test_file = test_file
	        self.prediction_file = prediction_file
	        self.test_question_file = test_question_file
	        self.tier = tier

	        self.image_processor = BUILDER.build(image_processor)
	        self.pad_image_to_square = pad_image_to_square
	        # Dataset name is the question file's base name without extension.
	        self.name = os.path.splitext(os.path.basename(self.data_file))[0]
	        self.results_xlsx_path = self.name + '-results.xlsx'
	        self.data = self.load_data_list()

	    def load_data_list(self):
	        """Parse the question file into a list of sample dicts.

	        Returns:
	            list[dict]: One dict per question with the keys ``img_id``
	            (position in the returned list), ``index`` (the record's
	            ``question_id``), ``image_path``, ``question`` and
	            ``category``.

	        Raises:
	            KeyError: If a record lacks one of the expected keys.
	            json.JSONDecodeError: If a non-blank line is not valid JSON.
	        """
	        question_path = os.path.expanduser(self.data_file)
	        # The context manager closes the handle deterministically; blank
	        # lines (e.g. a trailing newline at EOF) are skipped, not parsed.
	        with open(question_path, "r", encoding="utf-8") as question_fh:
	            question_data = [
	                json.loads(line) for line in question_fh if line.strip()
	            ]

	        return [
	            {
	                'img_id': idx,
	                'index': sample['question_id'],
	                'image_path': sample['image'],
	                'question': sample['text'],
	                'category': sample['category'],
	            }
	            for idx, sample in enumerate(question_data)
	        ]

	    def __len__(self):
	        """Return the number of loaded questions."""
	        return len(self.data)

	    def __getitem__(self, idx):
	        """Return sample ``idx`` after ``custom_data_process`` is applied."""
	        data = self.data[idx]
	        data_dict = custom_data_process(self, data)
	        return data_dict

	    @master_only
	    def evaluate(self, results, work_dir):
	        """Write predictions to disk in raw and answer-processed form.

	        Args:
	            results: Iterable of dicts, each with ``img_id`` (an index into
	                ``self.data``) and ``prediction`` (the model output).
	            work_dir: Directory that receives ``answer_file`` and
	                ``prediction_file``.

	        Returns:
	            None. The outputs are the two written files.
	        """
	        answers_file = osp.join(work_dir, self.answer_file)
	        dst = osp.join(work_dir, self.prediction_file)

	        # Step 1: dump the raw predictions, one JSON object per line.
	        with open(answers_file, "w", encoding="utf-8") as ans_fh:
	            for pred_dict in results:
	                gt_data = self.data[pred_dict["img_id"]]
	                record = {
	                    "question_id": gt_data['index'],
	                    "prompt": gt_data['question'],
	                    "text": pred_dict['prediction'],
	                    "metadata": {},
	                }
	                ans_fh.write(json.dumps(record) + "\n")

	        # Step 2: read the file back, counting lines that fail to parse.
	        parsed_answers = []
	        error_line = 0
	        with open(answers_file, encoding="utf-8") as ans_fh:
	            for line in ans_fh:
	                try:
	                    parsed_answers.append(json.loads(line))
	                except json.JSONDecodeError:
	                    error_line += 1

	        # Later duplicates of a question_id overwrite earlier ones.
	        predictions = {x['question_id']: x['text'] for x in parsed_answers}

	        with open(self.test_file, encoding="utf-8") as split_fh:
	            test_split = [json.loads(line) for line in split_fh]

	        print(f'total results: {len(predictions)}, total split: {len(test_split)}, error_line: {error_line}')

	        # Step 3: emit one record per question of the split; questions
	        # without a prediction get an empty answer.
	        answer_processor = EvalAIAnswerProcessor()
	        all_answers = []
	        for entry in test_split:
	            question_id = entry['question_id']
	            if question_id in predictions:
	                answer = answer_processor(predictions[question_id])
	            else:
	                answer = ''
	            all_answers.append({
	                'question_id': question_id,
	                'answer': answer,
	            })

	        # Write through the managed handle so the data is flushed and the
	        # file is closed when the block exits.
	        with open(dst, 'w', encoding="utf-8") as out_fh:
	            json.dump(all_answers, out_fh)
	        return None