Spaces:

Realcat
/

image-matching-webui

Running

image-matching-webui / third_party /lanet /datasets /hp_loader.py

Vincentqyw

fix: roma

c74a070 over 1 year ago

4.21 kB

	import torch
	import cv2
	import numpy as np

	from torchvision import transforms
	from torch.utils.data import Dataset
	from pathlib import Path


	class PatchesDataset(Dataset):
	    """
	    HPatches dataset of (reference image, warped image, homography) triplets.

	    Every sequence folder under ``root_dir`` contributes five samples: the
	    reference image ``1.ppm`` paired with each of ``2.ppm`` .. ``6.ppm`` and
	    the matching homography file ``H_1_<i>``.

	    # Note: output_shape = (output_width, output_height)
	    # Note: this returns Pytorch tensors, resized to output_shape (if specified)
	    # Note: the homography will be adjusted according to output_shape.

	    Parameters
	    ----------
	    root_dir : str
	        Path to the dataset. Each sub-directory is treated as one sequence.
	    use_color : bool
	        Return color images (as loaded by OpenCV) or convert to grayscale.
	    data_transform : Function
	        Stored on the instance as ``self.data_transform``; this class does
	        not apply it itself.
	    output_shape: tuple
	        If specified, the images and homographies will be resized to the
	        desired shape.
	    type: str
	        Dataset subset to return from ['i', 'v', 'all']:
	        i - illumination sequences
	        v - viewpoint sequences
	        all - all sequences
	        Any value other than 'i' or 'v' selects all sequences.
	    """

	    def __init__(
	        self,
	        root_dir,
	        use_color=True,
	        data_transform=None,
	        output_shape=None,
	        type="all",
	    ):
	        super().__init__()
	        self.type = type
	        self.root_dir = root_dir
	        self.data_transform = data_transform
	        self.output_shape = output_shape
	        self.use_color = use_color

	        # iterdir() yields entries in arbitrary order; sort so that a given
	        # index always refers to the same sample on every machine and run.
	        folder_paths = sorted(p for p in Path(root_dir).iterdir() if p.is_dir())

	        num_images = 5
	        file_ext = ".ppm"
	        image_paths = []
	        warped_image_paths = []
	        homographies = []
	        for path in folder_paths:
	            # Sequence folders are told apart by the first letter of their name.
	            if self.type == "i" and path.stem[0] != "i":
	                continue
	            if self.type == "v" and path.stem[0] != "v":
	                continue
	            for i in range(2, 2 + num_images):
	                image_paths.append(str(Path(path, "1" + file_ext)))
	                warped_image_paths.append(str(Path(path, str(i) + file_ext)))
	                homographies.append(np.loadtxt(str(Path(path, "H_1_" + str(i)))))
	        self.files = {
	            "image_paths": image_paths,
	            "warped_image_paths": warped_image_paths,
	            "homography": homographies,
	        }

	    def scale_homography(self, homography, original_scale, new_scale, pre):
	        """
	        Adjust a homography for a per-axis rescaling of one of its images.

	        Parameters
	        ----------
	        homography : array-like
	            Matrix to adjust; multiplied with a 3x3 diagonal scaling matrix.
	        original_scale : sequence of 2 numbers
	            Size before resizing.
	        new_scale : sequence of 2 numbers
	            Size after resizing, in the same axis order as ``original_scale``.
	        pre : bool
	            If True, left-multiply by ``diag(sx, sy, 1)``; otherwise
	            right-multiply by ``diag(1/sx, 1/sy, 1)``, where
	            ``(sx, sy) = new_scale / original_scale``.

	        Returns
	        -------
	        numpy.ndarray
	            The adjusted homography.
	        """
	        scales = np.divide(new_scale, original_scale)
	        if pre:
	            s = np.diag(np.append(scales, 1.0))
	            return np.matmul(s, homography)
	        sinv = np.diag(np.append(1.0 / scales, 1.0))
	        return np.matmul(homography, sinv)

	    def __len__(self):
	        """Return the number of (image, warped image, homography) samples."""
	        return len(self.files["image_paths"])

	    def __getitem__(self, idx):
	        """
	        Load sample ``idx``.

	        Returns
	        -------
	        dict
	            ``image`` and ``warped_image`` as float tensors produced by
	            ``transforms.ToTensor``, ``homography`` as a numpy array (rescaled
	            when ``output_shape`` is set) and ``index`` holding ``idx``.

	        Raises
	        ------
	        OSError
	            If an image file cannot be read by OpenCV.
	        """

	        def _read_image(path):
	            img = cv2.imread(path, cv2.IMREAD_COLOR)
	            if img is None:
	                # cv2.imread signals failure by returning None; fail here with
	                # the offending path instead of an unrelated error later on.
	                raise OSError("Failed to read image: {}".format(path))
	            if self.use_color:
	                return img
	            return cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

	        sample = {
	            "image": _read_image(self.files["image_paths"][idx]),
	            "warped_image": _read_image(self.files["warped_image_paths"][idx]),
	            "homography": np.array(self.files["homography"][idx]),
	            "index": idx,
	        }

	        # Apply transformations
	        if self.output_shape is not None:
	            # shape[:2][::-1] turns (height, width) into (width, height) so it
	            # matches the axis order of output_shape.
	            sample["homography"] = self.scale_homography(
	                sample["homography"],
	                sample["image"].shape[:2][::-1],
	                self.output_shape,
	                pre=False,
	            )
	            sample["homography"] = self.scale_homography(
	                sample["homography"],
	                sample["warped_image"].shape[:2][::-1],
	                self.output_shape,
	                pre=True,
	            )

	            for key in ["image", "warped_image"]:
	                sample[key] = cv2.resize(sample[key], self.output_shape)
	                if not self.use_color:
	                    # Give grayscale images an explicit trailing channel axis.
	                    sample[key] = np.expand_dims(sample[key], axis=2)

	        transform = transforms.ToTensor()

	        for key in ["image", "warped_image"]:
	            sample[key] = transform(sample[key]).type("torch.FloatTensor")
	        return sample