gim-online

Running

gim-online / third_party /r2d2 /tools /transforms_tools.py

Vincentqyw

fix: roma

8b973ee over 1 year ago

7.11 kB

	# Copyright 2019-present NAVER Corp.
	# CC BY-NC-SA 3.0
	# Available only for non-commercial use

	import pdb
	import numpy as np
	from PIL import Image, ImageOps, ImageEnhance


	class DummyImg:
	"""This class is a dummy image only defined by its size."""

	def __init__(self, size):
	self.size = size

	def resize(self, size, args, *kwargs):
	return DummyImg(size)

	def expand(self, border):
	w, h = self.size
	if isinstance(border, int):
	size = (w + 2 * border, h + 2 * border)
	else:
	l, t, r, b = border
	size = (w + l + r, h + t + b)
	return DummyImg(size)

	def crop(self, border):
	w, h = self.size
	l, t, r, b = border
	assert 0 <= l <= r <= w
	assert 0 <= t <= b <= h
	size = (r - l, b - t)
	return DummyImg(size)

	def rotate(self, angle):
	raise NotImplementedError

	def transform(self, size, args, *kwargs):
	return DummyImg(size)


	def grab_img(img_and_label):
	"""Called to extract the image from an img_and_label input
	(a dictionary). Also compatible with old-style PIL images.
	"""
	if isinstance(img_and_label, dict):
	# if input is a dictionary, then
	# it must contains the img or its size.
	try:
	return img_and_label["img"]
	except KeyError:
	return DummyImg(img_and_label["imsize"])

	else:
	# or it must be the img directly
	return img_and_label


	def update_img_and_labels(img_and_label, img, persp=None):
	"""Called to update the img_and_label"""
	if isinstance(img_and_label, dict):
	img_and_label["img"] = img
	img_and_label["imsize"] = img.size

	if persp:
	if "persp" not in img_and_label:
	img_and_label["persp"] = (1, 0, 0, 0, 1, 0, 0, 0)
	img_and_label["persp"] = persp_mul(persp, img_and_label["persp"])

	return img_and_label

	else:
	# or it must be the img directly
	return img


	def rand_log_uniform(a, b):
	return np.exp(np.random.uniform(np.log(a), np.log(b)))


	def translate(tx, ty):
	return (1, 0, tx, 0, 1, ty, 0, 0)


	def rotate(angle):
	return (np.cos(angle), -np.sin(angle), 0, np.sin(angle), np.cos(angle), 0, 0, 0)


	def persp_mul(mat, mat2):
	"""homography (perspective) multiplication.
	mat: 8-tuple (homography transform)
	mat2: 8-tuple (homography transform) or 2-tuple (point)
	"""
	assert isinstance(mat, tuple)
	assert isinstance(mat2, tuple)

	mat = np.float32(mat + (1,)).reshape(3, 3)
	mat2 = np.array(mat2 + (1,)).reshape(3, 3)
	res = np.dot(mat, mat2)
	return tuple((res / res[2, 2]).ravel()[:8])


	def persp_apply(mat, pts):
	"""homography (perspective) transformation.
	mat: 8-tuple (homography transform)
	pts: numpy array
	"""
	assert isinstance(mat, tuple)
	assert isinstance(pts, np.ndarray)
	assert pts.shape[-1] == 2
	mat = np.float32(mat + (1,)).reshape(3, 3)

	if pts.ndim == 1:
	pt = np.dot(pts, mat[:, :2].T).ravel() + mat[:, 2]
	pt /= pt[2] # homogeneous coordinates
	return tuple(pt[:2])
	else:
	pt = np.dot(pts, mat[:, :2].T) + mat[:, 2]
	pt[:, :2] /= pt[:, 2:3] # homogeneous coordinates
	return pt[:, :2]


	def is_pil_image(img):
	return isinstance(img, Image.Image)


	def adjust_brightness(img, brightness_factor):
	"""Adjust brightness of an Image.
	Args:
	img (PIL Image): PIL Image to be adjusted.
	brightness_factor (float): How much to adjust the brightness. Can be
	any non negative number. 0 gives a black image, 1 gives the
	original image while 2 increases the brightness by a factor of 2.
	Returns:
	PIL Image: Brightness adjusted image.
	Copied from https://github.com/pytorch in torchvision/transforms/functional.py
	"""
	if not is_pil_image(img):
	raise TypeError("img should be PIL Image. Got {}".format(type(img)))

	enhancer = ImageEnhance.Brightness(img)
	img = enhancer.enhance(brightness_factor)
	return img


	def adjust_contrast(img, contrast_factor):
	"""Adjust contrast of an Image.
	Args:
	img (PIL Image): PIL Image to be adjusted.
	contrast_factor (float): How much to adjust the contrast. Can be any
	non negative number. 0 gives a solid gray image, 1 gives the
	original image while 2 increases the contrast by a factor of 2.
	Returns:
	PIL Image: Contrast adjusted image.
	Copied from https://github.com/pytorch in torchvision/transforms/functional.py
	"""
	if not is_pil_image(img):
	raise TypeError("img should be PIL Image. Got {}".format(type(img)))

	enhancer = ImageEnhance.Contrast(img)
	img = enhancer.enhance(contrast_factor)
	return img


	def adjust_saturation(img, saturation_factor):
	"""Adjust color saturation of an image.
	Args:
	img (PIL Image): PIL Image to be adjusted.
	saturation_factor (float): How much to adjust the saturation. 0 will
	give a black and white image, 1 will give the original image while
	2 will enhance the saturation by a factor of 2.
	Returns:
	PIL Image: Saturation adjusted image.
	Copied from https://github.com/pytorch in torchvision/transforms/functional.py
	"""
	if not is_pil_image(img):
	raise TypeError("img should be PIL Image. Got {}".format(type(img)))

	enhancer = ImageEnhance.Color(img)
	img = enhancer.enhance(saturation_factor)
	return img


	def adjust_hue(img, hue_factor):
	"""Adjust hue of an image.
	The image hue is adjusted by converting the image to HSV and
	cyclically shifting the intensities in the hue channel (H).
	The image is then converted back to original image mode.
	`hue_factor` is the amount of shift in H channel and must be in the
	interval `[-0.5, 0.5]`.
	See https://en.wikipedia.org/wiki/Hue for more details on Hue.
	Args:
	img (PIL Image): PIL Image to be adjusted.
	hue_factor (float): How much to shift the hue channel. Should be in
	[-0.5, 0.5]. 0.5 and -0.5 give complete reversal of hue channel in
	HSV space in positive and negative direction respectively.
	0 means no shift. Therefore, both -0.5 and 0.5 will give an image
	with complementary colors while 0 gives the original image.
	Returns:
	PIL Image: Hue adjusted image.
	Copied from https://github.com/pytorch in torchvision/transforms/functional.py
	"""
	if not (-0.5 <= hue_factor <= 0.5):
	raise ValueError("hue_factor is not in [-0.5, 0.5].".format(hue_factor))

	if not is_pil_image(img):
	raise TypeError("img should be PIL Image. Got {}".format(type(img)))

	input_mode = img.mode
	if input_mode in {"L", "1", "I", "F"}:
	return img

	h, s, v = img.convert("HSV").split()

	np_h = np.array(h, dtype=np.uint8)
	# uint8 addition take cares of rotation across boundaries
	with np.errstate(over="ignore"):
	np_h += np.uint8(hue_factor * 255)
	h = Image.fromarray(np_h, "L")

	img = Image.merge("HSV", (h, s, v)).convert(input_mode)
	return img