Spaces:

Yuxihenry
/

SpatialTracker2

Running on Zero

SpatialTracker2 / models /moge /utils /io.py

xiaoyuxi

gradio_app

a51c6d2 5 days ago

8.07 kB

	import os
	os.environ['OPENCV_IO_ENABLE_OPENEXR'] = '1'
	from typing import IO
	import zipfile
	import json
	import io
	from typing import *
	from pathlib import Path
	import re
	from PIL import Image, PngImagePlugin

	import numpy as np
	import cv2

	from .tools import timeit


	def save_glb(
	    save_path: Union[str, os.PathLike],
	    vertices: np.ndarray,
	    faces: np.ndarray,
	    vertex_uvs: np.ndarray,
	    texture: np.ndarray,
	    vertex_normals: Optional[np.ndarray] = None,
	):
	    """
	    Build a UV-textured mesh with trimesh and export it to `save_path`.

	    ### Parameters:
	    - `save_path: Union[str, os.PathLike]`
	        Destination handed to `Trimesh.export`.
	    - `vertices: np.ndarray`, `faces: np.ndarray`
	        Mesh geometry, forwarded to `trimesh.Trimesh` unchanged.
	    - `vertex_uvs: np.ndarray`
	        UV coordinates given to the texture visual as `uv`.
	    - `texture: np.ndarray`
	        Image array; converted with `PIL.Image.fromarray` and used as the base color texture.
	    - `vertex_normals: Optional[np.ndarray] = None`
	        Optional normals forwarded to `trimesh.Trimesh`.
	    """
	    import trimesh
	    import trimesh.visual
	    from PIL import Image

	    # The material factors are fixed; only the base color texture comes from the caller.
	    base_color = Image.fromarray(texture)
	    material = trimesh.visual.material.PBRMaterial(
	        baseColorTexture=base_color,
	        metallicFactor=0.5,
	        roughnessFactor=1.0,
	    )
	    textured_visual = trimesh.visual.texture.TextureVisuals(
	        uv=vertex_uvs,
	        material=material,
	    )
	    mesh = trimesh.Trimesh(
	        vertices=vertices,
	        vertex_normals=vertex_normals,
	        faces=faces,
	        visual=textured_visual,
	        process=False,
	    )
	    mesh.export(save_path)


	def save_ply(
	    save_path: Union[str, os.PathLike],
	    vertices: np.ndarray,
	    faces: np.ndarray,
	    vertex_colors: np.ndarray,
	    vertex_normals: Optional[np.ndarray] = None,
	):
	    """
	    Build a vertex-colored mesh with trimesh and export it to `save_path`.

	    ### Parameters:
	    - `save_path: Union[str, os.PathLike]`
	        Destination handed to `Trimesh.export`.
	    - `vertices: np.ndarray`, `faces: np.ndarray`
	        Mesh geometry, forwarded to `trimesh.Trimesh` unchanged.
	    - `vertex_colors: np.ndarray`
	        Colors forwarded to `trimesh.Trimesh` as `vertex_colors`.
	    - `vertex_normals: Optional[np.ndarray] = None`
	        Optional normals forwarded to `trimesh.Trimesh`.
	    """
	    # Only the top-level trimesh package is used here; the texture/PIL
	    # imports needed by the textured exporter are not required.
	    import trimesh

	    mesh = trimesh.Trimesh(
	        vertices=vertices,
	        faces=faces,
	        vertex_colors=vertex_colors,
	        vertex_normals=vertex_normals,
	        process=False,
	    )
	    mesh.export(save_path)


	def read_image(path: Union[str, os.PathLike, IO]) -> np.ndarray:
	    """
	    Load an image from a path or a readable binary file object.

	    The bytes are decoded with OpenCV in color mode and the channel order is
	    converted from BGR to RGB, giving a uint8 RGB array of shape (H, W, 3).
	    """
	    from_filesystem = isinstance(path, (str, os.PathLike))
	    raw = Path(path).read_bytes() if from_filesystem else path.read()
	    encoded = np.frombuffer(raw, np.uint8)
	    bgr = cv2.imdecode(encoded, cv2.IMREAD_COLOR)
	    return cv2.cvtColor(bgr, cv2.COLOR_BGR2RGB)


	def write_image(path: Union[str, os.PathLike, IO], image: np.ndarray, quality: int = 95):
	    """
	    JPEG-encode a uint8 RGB array of shape (H, W, 3) and write the bytes out.

	    `path` may be a filesystem path or a writable binary file object. The
	    encoding is always JPEG (whatever the path's extension), using `quality`
	    as the JPEG quality setting.
	    """
	    bgr = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
	    encode_params = [cv2.IMWRITE_JPEG_QUALITY, quality]
	    _, encoded = cv2.imencode('.jpg', bgr, encode_params)
	    payload = encoded.tobytes()
	    if not isinstance(path, (str, os.PathLike)):
	        path.write(payload)
	        return
	    Path(path).write_bytes(payload)


	def read_depth(path: Union[str, os.PathLike, IO]) -> Tuple[np.ndarray, float]:
	    """
	    Read a log-encoded 16-bit depth PNG and decode it to float depth.

	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or file object to read from.
	    ### Returns:
	    A tuple `(depth, unit)`:
	    - `depth`: float array of shape (H, W). Code 0 decodes to `NaN`, code 65535
	      to `Inf`; codes in between are interpolated geometrically between the
	      `near` and `far` text fields stored in the PNG.
	    - `unit`: the `unit` text field as a float, or `None` when the field is absent.
	    """
	    if isinstance(path, (str, os.PathLike)):
	        raw = Path(path).read_bytes()
	    else:
	        raw = path.read()
	    png = Image.open(io.BytesIO(raw))

	    # Range metadata lives in PNG text fields; `near` and `far` are required.
	    info = png.info
	    near = float(info.get('near'))
	    far = float(info.get('far'))
	    unit = None
	    if 'unit' in info:
	        unit = float(info.get('unit'))

	    codes = np.array(png)
	    is_unknown = codes == 0
	    is_infinite = codes == 65535
	    # Map codes 1..65534 onto [0, 1], then interpolate in log space.
	    t = (codes.astype(np.float32) - 1) / 65533
	    depth = near ** (1 - t) * far ** t
	    depth[is_unknown] = np.nan
	    depth[is_infinite] = np.inf
	    return depth, unit


	def write_depth(
	    path: Union[str, os.PathLike, IO],
	    depth: np.ndarray,
	    unit: float = None,
	    max_range: float = 1e5,
	    compression_level: int = 7,
	):
	    """
	    Encode and write a depth image as 16-bit PNG format.
	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or file object to write to.
	    - `depth: np.ndarray`
	        The depth array, float32 array of shape (H, W).
	        May contain `NaN` for invalid values and `Inf` for infinite values.
	    - `unit: float = None`
	        The unit of the depth values.
	    - `max_range: float = 1e5`
	        Upper bound on the stored `far / near` ratio; larger depths are clipped to `far`.
	    - `compression_level: int = 7`
	        The compression level for PNG compression.

	    Depth values are encoded as follows:
	    - 0: unknown
	    - 1 ~ 65534: depth values in logarithmic
	    - 65535: infinity

	    metadata is stored in the PNG file as text fields:
	    - `near`: the minimum depth value
	    - `far`: the maximum depth value
	    - `unit`: the unit of the depth values (optional)
	    """
	    mask_values, mask_nan, mask_inf = np.isfinite(depth), np.isnan(depth), np.isinf(depth)

	    depth = depth.astype(np.float32)
	    if mask_values.any():
	        finite_depth = depth[mask_values]
	        near = max(finite_depth.min(), 1e-5)
	        far = max(near * 1.1, min(finite_depth.max(), near * max_range))
	    else:
	        # No finite pixel: every code will be 0 or 65535, so the range is
	        # only a placeholder that keeps the metadata well-formed.
	        near = 1e-5
	        far = near * 1.1

	    # Position of each depth between near and far in log space, in [0, 1].
	    log_position = np.log(np.nan_to_num(depth, nan=0).clip(near, far) / near) / np.log(far / near)
	    encoded = 1 + np.round(log_position.clip(0, 1) * 65533).astype(np.uint16)  # 1~65534
	    encoded[mask_nan] = 0
	    encoded[mask_inf] = 65535

	    pil_image = Image.fromarray(encoded)
	    pnginfo = PngImagePlugin.PngInfo()
	    pnginfo.add_text('near', str(near))
	    pnginfo.add_text('far', str(far))
	    if unit is not None:
	        pnginfo.add_text('unit', str(unit))
	    # The format is given explicitly: Pillow otherwise infers it from the file
	    # name, which a nameless file object (e.g. BytesIO) does not have.
	    pil_image.save(path, format='PNG', pnginfo=pnginfo, compress_level=compression_level)


	def read_segmentation(path: Union[str, os.PathLike, IO]) -> Tuple[np.ndarray, Dict[str, int]]:
	    """
	    Load a segmentation mask PNG together with its optional label mapping.
	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or file object to read from.
	    ### Returns:
	    - `Tuple[np.ndarray, Dict[str, int]]`
	        A tuple containing:
	        - `mask`: the image converted to a numpy array (uint8 or uint16, shape (H, W)).
	        - `labels`: the `labels` PNG text field parsed as JSON, a dictionary of
	          {label_name: label_id}, or `None` when the file has no such field.
	    """
	    from_filesystem = isinstance(path, (str, os.PathLike))
	    raw = Path(path).read_bytes() if from_filesystem else path.read()
	    png = Image.open(io.BytesIO(raw))

	    labels = None
	    if 'labels' in png.info:
	        labels = json.loads(png.info['labels'])
	    return np.array(png), labels


	def write_segmentation(path: Union[str, os.PathLike, IO], mask: np.ndarray, labels: Dict[str, int] = None, compression_level: int = 7):
	    """
	    Write a segmentation mask and label mapping, as PNG format.
	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or file object to write to.
	    - `mask: np.ndarray`
	        The segmentation mask, uint8 or uint16 array of shape (H, W).
	    - `labels: Dict[str, int] = None`
	        The label mapping, a dictionary of {label_name: label_id}.
	        Stored as compact JSON in the `labels` PNG text field when given.
	    - `compression_level: int = 7`
	        The compression level for PNG compression.
	    ### Raises:
	    - `AssertionError` if `mask` is neither uint8 nor uint16.
	    """
	    assert mask.dtype == np.uint8 or mask.dtype == np.uint16, f"Unsupported dtype {mask.dtype}"
	    pil_image = Image.fromarray(mask)
	    pnginfo = PngImagePlugin.PngInfo()
	    if labels is not None:
	        labels_json = json.dumps(labels, ensure_ascii=True, separators=(',', ':'))
	        pnginfo.add_text('labels', labels_json)
	    # The format is given explicitly: Pillow otherwise infers it from the file
	    # name, which a nameless file object (e.g. BytesIO) does not have.
	    pil_image.save(path, format='PNG', pnginfo=pnginfo, compress_level=compression_level)



	def read_normal(path: Union[str, os.PathLike, IO]) -> np.ndarray:
	    """
	    Read a normal image, return float32 normal array of shape (H, W, 3).

	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or file object to read from.
	    ### Returns:
	    - `np.ndarray`
	        Normals rescaled from 16-bit codes to [-1, 1], with the second and third
	        channels sign-flipped, then normalized to unit length per pixel.
	        Pixels whose three channels are all zero are returned as `NaN`.
	    """
	    if isinstance(path, (str, os.PathLike)):
	        data = Path(path).read_bytes()
	    else:
	        data = path.read()
	    encoded = cv2.cvtColor(cv2.imdecode(np.frombuffer(data, np.uint8), cv2.IMREAD_UNCHANGED), cv2.COLOR_BGR2RGB)
	    mask_nan = np.all(encoded == 0, axis=-1)
	    # A float32 scale keeps the result float32; a plain Python list would
	    # promote the product to float64.
	    axis_scale = np.array([2.0, -2.0, -2.0], dtype=np.float32)
	    normal = (encoded.astype(np.float32) / 65535 - 0.5) * axis_scale
	    # keepdims=True keeps the norm at shape (H, W, 1) so it broadcasts against
	    # the (H, W, 3) normals; an (H, W) norm would not.
	    normal = normal / (np.linalg.norm(normal, axis=-1, keepdims=True) + 1e-12)
	    normal[mask_nan] = np.nan
	    return normal


	def write_normal(path: Union[str, os.PathLike, IO], normal: np.ndarray, compression_level: int = 7) -> None:
	    """
	    Write a normal image, input float32 normal array of shape (H, W, 3).

	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or file object to write to.
	    - `normal: np.ndarray`
	        The normal array. Components are mapped from [-1, 1] to 16-bit codes
	        (second and third channels sign-flipped). A pixel containing any `NaN`
	        is stored as all zeros.
	    - `compression_level: int = 7`
	        The compression level for PNG compression.
	    """
	    mask_nan = np.isnan(normal).any(axis=-1)
	    scaled = (normal * [0.5, -0.5, -0.5] + 0.5).clip(0, 1) * 65535
	    # Zero invalid pixels before the integer cast: converting NaN to uint16 is
	    # undefined and triggers a RuntimeWarning. `scaled` is a fresh array, so
	    # the caller's input is not modified.
	    scaled[mask_nan] = 0
	    encoded = scaled.astype(np.uint16)
	    data = cv2.imencode('.png', cv2.cvtColor(encoded, cv2.COLOR_RGB2BGR), [cv2.IMWRITE_PNG_COMPRESSION, compression_level])[1].tobytes()
	    if isinstance(path, (str, os.PathLike)):
	        Path(path).write_bytes(data)
	    else:
	        path.write(data)

	def read_meta(path: Union[str, os.PathLike, IO]) -> Dict[str, Any]:
	    """
	    Read JSON metadata and return the decoded object.

	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or a readable file object (text or binary) to read from.
	    ### Returns:
	    - The value produced by `json.loads` on the file content.
	    """
	    if isinstance(path, (str, os.PathLike)):
	        data = Path(path).read_text()
	    else:
	        # File objects cannot be wrapped in Path; json.loads accepts both
	        # str and bytes, so text and binary streams both work.
	        data = path.read()
	    return json.loads(data)

	def write_meta(path: Union[str, os.PathLike, IO], meta: Dict[str, Any]):
	    """
	    Serialize `meta` as JSON and write it to a path or file object.

	    ### Parameters:
	    - `path: Union[str, os.PathLike, IO]`
	        The file path or a writable file object to write to. Text streams
	        receive the JSON string; any other file object receives it as bytes.
	    - `meta: Dict[str, Any]`
	        The metadata to serialize with `json.dumps`.
	    """
	    text = json.dumps(meta)
	    if isinstance(path, (str, os.PathLike)):
	        Path(path).write_text(text)
	    elif isinstance(path, io.TextIOBase):
	        path.write(text)
	    else:
	        # json.dumps escapes non-ASCII by default, so the encoding is lossless.
	        path.write(text.encode('utf-8'))