# L4GM-demo / blender_scripts / render_objaverse.py
# Provenance: migrated from GitHub by fffiloni (commit 2cdb96e, verified).
# (The lines "raw / history blame / 19.3 kB" in the original were Hugging Face
# page chrome captured by the scrape, not part of the script.)
# SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import argparse, sys, os, math, re
import bpy
from mathutils import Vector, Matrix
import numpy as np
import cv2
import signal
from contextlib import contextmanager
from loguru import logger
from typing import Any, Callable, Dict, Generator, List, Literal, Optional, Set, Tuple
import random
class TimeoutException(Exception):
    """Raised by time_limit() when the wrapped block exceeds its time budget."""
# Emitted at import time so the Blender console shows when this script begins.
logger.info('Rendering started.')
@contextmanager
def time_limit(seconds):
    """Limit the wrapped block to *seconds* of wall-clock time.

    Uses SIGALRM, so this only works on Unix and only in the main thread.

    Args:
        seconds (int): Whole seconds before the alarm fires.

    Raises:
        TimeoutException: If the block does not finish within *seconds*.
    """
    def _raise_timeout(signum, frame):
        raise TimeoutException("Timed out!")
    # Bug fix: remember and restore the previous SIGALRM handler instead of
    # permanently clobbering it for the rest of the process.
    previous_handler = signal.signal(signal.SIGALRM, _raise_timeout)
    signal.alarm(seconds)
    try:
        yield
    finally:
        signal.alarm(0)  # cancel any pending alarm
        signal.signal(signal.SIGALRM, previous_handler)
# ---------------------------------------------------------------------------
# CLI. Blender invokes this script as:
#   blender ... --python render_objaverse.py -- <script args>
# so everything after the "--" separator belongs to this script.
# ---------------------------------------------------------------------------
parser = argparse.ArgumentParser(description='Renders given obj file by rotation a camera around it.')
parser.add_argument(
    '--seed', type=int, default=0,
    help='random seed for the camera-pose sampler')  # fixed: was a copy-pasted "number of views" help string
parser.add_argument(
    '--views', type=int, default=4,
    help='number of views to be rendered')
parser.add_argument(
    'obj', type=str,
    help='Path to the obj file to be rendered.')
parser.add_argument(
    '--output_folder', type=str, default='/tmp',
    help='The path the output will be dumped to.')
parser.add_argument(
    '--scale', type=float, default=1,
    help='Scaling factor applied to model. Depends on size of mesh.')
parser.add_argument(
    '--format', type=str, default='PNG',
    help='Format of files generated. Either PNG or OPEN_EXR')
parser.add_argument(
    '--resolution', type=int, default=512,
    help='Resolution of the images.')
parser.add_argument(
    '--engine', type=str, default='CYCLES',
    help='Blender internal engine for rendering. E.g. CYCLES, BLENDER_EEVEE, ...')
parser.add_argument(
    '--gpu', type=int, default=0,
    help='gpu.')
parser.add_argument(
    '--animation_idx', type=int, default=0,
    help='The index of animation')
parser.add_argument(
    '--camera_option', type=str, default='fixed',
    help='Camera Options')
parser.add_argument(
    '--fixed_animation_length', type=int, default=-1,
    help='Set animation length to fixed number of frames')  # typo fix: "framnes"
parser.add_argument(
    '--step_angle', type=int, default=3,
    help='Angle in degree for each step camera rotation')
parser.add_argument(
    '--downsample', type=int, default=1,
    help='Downsample ratio. No downsample by default')
# Robustness fix: the original crashed with ValueError when "--" was absent
# (e.g. when the script is run outside Blender); fall back to all CLI args.
if "--" in sys.argv:
    argv = sys.argv[sys.argv.index("--") + 1:]
else:
    argv = sys.argv[1:]
args = parser.parse_args(argv)
# Output layout: <output_folder>/<synset>/<model>/<animation_idx:03d>/...
# where synset/model are derived from the input path's last two components.
model_identifier = os.path.split(args.obj)[1].split('.')[0]
synset_idx = args.obj.split('/')[-2]
save_root = os.path.join(os.path.abspath(args.output_folder), synset_idx, model_identifier, f'{args.animation_idx:03d}')
# Set up rendering: shared handles to the active context/scene/render settings.
context = bpy.context
scene = bpy.context.scene
render = bpy.context.scene.render
# Engine comes from the CLI (default CYCLES).
render.engine = args.engine# 'BLENDER_EEVEE'
render.image_settings.color_mode = 'RGBA' # ('RGB', 'RGBA', ...)
render.image_settings.file_format = args.format # ('PNG', 'OPEN_EXR', 'JPEG, ...)
render.resolution_x = args.resolution
render.resolution_y = args.resolution
render.resolution_percentage = 100
# Tiny pixel-filter width keeps silhouettes crisp; transparent film so the
# PNG alpha channel encodes the object mask used later.
bpy.context.scene.cycles.filter_width = 0.01
bpy.context.scene.render.film_transparent = True
render_depth_normal = False  # NOTE(review): assigned but never read anywhere in this file
# Low bounce counts + 16 samples + denoising: fast, preview-quality renders.
bpy.context.scene.cycles.device = 'GPU'
bpy.context.scene.cycles.diffuse_bounces = 1
bpy.context.scene.cycles.glossy_bounces = 1
bpy.context.scene.cycles.transparent_max_bounces = 1
bpy.context.scene.cycles.transmission_bounces = 1
bpy.context.scene.cycles.samples = 16
bpy.context.scene.cycles.use_denoising = True
bpy.context.scene.cycles.denoiser = 'OPTIX'
bpy.context.preferences.addons['cycles'].preferences.compute_device_type = 'CUDA'
bpy.context.scene.cycles.device = 'GPU'  # re-set; duplicate of the assignment above
def enable_cuda_devices():
    """Enable GPU compute devices for Cycles rendering.

    Tries to set the compute device type to CUDA, then OpenCL, then NONE
    (first one the Blender build accepts wins). If any CUDA/OpenCL device is
    present, only those devices are enabled; otherwise every device (assumed
    CPU) is enabled.

    Returns:
        bool: True if at least one CUDA/OpenCL device was found.
    """
    prefs = bpy.context.preferences
    cprefs = prefs.addons['cycles'].preferences
    cprefs.get_devices()
    # Attempt to set GPU device types if available; unsupported types raise
    # TypeError, so fall through to the next candidate.
    for compute_device_type in ('CUDA', 'OPENCL', 'NONE'):
        try:
            cprefs.compute_device_type = compute_device_type
            print("Compute device selected: {0}".format(compute_device_type))
            break
        except TypeError:
            pass
    # Any CUDA/OPENCL devices? (Bug fix: the original had a dead assignment
    # including 'OPTIX' that was immediately overwritten by this one.)
    acceleratedTypes = ['CUDA', 'OPENCL']
    accelerated = any(device.type in acceleratedTypes for device in cprefs.devices)
    print('Accelerated render = {0}'.format(accelerated))
    # If we have CUDA/OPENCL devices, enable only them, otherwise enable
    # all devices (assumed to be CPU)
    print(cprefs.devices)
    for idx, device in enumerate(cprefs.devices):
        # NOTE(review): a per-GPU filter (`and idx == args.gpu`) was left
        # commented out upstream; all matching devices are enabled.
        device.use = (not accelerated or device.type in acceleratedTypes)
        print('Device enabled ({type}) = {enabled}'.format(type=device.type, enabled=device.use))
    return accelerated
enable_cuda_devices()
# Delete the currently active object (Blender's default startup cube) so the
# imported asset is the only geometry in the scene.
context.active_object.select_set(True)
bpy.ops.object.delete()
# Import textured mesh (glTF). The import is wrapped in a SIGALRM-based
# timeout so a pathological asset cannot hang the whole rendering job.
bpy.ops.object.select_all(action='DESELECT')
try:
    with time_limit(1000):
        imported_object = bpy.ops.import_scene.gltf(filepath=args.obj, merge_vertices=True, guess_original_bind_pose=False, bone_heuristic="TEMPERANCE")
except TimeoutException as e:
    print("Timed out finished!")
    exit()
# count animated frames
# Imported actions appear to be named "<animation>_<object>"; recover the
# animation name by stripping the longest imported-object-name suffix that
# matches. TODO(review): confirm this naming convention against the importer.
animation_names = []
ending_frame_list = {}  # animation name -> largest ending frame across objects
for k in bpy.data.actions.keys():
    matched_obj_name = ''
    for obj in bpy.context.selected_objects:
        # Prefer the longest object name so e.g. "Arm" doesn't shadow "Arm.001".
        if '_'+obj.name in k and len(obj.name) > len(matched_obj_name):
            matched_obj_name = obj.name
    a_name = k.replace('_'+matched_obj_name, '')
    a = bpy.data.actions[k]
    frame_start, frame_end = map(int, a.frame_range)
    logger.info(f'{k} | frame start: {frame_start}, frame end: {frame_end} | fps: {bpy.context.scene.render.fps}')
    if a_name not in animation_names:
        animation_names.append(a_name)
        ending_frame_list[a_name] = frame_end
    else:
        # Same animation drives several objects; keep the longest span.
        ending_frame_list[a_name] = max(frame_end, ending_frame_list[a_name])
# Select the requested animation and bind its per-object actions.
selected_a_name = animation_names[args.animation_idx]
max_frame = ending_frame_list[selected_a_name]
for obj in bpy.context.selected_objects:
    if obj.animation_data is not None:
        obj_a_name = selected_a_name+'_'+obj.name
        if obj_a_name in bpy.data.actions:
            print('Found ', obj_a_name)
            obj.animation_data.action = bpy.data.actions[obj_a_name]
        else:
            print('Miss ', obj_a_name)
# Honor --fixed_animation_length when given, then apply the --downsample stride.
num_frames = args.fixed_animation_length if args.fixed_animation_length != -1 else max_frame
num_frames = num_frames // args.downsample
if num_frames == 0:
    print("No animation!")
    exit()
# from https://github.com/allenai/objaverse-xl/blob/main/scripts/rendering/blender_script.py
def get_3x4_RT_matrix_from_blender(cam: bpy.types.Object):
    """Return the 3x4 world-to-camera [R|T] matrix for the given camera.

    Taken from Zero123, which in turn was taken from
    https://github.com/panmari/stanford-shapenet-renderer/blob/master/render_blender.py

    Args:
        cam (bpy.types.Object): The camera object.

    Returns:
        Matrix: The 3x4 RT matrix.
    """
    # matrix_world bakes in every constraint (e.g. the TRACK_TO used here).
    loc, rot = cam.matrix_world.decompose()[0:2]
    world_to_cam_rot = rot.to_matrix().transposed()
    world_to_cam_trans = -1 * world_to_cam_rot @ loc
    # Assemble [R|T] row by row into a 3x4 matrix.
    rows = []
    for axis in range(3):
        rows.append(world_to_cam_rot[axis][:] + (world_to_cam_trans[axis],))
    return Matrix(tuple(rows))
def _create_light(
    name: str,
    light_type: Literal["POINT", "SUN", "SPOT", "AREA"],
    location: Tuple[float, float, float],
    rotation: Tuple[float, float, float],
    energy: float,
    use_shadow: bool = False,
    specular_factor: float = 1.0,
):
    """Create a light and link it into the active collection.

    Args:
        name (str): Name shared by the light datablock and its object.
        light_type (Literal["POINT", "SUN", "SPOT", "AREA"]): Blender light type.
        location (Tuple[float, float, float]): World-space location.
        rotation (Tuple[float, float, float]): Euler rotation (radians).
        energy (float): Light strength.
        use_shadow (bool, optional): Whether the light casts shadows. Defaults to False.
        specular_factor (float, optional): Specular intensity multiplier. Defaults to 1.0.

    Returns:
        bpy.types.Object: The newly created light object.
    """
    data = bpy.data.lights.new(name=name, type=light_type)
    # Configure the datablock, then wrap it in an object and place it.
    data.use_shadow = use_shadow
    data.specular_factor = specular_factor
    data.energy = energy
    obj = bpy.data.objects.new(name, data)
    obj.location = location
    obj.rotation_euler = rotation
    bpy.context.collection.objects.link(obj)
    return obj
def randomize_lighting() -> Dict[str, bpy.types.Object]:
    """Replace all lights with a fixed four-sun studio setup.

    Despite the name, the energies are hard-coded (the random choices are
    disabled upstream), so the result is deterministic.

    Returns:
        Dict[str, bpy.types.Object]: The lights, keyed by "key_light",
        "fill_light", "rim_light", and "bottom_light".
    """
    # Clear existing lights.
    bpy.ops.object.select_all(action="DESELECT")
    bpy.ops.object.select_by_type(type="LIGHT")
    bpy.ops.object.delete()
    # slot -> (object name, euler rotation in radians, energy)
    specs = {
        "key_light": ("Key_Light", (0.785398, 0, -0.785398), 4),
        "fill_light": ("Fill_Light", (0.785398, 0, 2.35619), 3),
        "rim_light": ("Rim_Light", (-0.785398, 0, -3.92699), 4),
        "bottom_light": ("Bottom_Light", (3.14159, 0, 0), 2),
    }
    return {
        slot: _create_light(
            name=light_name,
            light_type="SUN",
            location=(0, 0, 0),
            rotation=euler,
            energy=energy,
        )
        for slot, (light_name, euler, energy) in specs.items()
    }
def scene_bbox(
    single_obj=None, ignore_matrix=False
):
    """Return the bounding box of the scene across all animation frames.

    Adapted from the Shap-E rendering script
    (https://github.com/openai/shap-e/blob/main/shap_e/rendering/blender/blender_script.py#L68-L82),
    extended here to step through every (downsampled) animation frame so the
    box covers the whole motion.

    Args:
        single_obj (Optional[bpy.types.Object], optional): If given, only this
            object's bounding box is computed. Defaults to None.
        ignore_matrix (bool, optional): If True, skip the object-to-world
            transform. Defaults to False.

    Raises:
        RuntimeError: If there are no objects to measure.

    Returns:
        Tuple[Vector, Vector]: Minimum and maximum corners of the box.
    """
    lo = [math.inf] * 3
    hi = [-math.inf] * 3
    seen_any = False
    for frame_idx in range(num_frames):
        bpy.context.scene.frame_set(frame_idx * args.downsample)
        targets = get_scene_meshes() if single_obj is None else [single_obj]
        for obj in targets:
            seen_any = True
            for corner in obj.bound_box:
                point = Vector(corner)
                if not ignore_matrix:
                    point = obj.matrix_world @ point
                for axis in range(3):
                    lo[axis] = min(lo[axis], point[axis])
                    hi[axis] = max(hi[axis], point[axis])
    if not seen_any:
        raise RuntimeError("no objects in scene to compute bounding box for")
    return Vector(lo), Vector(hi)
def get_scene_meshes():
    """Yield every object in the current scene whose data is a Mesh.

    Yields:
        Generator[bpy.types.Object, None, None]: Each mesh object.
    """
    yield from (
        candidate
        for candidate in bpy.context.scene.objects.values()
        if isinstance(candidate.data, bpy.types.Mesh)
    )
def get_scene_root_objects():
    """Yield every parentless (root) object in the current scene.

    Yields:
        Generator[bpy.types.Object, None, None]: Each object with no parent.
    """
    for candidate in bpy.context.scene.objects.values():
        if not candidate.parent:
            yield candidate
def normalize_scene():
    """Normalizes the scene by scaling and translating it to fit in a unit cube centered
    at the origin.
    Mostly taken from the Point-E / Shap-E rendering script
    (https://github.com/openai/point-e/blob/main/point_e/evals/scripts/blender_script.py#L97-L112),
    but fix for multiple root objects: (see bug report here:
    https://github.com/openai/shap-e/pull/60).
    Returns:
        None
    """
    if len(list(get_scene_root_objects())) > 1:
        # create an empty object to be used as a parent for all root objects,
        # so the whole scene can be scaled/moved as one unit
        parent_empty = bpy.data.objects.new("ParentEmpty", None)
        bpy.context.scene.collection.objects.link(parent_empty)
        # parent all root objects to the empty object
        for obj in get_scene_root_objects():
            if obj != parent_empty:
                obj.parent = parent_empty
    # Scale so the largest bbox dimension (across all animation frames,
    # see scene_bbox) becomes 1.
    bbox_min, bbox_max = scene_bbox()
    scale = 1 / max(bbox_max - bbox_min)
    logger.info(f"Scale: {scale}")
    for obj in get_scene_root_objects():
        obj.scale = obj.scale * scale
    # Apply scale to matrix_world.
    bpy.context.view_layer.update()
    # Recompute the bbox after scaling, then recenter the scene on the origin.
    bbox_min, bbox_max = scene_bbox()
    offset = -(bbox_min + bbox_max) / 2
    for obj in get_scene_root_objects():
        obj.matrix_world.translation += offset
    bpy.ops.object.select_all(action="DESELECT")
    # unparent the camera so it is not affected by the normalization transform
    bpy.data.objects["Camera"].parent = None
normalize_scene()
randomize_lighting()
# Place camera on the +Y axis, aimed back at the origin.
cam = scene.objects['Camera']
cam.location = (0, 1.5, 0)  # camera orbit radius is 1.5 (original comment said 1)
cam.data.lens = 35
cam.data.sensor_width = 32
# TRACK_TO constraint keeps the camera pointed at its target at all times.
cam_constraint = cam.constraints.new(type='TRACK_TO')
cam_constraint.track_axis = 'TRACK_NEGATIVE_Z'
cam_constraint.up_axis = 'UP_Y'
# Parent the camera to an empty at the origin; rotating the empty's Z/X euler
# angles orbits the camera (azimuth/elevation) around the object.
cam_empty = bpy.data.objects.new("Empty", None)
cam_empty.location = (0, 0, 0)
cam.parent = cam_empty
scene.collection.objects.link(cam_empty)
context.view_layer.objects.active = cam_empty
cam_constraint.target = cam_empty
# Azimuth increment between consecutive views, in degrees.
stepsize = 360.0 / args.views
rotation_mode = 'XYZ'  # NOTE(review): assigned but never read in this file
np.random.seed(args.seed)
def _render_single_view(view_idx, rotation_angle, elevation_angle):
    """Render every animation frame for one camera pose and post-process.

    Writes, under save_root/<view_idx:03d>/:
      camera/rotation.npy, camera/elevation.npy -- pose repeated once per frame
      camera/rt_matrix.npy                      -- 3x4 world-to-camera matrix
      img/<frame>.jpg                           -- RGB composited onto white
      mask/<frame>.png                          -- the alpha channel

    Args:
        view_idx (int): Index of this view (used as the folder name).
        rotation_angle: Azimuth in degrees (float or 1-element np.ndarray).
        elevation_angle: Elevation in degrees (float or 1-element np.ndarray).
    """
    img_folder = os.path.join(save_root, f'{view_idx:03d}', 'img')
    mask_folder = os.path.join(save_root, f'{view_idx:03d}', 'mask')
    camera_folder = os.path.join(save_root, f'{view_idx:03d}', 'camera')
    os.makedirs(img_folder, exist_ok=True)
    os.makedirs(mask_folder, exist_ok=True)
    os.makedirs(camera_folder, exist_ok=True)
    # The pose is constant within a view; repeat it per frame so downstream
    # loaders get per-frame arrays.
    np.save(os.path.join(camera_folder, 'rotation'), np.array([rotation_angle for _ in range(num_frames)]))
    np.save(os.path.join(camera_folder, 'elevation'), np.array([elevation_angle for _ in range(num_frames)]))
    # Rotating the parent empty orbits the camera around the object.
    cam_empty.rotation_euler[2] = math.radians(rotation_angle)
    cam_empty.rotation_euler[0] = math.radians(elevation_angle)
    # save camera RT matrix
    # NOTE(review): matrix_world may be stale until a depsgraph update; confirm
    # the saved RT reflects the rotation set just above.
    rt_matrix = get_3x4_RT_matrix_from_blender(cam)
    np.save(os.path.join(camera_folder, "rt_matrix.npy"), rt_matrix)
    # Render every (downsampled) animation frame to a transparent PNG.
    for i in range(0, num_frames):
        bpy.context.scene.frame_set(i * args.downsample)
        scene.render.filepath = os.path.join(img_folder, '%03d.png' % (i))
        bpy.ops.render.render(write_still=True)
    # Post-process: composite onto white, split out the alpha mask, drop the PNG.
    for i in range(0, num_frames):
        png_path = os.path.join(img_folder, '%03d.png' % (i))
        img = cv2.imread(png_path, cv2.IMREAD_UNCHANGED)
        mask = img[:, :, 3:4] / 255.0
        white_img = img[:, :, :3] * mask + np.ones_like(img[:, :, :3]) * (1 - mask) * 255
        white_img = np.clip(white_img, 0, 255)
        cv2.imwrite(os.path.join(img_folder, '%03d.jpg' % (i)), white_img)
        cv2.imwrite(os.path.join(mask_folder, '%03d.png' % (i)), img[:, :, 3])
        os.remove(png_path)  # replaces os.system('rm ...'): no shell, safe with odd paths

if args.camera_option == "fixed":
    for scene in bpy.data.scenes:
        scene.cycles.device = 'GPU'
    # Evenly spaced azimuths at zero elevation.
    elevation_angle = 0.
    rotation_angle = 0.
    for view_idx in range(args.views):
        _render_single_view(view_idx, rotation_angle + view_idx * stepsize, elevation_angle)
elif args.camera_option == "random":
    for scene in bpy.data.scenes:
        scene.cycles.device = 'GPU'
    for view_idx in range(args.views):
        # Elevation uniform in [-5, 30) deg, azimuth uniform in [0, 360) deg.
        elevation_angle = np.random.rand(1) * 35 - 5
        rotation_angle = np.random.rand(1) * 360
        _render_single_view(view_idx, rotation_angle, elevation_angle)
else:
    # Bug fix: the original raised `NotImplemented` (a constant, not an
    # exception class), which itself raises a TypeError.
    raise NotImplementedError(f"Unsupported camera_option: {args.camera_option}")