Spaces:

zxhezexin
/

OpenLRM

Sleeping

App Files Files

OpenLRM / app.py

zxhezexin

Update spaces

f2a2544 9 months ago

raw

history blame

7.93 kB

	# Copyright (c) 2023-2024, Zexin He
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# https://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.


	import os
	from PIL import Image
	import numpy as np
	import gradio as gr


	def assert_input_image(input_image):
	    """
	    Guard used as the first step of the Generate click chain.

	    Args:
	        input_image: current value of the input image component.

	    Raises:
	        gr.Error: when ``input_image`` is ``None``.
	    """
	    if input_image is not None:
	        # Something was provided; nothing to report.
	        return
	    raise gr.Error("No image selected or uploaded!")

	def prepare_working_dir():
	    """
	    Create a fresh temporary directory for one generation request.

	    Returns:
	        A ``tempfile.TemporaryDirectory`` object; its ``name`` attribute is
	        the directory path that the other steps write into.
	    """
	    from tempfile import TemporaryDirectory
	    return TemporaryDirectory()

	def init_preprocessor():
	    """
	    Instantiate the module-level ``preprocessor`` used by ``preprocess_fn``.

	    The import is done lazily inside the function, so the ``openlrm``
	    package is only loaded when this is called.
	    """
	    global preprocessor
	    from openlrm.utils.preprocess import Preprocessor as _Preprocessor
	    preprocessor = _Preprocessor()

	def preprocess_fn(image_in: np.ndarray, remove_bg: bool, recenter: bool, working_dir):
	    """
	    Save the input image to disk and run the global preprocessor on it.

	    Args:
	        image_in: image data as a numpy array (passed to ``Image.fromarray``).
	        remove_bg: forwarded to the preprocessor as ``rmbg``.
	        recenter: forwarded to the preprocessor as ``recenter``.
	        working_dir: object whose ``name`` attribute is the directory to
	            write intermediate files into.

	    Returns:
	        Path of the processed image (``rembg.png`` inside the working directory).

	    Raises:
	        gr.Error: when the preprocessor reports failure.
	    """
	    image_raw = os.path.join(working_dir.name, "raw.png")
	    with Image.fromarray(image_in) as img:
	        img.save(image_raw)
	    image_out = os.path.join(working_dir.name, "rembg.png")
	    success = preprocessor.preprocess(image_path=image_raw, save_path=image_out, rmbg=remove_bg, recenter=recenter)
	    # Explicit check instead of `assert`: asserts are stripped under `python -O`,
	    # which would let a failed run return a path to a file that may not exist.
	    if not success:
	        raise gr.Error("Failed under preprocess_fn!")
	    return image_out


	def demo_openlrm(infer_impl):
	    """
	    Build the Gradio UI around ``infer_impl``, then queue and launch it.

	    Args:
	        infer_impl: callable invoked with the keyword arguments
	            ``image_path``, ``source_cam_dist``, ``export_video``,
	            ``export_mesh``, ``dump_video_path`` and ``dump_mesh_path``.
	    """

	    def core_fn(image: str, source_cam_dist: float, working_dir):
	        """Run inference on ``image`` and return the path of the rendered video."""
	        dump_video_path = os.path.join(working_dir.name, "output.mp4")
	        dump_mesh_path = os.path.join(working_dir.name, "output.ply")
	        infer_impl(
	            image_path=image,
	            source_cam_dist=source_cam_dist,
	            export_video=True,
	            export_mesh=False,
	            dump_video_path=dump_video_path,
	            dump_mesh_path=dump_mesh_path,
	        )
	        return dump_video_path

	    def example_fn(image: np.ndarray):
	        """Preprocess and render one example image; returns (processed image path, video path)."""
	        from types import SimpleNamespace
	        from gradio.utils import get_cache_folder
	        # preprocess_fn and core_fn read the directory from `working_dir.name`.
	        # On a pathlib.Path, `.name` is only the final path component, so a
	        # nested or absolute cache folder would resolve to the wrong place.
	        # Wrap the full path in an object that exposes it as `.name` instead.
	        cache_dir = os.fspath(get_cache_folder())
	        os.makedirs(cache_dir, exist_ok=True)
	        working_dir = SimpleNamespace(name=cache_dir)
	        image = preprocess_fn(
	            image_in=image,
	            remove_bg=True,
	            recenter=True,
	            working_dir=working_dir,
	        )
	        video = core_fn(
	            image=image,
	            source_cam_dist=2.0,
	            working_dir=working_dir,
	        )
	        return image, video


	    _TITLE = '''OpenLRM: Open-Source Large Reconstruction Models'''

	    _DESCRIPTION = '''
	        <div>
	        <a style="display:inline-block" href='https://github.com/3DTopia/OpenLRM'><img src='https://img.shields.io/github/stars/3DTopia/OpenLRM?style=social'/></a>
	        <a style="display:inline-block; margin-left: .5em" href="https://huggingface.co/zxhezexin"><img src='https://img.shields.io/badge/Model-Weights-blue'/></a>
	        </div>
	        OpenLRM is an open-source implementation of Large Reconstruction Models.

	        <strong>Image-to-3D in 10 seconds!</strong>

	        <strong>Disclaimer:</strong> This demo uses `openlrm-mix-base-1.1` model with 288x288 rendering resolution here for a quick demonstration.
	    '''

	    with gr.Blocks(analytics_enabled=False) as demo:

	        # HEADERS
	        with gr.Row():
	            with gr.Column(scale=1):
	                gr.Markdown('# ' + _TITLE)
	        with gr.Row():
	            gr.Markdown(_DESCRIPTION)

	        # DISPLAY
	        with gr.Row():

	            with gr.Column(variant='panel', scale=1):
	                with gr.Tabs(elem_id="openlrm_input_image"):
	                    with gr.TabItem('Input Image'):
	                        with gr.Row():
	                            input_image = gr.Image(label="Input Image", image_mode="RGBA", width="auto", sources="upload", type="numpy", elem_id="content_image")

	            with gr.Column(variant='panel', scale=1):
	                with gr.Tabs(elem_id="openlrm_processed_image"):
	                    with gr.TabItem('Processed Image'):
	                        with gr.Row():
	                            processed_image = gr.Image(label="Processed Image", image_mode="RGBA", type="filepath", elem_id="processed_image", width="auto", interactive=False)

	            with gr.Column(variant='panel', scale=1):
	                with gr.Tabs(elem_id="openlrm_render_video"):
	                    with gr.TabItem('Rendered Video'):
	                        with gr.Row():
	                            output_video = gr.Video(label="Rendered Video", format="mp4", width="auto", autoplay=True)

	        # SETTING
	        with gr.Row():
	            with gr.Column(variant='panel', scale=1):
	                with gr.Tabs(elem_id="openlrm_attrs"):
	                    with gr.TabItem('Settings'):
	                        with gr.Column(variant='panel'):
	                            gr.Markdown(
	                                """
	                                <strong>Best Practice</strong>:
	                                Centered objects in reasonable sizes. Try adjusting source camera distances.
	                                """
	                            )
	                            checkbox_rembg = gr.Checkbox(True, label='Remove background')
	                            checkbox_recenter = gr.Checkbox(True, label='Recenter the object')
	                            slider_cam_dist = gr.Slider(1.0, 3.5, value=2.0, step=0.1, label="Source Camera Distance")
	                            submit = gr.Button('Generate', elem_id="openlrm_generate", variant='primary')

	        # EXAMPLES
	        with gr.Row():
	            examples = [
	                ['assets/sample_input/owl.png'],
	                ['assets/sample_input/building.png'],
	                ['assets/sample_input/mailbox.png'],
	                ['assets/sample_input/fire.png'],
	                ['assets/sample_input/girl.png'],
	                ['assets/sample_input/lamp.png'],
	                ['assets/sample_input/hydrant.png'],
	                ['assets/sample_input/hotdogs.png'],
	                ['assets/sample_input/traffic.png'],
	                ['assets/sample_input/ceramic.png'],
	            ]
	            gr.Examples(
	                examples=examples,
	                inputs=[input_image],
	                outputs=[processed_image, output_video],
	                fn=example_fn,
	                # Example caching is switched off when SYSTEM == 'spaces'.
	                cache_examples=os.getenv('SYSTEM') != 'spaces',
	                examples_per_page=20,
	            )

	        # Per-session holder for the working directory created on each click.
	        working_dir = gr.State()
	        # Each `.success` step runs only if the previous step did not raise:
	        # validate input -> create working dir -> preprocess -> render.
	        submit.click(
	            fn=assert_input_image,
	            inputs=[input_image],
	            queue=False,
	        ).success(
	            fn=prepare_working_dir,
	            outputs=[working_dir],
	            queue=False,
	        ).success(
	            fn=preprocess_fn,
	            inputs=[input_image, checkbox_rembg, checkbox_recenter, working_dir],
	            outputs=[processed_image],
	        ).success(
	            fn=core_fn,
	            inputs=[processed_image, slider_cam_dist, working_dir],
	            outputs=[output_video],
	        )

	        demo.queue()
	        demo.launch()


	def launch_gradio_app():
	    """
	    Configure the app environment, create the inferrer and start the demo.

	    The environment variables are written before the ``openlrm`` imports
	    below, and the runner class is looked up in ``REGISTRY_RUNNERS`` under
	    the ``APP_TYPE`` value.
	    """
	    app_env = {
	        "APP_ENABLED": "1",
	        "APP_MODEL_NAME": "zxhezexin/openlrm-mix-base-1.1",
	        "APP_INFER": "./configs/infer-gradio.yaml",
	        "APP_TYPE": "infer.lrm",
	        "NUMBA_THREADING_LAYER": 'omp',
	    }
	    for env_key, env_value in app_env.items():
	        os.environ[env_key] = env_value

	    from openlrm.runners import REGISTRY_RUNNERS
	    from openlrm.runners.infer.base_inferrer import Inferrer

	    runner_key = os.getenv("APP_TYPE")
	    InferrerClass : Inferrer = REGISTRY_RUNNERS[runner_key]
	    with InferrerClass() as inferrer:
	        init_preprocessor()
	        running_on_spaces = os.getenv('SYSTEM') == 'spaces'
	        if running_on_spaces:
	            demo = demo_openlrm
	        else:
	            # Outside Spaces the demo builder is wrapped with the project's
	            # `no_proxy` helper (its exact effect is defined in openlrm.utils.proxy).
	            from openlrm.utils.proxy import no_proxy
	            demo = no_proxy(demo_openlrm)
	        demo(infer_impl=inferrer.infer_single)


	# Script entry point: start the Gradio app only when this file is executed directly.
	if "__main__" == __name__:
	    launch_gradio_app()