Spaces:

ybelkada
/

FocusOnDepth

Runtime error

App Files Files Community

FocusOnDepth / app.py

ybelkada

add enable queue + cache example

5a568bc about 3 years ago

raw

history blame contribute delete

2.74 kB

	import torch
	import gradio as gr
	import numpy as np

	import requests
	from PIL import Image
	from io import BytesIO
	from torchvision import transforms

	from transformers import AutoConfig, AutoModel
	from transformers import AutoModel

	from focusondepth.model_config import FocusOnDepthConfig
	from focusondepth.model_definition import FocusOnDepth

	# Teach the transformers Auto* factories about the custom FocusOnDepth
	# architecture so `AutoModel.from_pretrained` below can resolve it.
	AutoConfig.register("focusondepth", FocusOnDepthConfig)
	AutoModel.register(FocusOnDepthConfig, FocusOnDepth)

	# Preprocessing applied to every input image: resize to 384x384, convert to
	# a tensor, then normalize each of the three channels with mean 0.5 / std 0.5.
	_preprocessing_steps = [
	    transforms.Resize((384, 384)),
	    transforms.ToTensor(),
	    transforms.Normalize(mean=[0.5, 0.5, 0.5], std=[0.5, 0.5, 0.5]),
	]
	transform = transforms.Compose(_preprocessing_steps)

	# Weights are fetched once, at import time, and shared by every request.
	model = AutoModel.from_pretrained(
	    'ybelkada/focusondepth',
	    trust_remote_code=True,
	)

	@torch.no_grad()
	def inference(input_image):
	    """Predict a depth map and a segmentation mask for a single image.

	    Args:
	        input_image: Image data accepted by ``PIL.Image.fromarray``.

	    Returns:
	        A two-element list ``[depth, segmentation]`` of PIL images, both
	        resized back to the size of the input image.
	    """
	    # `model` and `transform` are module-level names that are only read
	    # here, so no `global` declaration is required.
	    model.eval()

	    # Force three channels: the Normalize step in `transform` is configured
	    # with 3-element mean/std, so grayscale or RGBA input would fail there.
	    pil_image = Image.fromarray(input_image).convert("RGB")
	    original_size = pil_image.size
	    batch = transform(pil_image).unsqueeze(0)  # add the batch dimension

	    depth, segmentation = model(batch)
	    # Invert the predicted depth values before rendering.
	    # NOTE(review): assumes the model emits depth in [0, 1]; values outside
	    # that range would not render correctly via ToPILImage — confirm.
	    depth = 1 - depth

	    to_pil = transforms.ToPILImage()
	    depth_image = to_pil(depth[0, :])
	    # Collapse the class dimension to the per-pixel winning class index.
	    segmentation_image = to_pil(segmentation.argmax(dim=1).float())

	    # Bicubic for the continuous depth map; nearest-neighbour for the mask so
	    # resizing does not invent intermediate label values.
	    return [
	        depth_image.resize(original_size, resample=Image.BICUBIC),
	        segmentation_image.resize(original_size, resample=Image.NEAREST),
	    ]

	# HTML blurb shown with the demo; passed to gr.Interface(description=...).
	# NOTE(review): the <div> opened on the "Credits" line is never closed
	# before </center> — confirm whether a closing </div> was intended.
	description = """
	<center>
	Can a single model predict both segmentation and depth estimation? At least, if the segmentation is constrained for a single class, the answer is yes! <br>
	In this project, we use a DPT model to predict the depth and the segmentation mask of the class human, of an image. This model could be potentially used for an autofocus application where you would need the segmentation mask of the humans on the picture, as well as the depth estimation of the scene<br>
	Credits also to <div style='text-align: center;'><a href='https://github.com/antocad' target='_blank'>@antocad</a> !
	</center>
	"""
	# Page title; passed to gr.Interface(title=...).
	title="""
	FocusOnDepth - A single DPT encoder for Dense Prediction Tasks
	"""
	# Custom stylesheet passed to gr.Interface(css=...); contains no rules.
	css = """
	"""
	# Attribution and link text; passed to gr.Interface(article=...).
	# NOTE(review): the backslash before the pipe between the two links is not a
	# recognized Python escape sequence, so the backslash stays in the string —
	# confirm whether a plain pipe was intended.
	article = """
	<center>
	Example image taken from <a href="https://www.flickr.com/photos/17423713@N03/29129350066">here</a>. The image is free to share and use. <br>
	</center>
	<div style='text-align: center;'><a href='https://github.com/isl-org/DPT' target='_blank'>Original Paper</a> \| <a href='https://github.com/antocad/FocusOnDepth' target='_blank'>Extended Version</a></div>
	"""

	# One image in, two images out (depth map and segmentation map).
	# NOTE(review): `gr.inputs` / `gr.outputs` and passing `cache_examples` to
	# `launch()` look tied to a specific Gradio release — confirm the pinned
	# Gradio version before upgrading.
	_image_input = gr.inputs.Image(label="Input Image")
	_image_outputs = [
	    gr.outputs.Image(label="Depth Map:"),
	    gr.outputs.Image(label="Segmentation Map:"),
	]

	iface = gr.Interface(
	    fn=inference,
	    inputs=_image_input,
	    outputs=_image_outputs,
	    examples=['example_image.jpg'],
	    title=title,
	    description=description,
	    article=article,
	    css=css,
	)

	# Start the app with request queueing and example caching switched on.
	iface.launch(enable_queue=True, cache_examples=True)