# -*- coding: utf-8 -*-

# Max-Planck-Gesellschaft zur Förderung der Wissenschaften e.V. (MPG) is
# holder of all proprietary rights on this computer program.
# You can only use this computer program if you have closed
# a license agreement with MPG or you get the right to use the computer
# program from someone who is authorized to grant you that right.
# Any use of the computer program without a valid license is prohibited and
# liable to prosecution.
#
# Copyright©2019 Max-Planck-Gesellschaft zur Förderung
# der Wissenschaften e.V. (MPG), acting on behalf of its Max Planck Institute
# for Intelligent Systems. All rights reserved.
#
# Contact: ps-license@tuebingen.mpg.de
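"""ICON inference: reconstruct a clothed 3D human from a single RGB image.

Per input image the script:
  1. fits SMPL(-X) body parameters by minimizing normal and silhouette losses,
  2. reconstructs the clothed mesh with the implicit network and remeshes it,
  3. refines the mesh with a regularized per-vertex local affine deformation,
  4. exports meshes, renders, optional videos, and (optionally) extracted garments.

Example invocation (flag values are illustrative):
    python -m apps.infer -cfg ./configs/icon-filter.yaml -gpu 0 \
        -in_dir ./examples -out_dir ./results -export_video
"""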
import argparse
import logging
import os
import pickle

import numpy as np
import torch
import trimesh
from PIL import Image
from pytorch3d.structures import Meshes
from termcolor import colored

from apps.ICON import ICON
from lib.common.cloth_extraction import extract_cloth
from lib.common.config import cfg
from lib.common.render import query_color, image2vid
from lib.dataset.mesh_util import (
    load_checkpoint,
    update_mesh_shape_prior_losses,
    get_optim_grid_image,
    blend_rgb_norm,
    unwrap,
    remesh,
    tensor2variable,
    normal_loss,
)
from lib.dataset.TestDataset import TestDataset
from lib.net.local_affine import LocalAffine

torch.backends.cudnn.benchmark = True
logging.getLogger("trimesh").setLevel(logging.ERROR)
if __name__ == "__main__":

    # loading cfg file
    parser = argparse.ArgumentParser()
    parser.add_argument("-gpu", "--gpu_device", type=int, default=0)
    parser.add_argument("-colab", action="store_true")
    parser.add_argument("-loop_smpl", "--loop_smpl", type=int, default=100)
    parser.add_argument("-patience", "--patience", type=int, default=5)
    parser.add_argument("-vis_freq", "--vis_freq", type=int, default=10)
    parser.add_argument("-loop_cloth", "--loop_cloth", type=int, default=200)
    parser.add_argument("-hps_type", "--hps_type", type=str, default="pymaf")
    parser.add_argument("-export_video", action="store_true")
    parser.add_argument("-in_dir", "--in_dir", type=str, default="./examples")
    parser.add_argument("-out_dir", "--out_dir", type=str, default="./results")
    parser.add_argument("-seg_dir", "--seg_dir", type=str, default=None)
    parser.add_argument("-cfg", "--config", type=str, default="./configs/icon-filter.yaml")

    args = parser.parse_args()
    # cfg read and merge
    cfg.merge_from_file(args.config)
    cfg.merge_from_file("./lib/pymaf/configs/pymaf_config.yaml")

    cfg_show_list = [
        "test_gpus", [args.gpu_device],
        "mcube_res", 256,
        "clean_mesh", True,
    ]

    cfg.merge_from_list(cfg_show_list)
    cfg.freeze()
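    # Expose the GPUs before the first CUDA call; the actual compute device
    # is still selected explicitly below via args.gpu_device.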
    os.environ["CUDA_VISIBLE_DEVICES"] = "0,1"
    device = torch.device(f"cuda:{args.gpu_device}")

    if args.colab:
        print(colored("colab environment...", "red"))
        from tqdm.notebook import tqdm
    else:
        print(colored("normal environment...", "red"))
        from tqdm import tqdm
    # load model and dataloader
    model = ICON(cfg)
    model = load_checkpoint(model, cfg)

    dataset_param = {
        'image_dir': args.in_dir,
        'seg_dir': args.seg_dir,
        'has_det': True,           # w/ or w/o detection
        'hps_type': args.hps_type  # pymaf/pare/pixie
    }

    if args.hps_type == "pixie" and "pamir" in args.config:
        print(colored("PIXIE isn't compatible with PaMIR, falling back to PyMAF", "red"))
        dataset_param["hps_type"] = "pymaf"

    dataset = TestDataset(dataset_param, device)

    print(colored(f"Dataset Size: {len(dataset)}", "green"))
    pbar = tqdm(dataset)

    for data in pbar:

        pbar.set_description(f"{data['name']}")

        in_tensor = {"smpl_faces": data["smpl_faces"], "image": data["image"]}

        # The optimizer and variables
        optimed_pose = torch.tensor(
            data["body_pose"], device=device, requires_grad=True)      # [1,23,3,3]
        optimed_trans = torch.tensor(
            data["trans"], device=device, requires_grad=True)          # [3]
        optimed_betas = torch.tensor(
            data["betas"], device=device, requires_grad=True)          # [1,10]
        optimed_orient = torch.tensor(
            data["global_orient"], device=device, requires_grad=True)  # [1,1,3,3]
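        # NOTE: body_pose / global_orient are optimized directly as rotation
        # matrices (hence pose2rot=False in the SMPL forward pass below);
        # SGD steps are not re-projected onto SO(3) between iterations.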
        optimizer_smpl = torch.optim.SGD(
            [optimed_pose, optimed_trans, optimed_betas, optimed_orient],
            lr=1e-3,
            momentum=0.9,
        )
        scheduler_smpl = torch.optim.lr_scheduler.ReduceLROnPlateau(
            optimizer_smpl,
            mode="min",
            factor=0.5,
            verbose=0,
            min_lr=1e-5,
            patience=args.patience,
        )
        losses = {
            "cloth": {"weight": 1e1, "value": 0.0},       # Cloth: Normal_recon - Normal_pred
            "stiffness": {"weight": 1e5, "value": 0.0},   # Cloth: [RT]_v1 - [RT]_v2 (v1-edge-v2)
            "rigid": {"weight": 1e5, "value": 0.0},       # Cloth: det(R) = 1
            "edge": {"weight": 0, "value": 0.0},          # Cloth: edge length
            "nc": {"weight": 0, "value": 0.0},            # Cloth: normal consistency
            "laplacian": {"weight": 1e2, "value": 0.0},   # Cloth: Laplacian smoothing
            "normal": {"weight": 1e0, "value": 0.0},      # Body: Normal_pred - Normal_smpl
            "silhouette": {"weight": 1e1, "value": 0.0},  # Body: Silhouette_pred - Silhouette_smpl
        }
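        # The same table drives both stages: the SMPL fitting below sums only
        # the "Body" terms (normal + silhouette), while the cloth refinement
        # later sums every non-body term with a non-zero weight.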
        # smpl optimization
        loop_smpl = tqdm(range(args.loop_smpl if cfg.net.prior_type != "pifu" else 1))

        per_data_lst = []

        for i in loop_smpl:

            per_loop_lst = []

            optimizer_smpl.zero_grad()

            if dataset_param["hps_type"] != "pixie":
                smpl_out = dataset.smpl_model(
                    betas=optimed_betas,
                    body_pose=optimed_pose,
                    global_orient=optimed_orient,
                    pose2rot=False,
                )
                smpl_verts = (smpl_out.vertices + optimed_trans) * data["scale"]
            else:
                smpl_verts, _, _ = dataset.smpl_model(
                    shape_params=optimed_betas,
                    expression_params=tensor2variable(data["exp"], device),
                    body_pose=optimed_pose,
                    global_pose=optimed_orient,
                    jaw_pose=tensor2variable(data["jaw_pose"], device),
                    left_hand_pose=tensor2variable(data["left_hand_pose"], device),
                    right_hand_pose=tensor2variable(data["right_hand_pose"], device),
                )
                smpl_verts = (smpl_verts + optimed_trans) * data["scale"]
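            # render_normal expects a mirrored axis convention, so the verts
            # are flipped by [1, -1, -1] here (and by [1, 1, -1] when cached
            # into in_tensor["smpl_verts"] at the end of each iteration).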
            # render optimized mesh (normal, T_normal, image [-1,1])
            in_tensor["T_normal_F"], in_tensor["T_normal_B"] = dataset.render_normal(
                smpl_verts * torch.tensor([1.0, -1.0, -1.0]).to(device),
                in_tensor["smpl_faces"],
            )
            T_mask_F, T_mask_B = dataset.render.get_silhouette_image()

            with torch.no_grad():
                in_tensor["normal_F"], in_tensor["normal_B"] = model.netG.normal_filter(
                    in_tensor
                )

            diff_F_smpl = torch.abs(in_tensor["T_normal_F"] - in_tensor["normal_F"])
            diff_B_smpl = torch.abs(in_tensor["T_normal_B"] - in_tensor["normal_B"])

            loss_F_smpl = normal_loss(in_tensor["T_normal_F"], in_tensor["normal_F"])
            loss_B_smpl = normal_loss(in_tensor["T_normal_B"], in_tensor["normal_B"])

            losses["normal"]["value"] = (loss_F_smpl + loss_B_smpl).mean()
            # silhouette loss
            smpl_arr = torch.cat([T_mask_F, T_mask_B], dim=-1)[0]
            gt_arr = torch.cat(
                [in_tensor["normal_F"][0], in_tensor["normal_B"][0]], dim=2
            ).permute(1, 2, 0)
            gt_arr = ((gt_arr + 1.0) * 0.5).to(device)
            bg_color = (
                torch.Tensor([0.5, 0.5, 0.5]).unsqueeze(0).unsqueeze(0).to(device)
            )
            gt_arr = ((gt_arr - bg_color).sum(dim=-1) != 0.0).float()
            diff_S = torch.abs(smpl_arr - gt_arr)
            losses["silhouette"]["value"] = diff_S.mean()
            # Weighted sum of the losses
            smpl_loss = 0.0
            pbar_desc = "Body Fitting --- "
            for k in ["normal", "silhouette"]:
                pbar_desc += f"{k}: {losses[k]['value'] * losses[k]['weight']:.3f} | "
                smpl_loss += losses[k]["value"] * losses[k]["weight"]
            pbar_desc += f"Total: {smpl_loss:.3f}"
            loop_smpl.set_description(pbar_desc)

            if i % args.vis_freq == 0:

                per_loop_lst.extend(
                    [
                        in_tensor["image"],
                        in_tensor["T_normal_F"],
                        in_tensor["normal_F"],
                        diff_F_smpl / 2.0,
                        diff_S[:, :512].unsqueeze(0).unsqueeze(0).repeat(1, 3, 1, 1),
                    ]
                )
                per_loop_lst.extend(
                    [
                        in_tensor["image"],
                        in_tensor["T_normal_B"],
                        in_tensor["normal_B"],
                        diff_B_smpl / 2.0,
                        diff_S[:, 512:].unsqueeze(0).unsqueeze(0).repeat(1, 3, 1, 1),
                    ]
                )
                per_data_lst.append(
                    get_optim_grid_image(per_loop_lst, None, nrow=5, type="smpl")
                )

            smpl_loss.backward()
            optimizer_smpl.step()
            scheduler_smpl.step(smpl_loss)

            in_tensor["smpl_verts"] = smpl_verts * torch.tensor([1.0, 1.0, -1.0]).to(device)
        # visualize the optimization process
        # 1. SMPL Fitting
        # 2. Clothes Refinement
        os.makedirs(os.path.join(args.out_dir, cfg.name, "refinement"), exist_ok=True)

        # visualize the final results in self-rotation mode
        os.makedirs(os.path.join(args.out_dir, cfg.name, "vid"), exist_ok=True)

        # final results rendered as image
        # 1. Render the final fitted SMPL (xxx_smpl.png)
        # 2. Render the final reconstructed clothed human (xxx_cloth.png)
        # 3. Blend the original image with predicted cloth normal (xxx_overlap.png)
        os.makedirs(os.path.join(args.out_dir, cfg.name, "png"), exist_ok=True)

        # final reconstruction meshes
        # 1. SMPL mesh (xxx_smpl.obj)
        # 2. SMPL params (xxx_smpl.npy)
        # 3. clothed mesh (xxx_recon.obj)
        # 4. remeshed clothed mesh (xxx_remesh.obj)
        # 5. refined clothed mesh (xxx_refine.obj)
        os.makedirs(os.path.join(args.out_dir, cfg.name, "obj"), exist_ok=True)
        if cfg.net.prior_type != "pifu":

            per_data_lst[0].save(
                os.path.join(
                    args.out_dir, cfg.name, f"refinement/{data['name']}_smpl.gif"
                ),
                save_all=True,
                append_images=per_data_lst[1:],
                duration=500,
                loop=0,
            )

            if args.vis_freq == 1:
                image2vid(
                    per_data_lst,
                    os.path.join(
                        args.out_dir, cfg.name, f"refinement/{data['name']}_smpl.avi"
                    ),
                )

            per_data_lst[-1].save(
                os.path.join(args.out_dir, cfg.name, f"png/{data['name']}_smpl.png")
            )

        norm_pred = (
            ((in_tensor["normal_F"][0].permute(1, 2, 0) + 1.0) * 255.0 / 2.0)
            .detach()
            .cpu()
            .numpy()
            .astype(np.uint8)
        )

        norm_orig = unwrap(norm_pred, data)
        mask_orig = unwrap(
            np.repeat(
                data["mask"].permute(1, 2, 0).detach().cpu().numpy(), 3, axis=2
            ).astype(np.uint8),
            data,
        )
        rgb_norm = blend_rgb_norm(data["ori_image"], norm_orig, mask_orig)

        Image.fromarray(
            np.concatenate([data["ori_image"].astype(np.uint8), rgb_norm], axis=1)
        ).save(os.path.join(args.out_dir, cfg.name, f"png/{data['name']}_overlap.png"))
        smpl_obj = trimesh.Trimesh(
            in_tensor["smpl_verts"].detach().cpu()[0] * torch.tensor([1.0, -1.0, 1.0]),
            in_tensor["smpl_faces"].detach().cpu()[0],
            process=False,
            maintains_order=True,
        )
        smpl_obj.export(f"{args.out_dir}/{cfg.name}/obj/{data['name']}_smpl.obj")

        smpl_info = {
            'betas': optimed_betas,
            'pose': optimed_pose,
            'orient': optimed_orient,
            'trans': optimed_trans,
        }
        np.save(
            f"{args.out_dir}/{cfg.name}/obj/{data['name']}_smpl.npy",
            smpl_info,
            allow_pickle=True,
        )
        # ------------------------------------------------------------------------------------------------------------------
        # cloth optimization
        per_data_lst = []

        # cloth recon
        in_tensor.update(
            dataset.compute_vis_cmap(
                in_tensor["smpl_verts"][0], in_tensor["smpl_faces"][0]
            )
        )
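        # PaMIR conditions the implicit network on a voxelized SMPL volume,
        # so the voxel features are recomputed here from the just-optimized
        # body parameters before reconstruction.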
        if cfg.net.prior_type == "pamir":
            in_tensor.update(
                dataset.compute_voxel_verts(
                    optimed_pose,
                    optimed_orient,
                    optimed_betas,
                    optimed_trans,
                    data["scale"],
                )
            )

        with torch.no_grad():
            verts_pr, faces_pr, _ = model.test_single(in_tensor)

        recon_obj = trimesh.Trimesh(
            verts_pr, faces_pr, process=False, maintains_order=True
        )
        recon_obj.export(
            os.path.join(args.out_dir, cfg.name, f"obj/{data['name']}_recon.obj")
        )

        # Isotropic Explicit Remeshing for better geometry topology
        verts_refine, faces_refine = remesh(
            os.path.join(args.out_dir, cfg.name, f"obj/{data['name']}_recon.obj"),
            0.5,
            device,
        )
        # per-vertex local affine deformation of the remeshed surface
        mesh_pr = Meshes(verts_refine, faces_refine).to(device)
        local_affine_model = LocalAffine(
            mesh_pr.verts_padded().shape[1],
            mesh_pr.verts_padded().shape[0],
            mesh_pr.edges_packed(),
        ).to(device)
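        # LocalAffine assigns each vertex its own small affine transform
        # (R, t); the "stiffness" loss penalizes transforms that differ
        # across an edge and the "rigid" loss keeps each R close to a
        # rotation (det(R) = 1), matching the loss table defined above.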
        optimizer_cloth = torch.optim.Adam(
            [{'params': local_affine_model.parameters()}], lr=1e-4, amsgrad=True
        )
        scheduler_cloth = torch.optim.lr_scheduler.ReduceLROnPlateau(
            optimizer_cloth,
            mode="min",
            factor=0.1,
            verbose=0,
            min_lr=1e-5,
            patience=args.patience,
        )

        with torch.no_grad():
            per_loop_lst = []
            rotate_recon_lst = dataset.render.get_rgb_image(cam_ids=[0, 1, 2, 3])
            per_loop_lst.extend(rotate_recon_lst)
            per_data_lst.append(get_optim_grid_image(per_loop_lst, None, type="cloth"))
        final = None

        if args.loop_cloth > 0:

            loop_cloth = tqdm(range(args.loop_cloth))

            for i in loop_cloth:

                per_loop_lst = []

                optimizer_cloth.zero_grad()

                deformed_verts, stiffness, rigid = local_affine_model(
                    verts_refine.to(device), return_stiff=True
                )
                mesh_pr = mesh_pr.update_padded(deformed_verts)

                # losses for laplacian, edge, normal consistency
                update_mesh_shape_prior_losses(mesh_pr, losses)

                in_tensor["P_normal_F"], in_tensor["P_normal_B"] = dataset.render_normal(
                    mesh_pr.verts_padded(), mesh_pr.faces_padded()
                )

                diff_F_cloth = torch.abs(in_tensor["P_normal_F"] - in_tensor["normal_F"])
                diff_B_cloth = torch.abs(in_tensor["P_normal_B"] - in_tensor["normal_B"])

                losses["cloth"]["value"] = (diff_F_cloth + diff_B_cloth).mean()
                losses["stiffness"]["value"] = torch.mean(stiffness)
                losses["rigid"]["value"] = torch.mean(rigid)

                # Weighted sum of the losses
                cloth_loss = torch.tensor(0.0, requires_grad=True).to(device)
                pbar_desc = "Cloth Refinement --- "
                for k in losses.keys():
                    if k not in ["normal", "silhouette"] and losses[k]["weight"] > 0.0:
                        cloth_loss = cloth_loss + losses[k]["value"] * losses[k]["weight"]
                        pbar_desc += f"{k}: {losses[k]['value'] * losses[k]['weight']:.5f} | "
                pbar_desc += f"Total: {cloth_loss:.5f}"
                loop_cloth.set_description(pbar_desc)

                # update params
                cloth_loss.backward(retain_graph=True)
                optimizer_cloth.step()
                scheduler_cloth.step(cloth_loss)
                # for vis
                with torch.no_grad():
                    if i % args.vis_freq == 0:

                        rotate_recon_lst = dataset.render.get_rgb_image(cam_ids=[0, 1, 2, 3])

                        per_loop_lst.extend(
                            [
                                in_tensor["image"],
                                in_tensor["P_normal_F"],
                                in_tensor["normal_F"],
                                diff_F_cloth / 2.0,
                            ]
                        )
                        per_loop_lst.extend(
                            [
                                in_tensor["image"],
                                in_tensor["P_normal_B"],
                                in_tensor["normal_B"],
                                diff_B_cloth / 2.0,
                            ]
                        )
                        per_loop_lst.extend(rotate_recon_lst)
                        per_data_lst.append(
                            get_optim_grid_image(per_loop_lst, None, type="cloth")
                        )
            # gif for optimization
            per_data_lst[1].save(
                os.path.join(
                    args.out_dir, cfg.name, f"refinement/{data['name']}_cloth.gif"
                ),
                save_all=True,
                append_images=per_data_lst[2:],
                duration=500,
                loop=0,
            )

            if args.vis_freq == 1:
                image2vid(
                    per_data_lst,
                    os.path.join(
                        args.out_dir, cfg.name, f"refinement/{data['name']}_cloth.avi"
                    ),
                )
            final = trimesh.Trimesh(
                mesh_pr.verts_packed().detach().squeeze(0).cpu(),
                mesh_pr.faces_packed().detach().squeeze(0).cpu(),
                process=False,
                maintains_order=True,
            )
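            # Per-vertex colors are sampled from the input image via
            # query_color (see lib/common/render.py for how occluded
            # vertices are handled).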
            final_colors = query_color(
                mesh_pr.verts_packed().detach().squeeze(0).cpu(),
                mesh_pr.faces_packed().detach().squeeze(0).cpu(),
                in_tensor["image"],
                device=device,
            )
            final.visual.vertex_colors = final_colors
            final.export(f"{args.out_dir}/{cfg.name}/obj/{data['name']}_refine.obj")
        # always export the visualization png, regardless of cloth refinement
        per_data_lst[-1].save(
            os.path.join(args.out_dir, cfg.name, f"png/{data['name']}_cloth.png")
        )

        # export a self-rotated video only when requested
        if args.export_video:

            if final is not None:
                verts_lst = [verts_pr, final.vertices]
                faces_lst = [faces_pr, final.faces]
            else:
                verts_lst = [verts_pr]
                faces_lst = [faces_pr]

            # self-rotated video
            dataset.render.load_meshes(verts_lst, faces_lst)
            dataset.render.get_rendered_video(
                [data["ori_image"], rgb_norm],
                os.path.join(args.out_dir, cfg.name, f"vid/{data['name']}_cloth.mp4"),
            )
        # garment extraction from deepfashion images
        if args.seg_dir is not None:

            if final is not None:
                recon_obj = final.copy()

            os.makedirs(os.path.join(args.out_dir, cfg.name, "clothes"), exist_ok=True)
            os.makedirs(
                os.path.join(args.out_dir, cfg.name, "clothes", "info"), exist_ok=True
            )

            for seg in data['segmentations']:
                # These matrices work for PyMAF; unverified for the other hps types
                K = np.array([[ 1.0,  0.0,  0.0, 0.0],
                              [ 0.0,  1.0,  0.0, 0.0],
                              [ 0.0,  0.0, -0.5, 0.0],
                              [-0.0, -0.0,  0.5, 1.0]]).T
                R = np.array([[-1.0, 0.0,  0.0],
                              [ 0.0, 1.0,  0.0],
                              [ 0.0, 0.0, -1.0]])
                t = np.array([[-0.0, -0.0, 100.0]])
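                # (Presumably an orthographic-style projection with a fixed
                # camera 100 units down +Z; kept verbatim from the PyMAF
                # setup, as flagged in the comment above.)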
                clothing_obj = extract_cloth(recon_obj, seg, K, R, t, smpl_obj)
                if clothing_obj is not None:
                    cloth_type = seg['type'].replace(' ', '_')
                    cloth_info = {
                        'betas': optimed_betas,
                        'body_pose': optimed_pose,
                        'global_orient': optimed_orient,
                        'pose2rot': False,
                        'clothing_type': cloth_type,
                    }
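                    # NOTE: the dict holds live torch tensors, so unpickling
                    # it later requires torch (and CUDA, if they were on GPU).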
                    file_id = f"{data['name']}_{cloth_type}"

                    with open(
                        os.path.join(
                            args.out_dir, cfg.name, "clothes", "info", f"{file_id}_info.pkl"
                        ),
                        'wb',
                    ) as fp:
                        pickle.dump(cloth_info, fp)

                    clothing_obj.export(
                        os.path.join(args.out_dir, cfg.name, "clothes", f"{file_id}.obj")
                    )
                else:
                    print(
                        f"Unable to extract clothing of type {seg['type']} "
                        f"from image {data['name']}"
                    )