import os
import sys
import numpy as np
import cv2
import time
from tqdm import tqdm
import multiprocessing
import glob

import mediapipe as mp
from mediapipe import solutions
from mediapipe.framework.formats import landmark_pb2
from mediapipe.tasks import python
from mediapipe.tasks.python import vision
from src.utils import face_landmark

CUR_DIR = os.path.dirname(__file__)


class LMKExtractor():
    def __init__(self, FPS=25):
        # Create a FaceLandmarker object in single-image mode.
        self.mode = mp.tasks.vision.FaceDetectorOptions.running_mode.IMAGE
        base_options = python.BaseOptions(model_asset_path=os.path.join(CUR_DIR, 'mp_models/face_landmarker_v2_with_blendshapes.task'))
        base_options.delegate = mp.tasks.BaseOptions.Delegate.CPU
        options = vision.FaceLandmarkerOptions(base_options=base_options,
                                               running_mode=self.mode,
                                               output_face_blendshapes=True,
                                               output_facial_transformation_matrixes=True,
                                               num_faces=1)
        self.detector = face_landmark.FaceLandmarker.create_from_options(options)
        self.last_ts = 0
        self.frame_ms = int(1000 / FPS)

        # det_base_options = python.BaseOptions(model_asset_path=os.path.join(CUR_DIR, 'mp_models/blaze_face_short_range.tflite'))
        # det_options = vision.FaceDetectorOptions(base_options=det_base_options)
        # self.det_detector = vision.FaceDetector.create_from_options(det_options)

    def __call__(self, img):
        frame = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        image = mp.Image(image_format=mp.ImageFormat.SRGB, data=frame)

        # t0 = time.time()
        # if self.mode == mp.tasks.vision.FaceDetectorOptions.running_mode.VIDEO:
        #     det_result = self.det_detector.detect(image)
        #     if len(det_result.detections) != 1:
        #         return None
        #     self.last_ts += self.frame_ms
        #     try:
        #         detection_result, mesh3d = self.detector.detect_for_video(image, timestamp_ms=self.last_ts)
        #     except:
        #         return None
        # elif self.mode == mp.tasks.vision.FaceDetectorOptions.running_mode.IMAGE:
        #     det_result = self.det_detector.detect(image)
        #     if len(det_result.detections) != 1:
        #         return None
        try:
            detection_result, mesh3d = self.detector.detect(image)
        except Exception:
            return None

        bs_list = detection_result.face_blendshapes
        if len(bs_list) == 1:
            bs = bs_list[0]
            bs_values = []
            for index in range(len(bs)):
                bs_values.append(bs[index].score)
            bs_values = bs_values[1:]  # drop the first (neutral) blendshape
            trans_mat = detection_result.facial_transformation_matrixes[0]
            face_landmarks_list = detection_result.face_landmarks
            face_landmarks = face_landmarks_list[0]
            lmks = []
            for index in range(len(face_landmarks)):
                x = face_landmarks[index].x
                y = face_landmarks[index].y
                z = face_landmarks[index].z
                lmks.append([x, y, z])
            lmks = np.array(lmks)  # normalized landmarks, shape (num_landmarks, 3)

            # vertex buffer stores (x, y, z, u, v) per vertex; keep only xyz
            lmks3d = np.array(mesh3d.vertex_buffer)
            lmks3d = lmks3d.reshape(-1, 5)[:, :3]
            # triangle indices shifted to 1-based (OBJ-style faces)
            mp_tris = np.array(mesh3d.index_buffer).reshape(-1, 3) + 1

            return {
                "lmks": lmks,
                "lmks3d": lmks3d,
                "trans_mat": trans_mat,
                "faces": mp_tris,
                "bs": bs_values
            }
        else:
            # print('multiple faces in the image: {}'.format(img_path))
            return None
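

# Minimal usage sketch (not part of the original module). It assumes the
# mp_models assets are present next to this file and that a sample image
# named 'test.jpg' (hypothetical) sits in the same directory; it only prints
# the shapes of the returned arrays.
if __name__ == "__main__":
    extractor = LMKExtractor()
    sample = cv2.imread(os.path.join(CUR_DIR, "test.jpg"))
    if sample is None:
        print("test.jpg not found; point cv2.imread at your own image to try the extractor")
    else:
        result = extractor(sample)
        if result is None:
            print("no single face detected")
        else:
            print("lmks:", result["lmks"].shape)      # normalized landmarks, (num_landmarks, 3)
            print("lmks3d:", result["lmks3d"].shape)  # 3D mesh vertices, (num_vertices, 3)
            print("faces:", result["faces"].shape)    # 1-based triangle indices, (num_tris, 3)
            print("blendshapes:", len(result["bs"]))  # expression scores (neutral removed)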