Spaces:
Running
Running
import os | |
import json | |
import argparse | |
import operator | |
import gradio as gr | |
import torchvision | |
from typing import Tuple, Dict | |
from facetorch import FaceAnalyzer | |
from facetorch.datastruct import ImageData | |
from omegaconf import OmegaConf | |
from torch.nn.functional import cosine_similarity | |
parser = argparse.ArgumentParser(description="App") | |
parser.add_argument( | |
"--path-conf", | |
type=str, | |
default="config.merged.yml", | |
help="Path to the config file", | |
) | |
args = parser.parse_args() | |
cfg = OmegaConf.load(args.path_conf) | |
analyzer = FaceAnalyzer(cfg.analyzer) | |
def gen_sim_dict_str(response: ImageData, pred_name: str = "verify", index: int = 0)-> str: | |
if len(response.faces) > 0: | |
base_emb = response.faces[index].preds[pred_name].logits | |
sim_dict = {face.indx: cosine_similarity(base_emb, face.preds[pred_name].logits, dim=0).item() for face in response.faces} | |
sim_dict_sort = dict(sorted(sim_dict.items(), key=operator.itemgetter(1),reverse=True)) | |
sim_dict_sort_str = str(sim_dict_sort) | |
else: | |
sim_dict_sort_str = "" | |
return sim_dict_sort_str | |
def inference(path_image: str) -> Tuple: | |
response = analyzer.run( | |
path_image=path_image, | |
batch_size=cfg.batch_size, | |
fix_img_size=cfg.fix_img_size, | |
return_img_data=cfg.return_img_data, | |
include_tensors=cfg.include_tensors, | |
path_output=None, | |
) | |
pil_image = torchvision.transforms.functional.to_pil_image(response.img) | |
fer_dict_str = str({face.indx: face.preds["fer"].label for face in response.faces}) | |
au_dict_str = str({face.indx: face.preds["au"].other["multi"] for face in response.faces}) | |
deepfake_dict_str = str({face.indx: face.preds["deepfake"].label for face in response.faces}) | |
response_str = str(response) | |
sim_dict_str_embed = gen_sim_dict_str(response, pred_name="embed", index=0) | |
sim_dict_str_verify = gen_sim_dict_str(response, pred_name="verify", index=0) | |
os.remove(path_image) | |
out_tuple = (pil_image, fer_dict_str, au_dict_str, deepfake_dict_str, sim_dict_str_embed, sim_dict_str_verify, response_str) | |
return out_tuple | |
title = "Face Analysis" | |
description = "Demo of facetorch, a face analysis Python library that implements open-source pre-trained neural networks for face detection, representation learning, verification, expression recognition, action unit detection, deepfake detection, and 3D alignment. Try selecting one of the example images or upload your own. Feel free to duplicate this space and run it faster on a GPU instance. This work would not be possible without the researchers and engineers who trained the models (sources and credits can be found in the facetorch repository)." | |
article = "<p style='text-align: center'><a href='https://github.com/tomas-gajarsky/facetorch' style='text-align:center' target='_blank'>facetorch GitHub repository</a></p>" | |
demo=gr.Interface( | |
inference, | |
[gr.Image(label="Input", type="filepath")], | |
[gr.Image(type="pil", label="Face Detection and 3D Landmarks"), | |
gr.Textbox(label="Facial Expression Recognition"), | |
gr.Textbox(label="Facial Action Unit Detection"), | |
gr.Textbox(label="DeepFake Detection"), | |
gr.Textbox(label="Cosine similarity of Face Representation Embeddings"), | |
gr.Textbox(label="Cosine similarity of Face Verification Embeddings"), | |
gr.Textbox(label="Response")], | |
title=title, | |
description=description, | |
article=article, | |
examples=[["./test5.jpg"], ["./test.jpg"], ["./test4.jpg"], ["./test8.jpg"], ["./test6.jpg"], ["./test3.jpg"], ["./test10.jpg"]], | |
) | |
demo.queue(concurrency_count=1, api_open=False) | |
demo.launch(server_name="0.0.0.0", server_port=7860, debug=True) | |