# facetorch-app / app.py (3.89 kB)
# Commit 12089af (tomas-gajarsky): "Add valence arousal text box"
import os
import json
import argparse
import operator
import gradio as gr
import torchvision
from typing import Tuple, Dict
from facetorch import FaceAnalyzer
from facetorch.datastruct import ImageData
from omegaconf import OmegaConf
from torch.nn.functional import cosine_similarity
# Command-line interface: the only option is the path to the config file.
parser = argparse.ArgumentParser(description="App")
parser.add_argument(
    "--path-conf",
    default="config.merged.yml",
    type=str,
    help="Path to the config file",
)
args = parser.parse_args()

# Load the configuration and build the analyzer once, at module level.
cfg = OmegaConf.load(args.path_conf)
analyzer = FaceAnalyzer(cfg.analyzer)
def gen_sim_dict_str(response: ImageData, pred_name: str = "verify", index: int = 0) -> str:
    """Describe how similar every detected face is to one reference face.

    The reference embedding is ``response.faces[index].preds[pred_name].logits``.
    Every face's embedding (the reference face included) is compared to it
    with cosine similarity along dimension 0.

    Args:
        response: Analyzer output; only ``response.faces`` is read.
        pred_name: Key into each face's ``preds`` mapping that selects the
            embedding to compare.
        index: Position in ``response.faces`` of the reference face.

    Returns:
        ``str()`` of a dict mapping ``face.indx`` to its similarity, ordered
        from most to least similar, or ``""`` when there is no face at
        ``index`` (which includes the case of no detected faces).
    """
    faces = response.faces
    # One check covers both "no faces" and an index past the detected faces,
    # which would otherwise raise IndexError on the lookup below.
    if not -len(faces) <= index < len(faces):
        return ""

    base_emb = faces[index].preds[pred_name].logits
    sim_dict = {
        face.indx: cosine_similarity(base_emb, face.preds[pred_name].logits, dim=0).item()
        for face in faces
    }
    # Highest similarity first; dicts preserve insertion order.
    sim_dict_sort = dict(sorted(sim_dict.items(), key=operator.itemgetter(1), reverse=True))
    return str(sim_dict_sort)
def inference(path_image: str) -> Tuple:
    """Run the face analyzer on one image and format the results for the UI.

    Args:
        path_image: Path of the image file to analyze. The file is deleted
            before this function returns, whether or not the analysis
            succeeds.

    Returns:
        An 8-tuple, in this order:
        the PIL image converted from ``response.img``;
        ``str()`` of ``{face.indx: label}`` for the "fer" predictions;
        ``str()`` of ``{face.indx: other["multi"]}`` for the "au" predictions;
        ``str()`` of ``{face.indx: other}`` for the "va" predictions;
        ``str()`` of ``{face.indx: label}`` for the "deepfake" predictions;
        the similarity string for the "embed" embeddings relative to face 0;
        the similarity string for the "verify" embeddings relative to face 0;
        ``str(response)``.
    """
    try:
        response = analyzer.run(
            path_image=path_image,
            batch_size=cfg.batch_size,
            fix_img_size=cfg.fix_img_size,
            return_img_data=cfg.return_img_data,
            include_tensors=cfg.include_tensors,
            path_output=None,
        )

        pil_image = torchvision.transforms.functional.to_pil_image(response.img)

        fer_dict_str = str({face.indx: face.preds["fer"].label for face in response.faces})
        au_dict_str = str({face.indx: face.preds["au"].other["multi"] for face in response.faces})
        va_dict_str = str({face.indx: face.preds["va"].other for face in response.faces})
        deepfake_dict_str = str({face.indx: face.preds["deepfake"].label for face in response.faces})

        response_str = str(response)

        sim_dict_str_embed = gen_sim_dict_str(response, pred_name="embed", index=0)
        sim_dict_str_verify = gen_sim_dict_str(response, pred_name="verify", index=0)

        return (
            pil_image,
            fer_dict_str,
            au_dict_str,
            va_dict_str,
            deepfake_dict_str,
            sim_dict_str_embed,
            sim_dict_str_verify,
            response_str,
        )
    finally:
        # Clean up the input file even when analysis or formatting raised, so
        # failed requests do not leave files behind.
        try:
            os.remove(path_image)
        except FileNotFoundError:
            # Already gone (e.g. removed by another request for the same
            # path); nothing left to clean up.
            pass
# Static text passed to the interface below.
title = "Face Analysis"
description = "Demo of facetorch, a face analysis Python library that implements open-source pre-trained neural networks for face detection, representation learning, verification, expression recognition, action unit detection, deepfake detection, and 3D alignment. Try selecting one of the example images or upload your own. Feel free to duplicate this space and run it faster on a GPU instance. This work would not be possible without the researchers and engineers who trained the models (sources and credits can be found in the facetorch repository)."
article = "<p style='text-align: center'><a href='https://github.com/tomas-gajarsky/facetorch' style='text-align:center' target='_blank'>facetorch GitHub repository</a></p>"

# One image input (handed to `inference` as a file path) and eight outputs:
# an annotated image followed by seven text boxes.
demo = gr.Interface(
    fn=inference,
    inputs=[gr.Image(label="Input", type="filepath")],
    outputs=[
        gr.Image(type="pil", label="Face Detection and 3D Landmarks"),
        gr.Textbox(label="Facial Expression Recognition"),
        gr.Textbox(label="Facial Action Unit Detection"),
        gr.Textbox(label="Facial Valence Arousal"),
        gr.Textbox(label="DeepFake Detection"),
        gr.Textbox(label="Cosine similarity of Face Representation Embeddings"),
        gr.Textbox(label="Cosine similarity of Face Verification Embeddings"),
        gr.Textbox(label="Response"),
    ],
    title=title,
    description=description,
    article=article,
    examples=[
        ["./test5.jpg"],
        ["./test.jpg"],
        ["./test4.jpg"],
        ["./test8.jpg"],
        ["./test6.jpg"],
        ["./test3.jpg"],
        ["./test10.jpg"],
    ],
    concurrency_limit=10,
)

# Enable the request queue, then serve on all interfaces at port 7860.
demo.queue(api_open=True)
demo.launch(server_name="0.0.0.0", server_port=7860, debug=True)