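# Gradio demo app for facetorch: detects faces in an uploaded image and
# reports expression, action unit, deepfake, and embedding-similarity predictions.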
import os
import json
import argparse
import operator
from dataclasses import asdict
import gradio as gr
import torch
import torchvision
from typing import Tuple
from facetorch import FaceAnalyzer
from facetorch.datastruct import ImageData
from omegaconf import OmegaConf
from torch.nn.functional import cosine_similarity
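
# Read the path to the merged OmegaConf config from the command line.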
parser = argparse.ArgumentParser(description="App")
parser.add_argument(
    "--path-conf",
    type=str,
    default="config.merged.yml",
    help="Path to the config file",
)
args = parser.parse_args()

cfg = OmegaConf.load(args.path_conf)
analyzer = FaceAnalyzer(cfg.analyzer)
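
# Helpers for converting the analyzer's dataclass response into JSON-friendly types.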
def tensor_to_list(tensor: torch.Tensor) -> list:
    """Convert a tensor to a nested Python list."""
    return tensor.tolist()


def dataclass_to_dict(obj):
    """Convert a dataclass instance to a dict; return other objects unchanged."""
    if hasattr(obj, "__dataclass_fields__"):
        return asdict(obj)
    return obj

def image_data_to_json(image_data: ImageData) -> str:
    """Serialize an ImageData response to a pretty-printed JSON string."""
    # Convert tensors to lists so they are JSON serializable
    image_data.img = tensor_to_list(image_data.img)
    image_data.tensor = tensor_to_list(image_data.tensor)
    # Convert the dataclass to a dictionary
    data_dict = dataclass_to_dict(image_data)
    # Convert the dictionary to a JSON string
    return json.dumps(data_dict, indent=4, default=dataclass_to_dict)

def gen_sim_dict_str(response: ImageData, pred_name: str = "verify", index: int = 0) -> str:
    """Return cosine similarities between the face at `index` and every detected face,
    sorted from most to least similar."""
    if len(response.faces) > 0:
        base_emb = response.faces[index].preds[pred_name].logits
        sim_dict = {
            face.indx: cosine_similarity(base_emb, face.preds[pred_name].logits, dim=0).item()
            for face in response.faces
        }
        sim_dict_sort = dict(sorted(sim_dict.items(), key=operator.itemgetter(1), reverse=True))
        return str(sim_dict_sort)
    return ""
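
# Gradio callback: run the full analyzer pipeline and format each prediction for display.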
def inference(path_image: str) -> Tuple:
    response = analyzer.run(
        path_image=path_image,
        batch_size=cfg.batch_size,
        fix_img_size=cfg.fix_img_size,
        return_img_data=cfg.return_img_data,
        include_tensors=cfg.include_tensors,
        path_output=None,
    )
    pil_image = torchvision.transforms.functional.to_pil_image(response.img)
    fer_dict_str = str({face.indx: face.preds["fer"].label for face in response.faces})
    au_dict_str = str({face.indx: face.preds["au"].other["multi"] for face in response.faces})
    deepfake_dict_str = str({face.indx: face.preds["deepfake"].label for face in response.faces})
    response_str = image_data_to_json(response)
    sim_dict_str_embed = gen_sim_dict_str(response, pred_name="embed", index=0)
    sim_dict_str_verify = gen_sim_dict_str(response, pred_name="verify", index=0)
    # Clean up the input file once it has been processed
    os.remove(path_image)
    return (
        pil_image,
        fer_dict_str,
        au_dict_str,
        deepfake_dict_str,
        sim_dict_str_embed,
        sim_dict_str_verify,
        response_str,
    )

title = "Face Analysis"
description = "Demo of facetorch, a face analysis Python library that implements open-source pre-trained neural networks for face detection, representation learning, verification, expression recognition, action unit detection, deepfake detection, and 3D alignment. Try selecting one of the example images or upload your own. Feel free to duplicate this space and run it faster on a GPU instance. This work would not be possible without the researchers and engineers who trained the models (sources and credits can be found in the facetorch repository)."
article = "<p style='text-align: center'><a href='https://github.com/tomas-gajarsky/facetorch' style='text-align:center' target='_blank'>facetorch GitHub repository</a></p>"
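
# Wire the inference function into a Gradio interface: one image input, image and text outputs.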
demo = gr.Interface(
    inference,
    [gr.Image(label="Input", type="filepath")],
    [
        gr.Image(type="pil", label="Face Detection and 3D Landmarks"),
        gr.Textbox(label="Facial Expression Recognition"),
        gr.Textbox(label="Facial Action Unit Detection"),
        gr.Textbox(label="DeepFake Detection"),
        gr.Textbox(label="Cosine Similarity of Face Representation Embeddings"),
        gr.Textbox(label="Cosine Similarity of Face Verification Embeddings"),
        gr.Textbox(label="Response"),
    ],
    title=title,
    description=description,
    article=article,
    examples=[["./test5.jpg"], ["./test.jpg"], ["./test4.jpg"], ["./test8.jpg"], ["./test6.jpg"], ["./test3.jpg"], ["./test10.jpg"]],
)
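
# Process requests one at a time (Gradio 3.x queue API) and serve on all interfaces.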
demo.queue(concurrency_count=1, api_open=False)
demo.launch(server_name="0.0.0.0", server_port=7860, debug=True)