|
import os |
|
import cv2 |
|
import numpy as np |
|
from tqdm import tqdm |
|
from utils import scale_bbox_from_center |
|
import spaces |
|
|
|
detect_conditions = [ |
|
"best detection", |
|
"left most", |
|
"right most", |
|
"top most", |
|
"bottom most", |
|
"middle", |
|
"biggest", |
|
"smallest", |
|
] |
|
|
|
swap_options_list = [ |
|
"All Face", |
|
"Specific Face", |
|
"Age less than", |
|
"Age greater than", |
|
"All Male", |
|
"All Female", |
|
"Left Most", |
|
"Right Most", |
|
"Top Most", |
|
"Bottom Most", |
|
"Middle", |
|
"Biggest", |
|
"Smallest", |
|
] |
|
|
|
def get_single_face(faces, method="best detection"): |
|
total_faces = len(faces) |
|
if total_faces == 1: |
|
return faces[0] |
|
|
|
print(f"{total_faces} face detected. Using {method} face.") |
|
if method == "best detection": |
|
return sorted(faces, key=lambda face: face["det_score"])[-1] |
|
elif method == "left most": |
|
return sorted(faces, key=lambda face: face["bbox"][0])[0] |
|
elif method == "right most": |
|
return sorted(faces, key=lambda face: face["bbox"][0])[-1] |
|
elif method == "top most": |
|
return sorted(faces, key=lambda face: face["bbox"][1])[0] |
|
elif method == "bottom most": |
|
return sorted(faces, key=lambda face: face["bbox"][1])[-1] |
|
elif method == "middle": |
|
return sorted(faces, key=lambda face: ( |
|
(face["bbox"][0] + face["bbox"][2]) / 2 - 0.5) ** 2 + |
|
((face["bbox"][1] + face["bbox"][3]) / 2 - 0.5) ** 2)[len(faces) // 2] |
|
elif method == "biggest": |
|
return sorted(faces, key=lambda face: (face["bbox"][2] - face["bbox"][0]) * (face["bbox"][3] - face["bbox"][1]))[-1] |
|
elif method == "smallest": |
|
return sorted(faces, key=lambda face: (face["bbox"][2] - face["bbox"][0]) * (face["bbox"][3] - face["bbox"][1]))[0] |
|
|
|
|
|
|
|
def analyse_face(image, model, return_single_face=True, detect_condition="best detection", scale=1.0): |
|
faces = model.get(image) |
|
if scale != 1: |
|
for i, face in enumerate(faces): |
|
landmark = face['kps'] |
|
center = np.mean(landmark, axis=0) |
|
landmark = center + (landmark - center) * scale |
|
faces[i]['kps'] = landmark |
|
|
|
if not return_single_face: |
|
return faces |
|
|
|
return get_single_face(faces, method=detect_condition) |
|
|
|
|
|
def cosine_distance(a, b): |
|
a /= np.linalg.norm(a) |
|
b /= np.linalg.norm(b) |
|
return 1 - np.dot(a, b) |
|
|
|
|
|
|
|
def get_analysed_data(face_analyser, image_sequence, source_data, swap_condition="All face", detect_condition="left most", scale=1.0): |
|
if swap_condition != "Specific Face": |
|
source_path, age = source_data |
|
source_image = cv2.imread(source_path) |
|
analysed_source = analyse_face(source_image, face_analyser, return_single_face=True, detect_condition=detect_condition, scale=scale) |
|
else: |
|
analysed_source_specifics = [] |
|
source_specifics, threshold = source_data |
|
for source, specific in zip(*source_specifics): |
|
if source is None or specific is None: |
|
continue |
|
analysed_source = analyse_face(source, face_analyser, return_single_face=True, detect_condition=detect_condition, scale=scale) |
|
analysed_specific = analyse_face(specific, face_analyser, return_single_face=True, detect_condition=detect_condition, scale=scale) |
|
analysed_source_specifics.append([analysed_source, analysed_specific]) |
|
|
|
analysed_target_list = [] |
|
analysed_source_list = [] |
|
whole_frame_eql_list = [] |
|
num_faces_per_frame = [] |
|
|
|
total_frames = len(image_sequence) |
|
curr_idx = 0 |
|
for curr_idx, frame_path in tqdm(enumerate(image_sequence), total=total_frames, desc="Analysing face data"): |
|
frame = cv2.imread(frame_path) |
|
analysed_faces = analyse_face(frame, face_analyser, return_single_face=False, detect_condition=detect_condition, scale=scale) |
|
|
|
n_faces = 0 |
|
for analysed_face in analysed_faces: |
|
if swap_condition == "All Face": |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
elif swap_condition == "Age less than" and analysed_face["age"] < age: |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
elif swap_condition == "Age greater than" and analysed_face["age"] > age: |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
elif swap_condition == "All Male" and analysed_face["gender"] == 1: |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
elif swap_condition == "All Female" and analysed_face["gender"] == 0: |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
elif swap_condition == "Specific Face": |
|
for analysed_source, analysed_specific in analysed_source_specifics: |
|
distance = cosine_distance(analysed_specific["embedding"], analysed_face["embedding"]) |
|
if distance < threshold: |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
if swap_condition == "Left Most": |
|
analysed_face = get_single_face(analysed_faces, method="left most") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
elif swap_condition == "Right Most": |
|
analysed_face = get_single_face(analysed_faces, method="right most") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
elif swap_condition == "Top Most": |
|
analysed_face = get_single_face(analysed_faces, method="top most") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
elif swap_condition == "Bottom Most": |
|
analysed_face = get_single_face(analysed_faces, method="bottom most") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
elif swap_condition == "Middle": |
|
analysed_face = get_single_face(analysed_faces, method="middle") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
elif swap_condition == "Biggest": |
|
analysed_face = get_single_face(analysed_faces, method="biggest") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
elif swap_condition == "Smallest": |
|
analysed_face = get_single_face(analysed_faces, method="smallest") |
|
analysed_target_list.append(analysed_face) |
|
analysed_source_list.append(analysed_source) |
|
whole_frame_eql_list.append(frame_path) |
|
n_faces += 1 |
|
|
|
num_faces_per_frame.append(n_faces) |
|
|
|
return analysed_target_list, analysed_source_list, whole_frame_eql_list, num_faces_per_frame |
|
|