joshiayush committed on
Commit f5562ad · 1 Parent(s): 143c297

Refactor `Aligner` to support multiple cropped images at once
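This commit replaces the old per-image aligner API with a batch API: `aligner.align_image(img)` becomes `Aligner.align(imgs)`, which accepts a tuple of images and returns a list of aligned images, with `None` entries where no face was detected. A minimal before/after sketch (the crops below are illustrative stand-ins, not code from the repository):

import numpy as np
from face_recognition.aligner import Aligner

# Hypothetical face crops; in the app these come from the face detector.
crop_a = np.zeros((160, 160, 3), dtype=np.uint8)
crop_b = np.zeros((160, 160, 3), dtype=np.uint8)

aligner_obj = Aligner()   # previously: aligner()

# Old API (removed in this commit): one image per call.
# aligned_crop = aligner_obj.align_image(crop_a)

# New API: any number of images per call; the result is a list,
# with None wherever no face could be found.
aligned = aligner_obj.align((crop_a, crop_b))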
app/__init__.py CHANGED
@@ -4,19 +4,19 @@ from datetime import timedelta
 from face_detection import inference as fd
 from face_detection.helper import get_crops as fd_get_crops
 from face_recognition import inference as fr
-from face_recognition.aligner import aligner
+from face_recognition.aligner import Aligner
 from face_recognition import helper as fr_helper



-# face_detector=fd.face_detection("face_detection/Models/v1")
+face_detector=fd.face_detection("face_detection/Models/v1")
 # face_detector=fd.face_detection("face_detection/Models/mobilenet")
-face_detector=fd.face_detection("face_detection/Models/BestMap")
+# face_detector=fd.face_detection("face_detection/Models/BestMap")
 face_detector.square_preprocessing=fd.square_pad()
 # face_recognizer=fr.face_recognition("face_recognition/Models/v1")
 # face_recognizer=fr.face_recognition("face_recognition/Models/mobilenet_basic_lfw")
 face_recognizer=fr.face_recognition("face_recognition/Models/keras_mobilenet_emore_adamw")
-aligner_obj=aligner()
+aligner_obj=Aligner()

 # image_size=544
 # p_thres=0.7
app/demo/routes.py CHANGED
@@ -42,7 +42,7 @@ def load_settings(func):
     # we will set image_size inside routes

     # set face aligner settings
-    aligner_obj.face_mesh_images.min_detection_confidence=session["demo"]['settings']['a_thres']
+    aligner_obj.min_detection_confidence=session["demo"]['settings']['a_thres']

     # set face recognizer settings
     face_recognizer.thres=session["demo"]['settings']['d_thres']
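In the new class the detection threshold is a constructor argument (`min_detection_confidence`) inherited from MediaPipe's Face Mesh. MediaPipe solutions generally bake these thresholds into the solution graph when the object is created, so assigning `aligner_obj.min_detection_confidence` after construction may not change detection behaviour; if that turns out to be the case, one option is to build the aligner with the stored threshold instead. A sketch only (the `a_thres` value is illustrative):

from face_recognition.aligner import Aligner

a_thres = 0.5  # e.g. the value kept in session["demo"]['settings']['a_thres']
aligner_obj = Aligner(min_detection_confidence=a_thres)  # threshold applied at construction time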
face_detection/helper.py CHANGED
@@ -17,7 +17,7 @@ def get_crops(img,objs_found,aligner=None,resize:tuple=None):

         crop=img[ymin:ymax,xmin:xmax]
         if aligner is not None:
-            crop=aligner.align_image(crop)
+            crop=aligner.align((crop,))[0]
         if crop is None: continue
         if resize is not None:
             crop=square_maker(crop)
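Here each crop is still aligned one at a time, wrapped in a one-element tuple and unwrapped with `[0]`, so the existing `if crop is None: continue` check keeps working. Since `Aligner.align()` accepts any number of images, the same loop could also collect the crops first and align them in a single call. A sketch under that assumption (the helper below is illustrative, not part of the repository):

def align_crops(crops, aligner):
    """Align a batch of face crops in one call, dropping crops where no face was found."""
    aligned = aligner.align(tuple(crops))          # one call for the whole batch
    return [c for c in aligned if c is not None]   # None means no detectable face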
face_recognition/aligner.py CHANGED
@@ -9,72 +9,105 @@ import shutil



-class aligner:
-  def __init__(self,min_aligner_confidence=0.5):
-    mp_face_mesh = mp.solutions.face_mesh
-
-    self.face_mesh_images = mp_face_mesh.FaceMesh(static_image_mode=True, max_num_faces=1,
-                                                  min_detection_confidence=min_aligner_confidence)
-
-    mp_drawing = mp.solutions.drawing_utils
-    mp_drawing_styles = mp.solutions.drawing_styles
-    LEFT_EYE_INDEXES = list(set(itertools.chain(*mp_face_mesh.FACEMESH_LEFT_EYE)))
-    RIGHT_EYE_INDEXES = list(set(itertools.chain(*mp_face_mesh.FACEMESH_RIGHT_EYE)))
-
-    self.LEFT_EYE_INDEX=LEFT_EYE_INDEXES[7] # eye point index
-    self.RIGHT_EYE_INDEX=RIGHT_EYE_INDEXES[4] # eye point index
-
-  def align_image(self,img):
-
-    # start work
-    face_mesh_results = self.face_mesh_images.process(img)
-    if face_mesh_results.multi_face_landmarks!=None:
-      face_landmarks=face_mesh_results.multi_face_landmarks[0]
-
-      h,w,_=img.shape
-
-      points=[]
-
-
-      x_coord=int(np.clip(face_landmarks.landmark[self.LEFT_EYE_INDEX].x*w,0,w))
-      y_coord=int(np.clip(face_landmarks.landmark[self.LEFT_EYE_INDEX].y*h,0,h))
-      points.append((x_coord,y_coord))
-
-
-      x_coord=int(np.clip(face_landmarks.landmark[self.RIGHT_EYE_INDEX].x*w,0,w))
-      y_coord=int(np.clip(face_landmarks.landmark[self.RIGHT_EYE_INDEX].y*h,0,h))
-      points.append((x_coord,y_coord))
-
-      p0=np.array(points[0],dtype='float64')
-      p1=np.array(points[1],dtype='float64')
-
-
-      h=abs(p0[1]-p1[1])
-      w=abs(p0[0]-p1[0])
-
-      theta=np.arctan(h/w)
-
-      angle=(theta * 180) / np.pi
-
-      def get_direction(p0,p1):
-        if p0[0]<p1[0]:
-          if p0[1]<p1[1]:
-            direction=1
-          else:
-            direction=-1
-        else:
-          if p1[1]<p0[1]:
-            direction=1
-          else:
-            direction=-1
-        return direction
-
-      direction=get_direction(p0,p1)
-      angle=direction*angle
-      # print("rotated anticlockwise by :",angle,"angle")
-      new_img = PIL.Image.fromarray(img)
-      new_img = new_img.rotate(angle)
-
-      return np.array(new_img)
-    else:
-      return None
+class Aligner(mp.solutions.face_mesh.FaceMesh):
+  """Inherits from MediaPipe Face Mesh."""
+
+  def __init__(
+      self,
+      static_image_mode: bool = True,
+      max_num_faces: int = 1,
+      refine_landmarks: bool = False,
+      min_detection_confidence: float = 0.5,
+      min_tracking_confidence: float = 0.5
+  ):
+    """Initializes an Image Aligner object.
+
+    Unlike MediaPipe Face Mesh, `static_image_mode` defaults to `True` here, as
+    we only require static image manipulation.
+
+    Args:
+      static_image_mode: Whether to treat the input images as a batch of static
+        and possibly unrelated images, or a video stream.
+      max_num_faces: Maximum number of faces to detect.
+      refine_landmarks: Whether to further refine the landmark coordinates
+        around the eyes and lips, and output additional landmarks around the
+        irises. Defaults to False.
+      min_detection_confidence: Minimum confidence value ([0.0, 1.0]) for face
+        detection to be considered successful.
+      min_tracking_confidence: Minimum confidence value ([0.0, 1.0]) for the
+        face landmarks to be considered tracked successfully.
+    """
+    super().__init__(
+        static_image_mode=static_image_mode,
+        max_num_faces=max_num_faces,
+        refine_landmarks=refine_landmarks,
+        min_detection_confidence=min_detection_confidence,
+        min_tracking_confidence=min_tracking_confidence
+    )
+
+    self._left_eye_idx = list(
+        set(itertools.chain(*mp.solutions.face_mesh.FACEMESH_LEFT_EYE))
+    )[7]
+    self._right_eye_idx = list(
+        set(itertools.chain(*mp.solutions.face_mesh.FACEMESH_RIGHT_EYE))
+    )[4]
+
+  def _aligner(self, /, img: np.ndarray) -> np.ndarray:
+    """Private helper function to align the given image parallel to the x-axis.
+
+    This function creates a line between the left and right eye points and tries
+    to align that line parallel to the x-axis, thus aligning the complete image.
+
+    Args:
+      img: Image to align parallel to the x-axis.
+    """
+    fm = self.process(img)
+    if fm.multi_face_landmarks is None:
+      return None
+
+    points = []
+    h, w, _ = img.shape
+
+    face_landmarks = fm.multi_face_landmarks[0]
+
+    le_x_coord = int(
+        np.clip(face_landmarks.landmark[self._left_eye_idx].x * w, 0, w)
+    )
+    le_y_coord = int(
+        np.clip(face_landmarks.landmark[self._left_eye_idx].y * h, 0, h)
+    )
+    p0 = np.array((le_x_coord, le_y_coord), dtype=np.float64)
+
+    re_x_coord = int(
+        np.clip(face_landmarks.landmark[self._right_eye_idx].x * w, 0, w)
+    )
+    re_y_coord = int(
+        np.clip(face_landmarks.landmark[self._right_eye_idx].y * h, 0, h)
+    )
+    p1 = np.array((re_x_coord, re_y_coord), dtype=np.float64)
+
+    h = abs(p0[1] - p1[1])
+    w = abs(p0[0] - p1[0])
+
+    # Get the angle between the x-axis and the line joining the eye points.
+    theta = np.arctan(h / w)
+
+    angle = (theta * 180) / np.pi
+
+    if p0[0] < p1[0]:
+      direction = 1 if p0[1] < p1[1] else -1
+    else:
+      direction = 1 if p1[1] < p0[1] else -1
+
+    angle *= direction
+
+    img = PIL.Image.fromarray(img)
+    return np.array(img.rotate(angle))
+
+  def align(self, /, imgs: tuple[np.ndarray]) -> list[np.ndarray]:
+    """Aligns the given set of images parallel to the x-axis on the image plane.
+
+    Args:
+      imgs: Images to align parallel to the x-axis on the image plane.
+    """
+    return [self._aligner(img) for img in imgs]
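For reference, a minimal end-to-end sketch of the new `Aligner` (the image paths and the OpenCV loading are illustrative; MediaPipe's Face Mesh expects RGB input):

import cv2
from face_recognition.aligner import Aligner

aligner = Aligner(max_num_faces=1, min_detection_confidence=0.5)

# Hypothetical inputs; in the app the crops come from the face detector.
paths = ("face1.jpg", "face2.jpg")
imgs = [cv2.cvtColor(cv2.imread(p), cv2.COLOR_BGR2RGB) for p in paths]

aligned = aligner.align(tuple(imgs))   # one list out, None where no face was found
for i, out in enumerate(aligned):
    if out is not None:
        cv2.imwrite(f"aligned_{i}.jpg", cv2.cvtColor(out, cv2.COLOR_RGB2BGR))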
face_recognition/inference.py CHANGED
@@ -14,7 +14,7 @@ import importlib


 from face_recognition import config
-from face_recognition.aligner import aligner
+from face_recognition.aligner import Aligner



@@ -25,7 +25,7 @@ class face_recognition:
         self.model_config= importlib.import_module(config_file_path)
         # print(self.model_config)
         self.thres=thres if thres is not None else self.model_config.d_thres
-        self.aligner=aligner(min_aligner_confidence) if min_aligner_confidence is not None else aligner(config.min_aligner_confidence)
+        self.aligner=Aligner(min_detection_confidence=min_aligner_confidence) if min_aligner_confidence is not None else Aligner(min_detection_confidence=config.min_aligner_confidence)
         self.feature_extractor=tf.keras.models.load_model(model_path+"/model.h5",compile=False)


@@ -139,7 +139,7 @@ class face_recognition:

         crop_img=img[ymin:ymax,xmin:xmax]
         crop_img=cv2.resize(crop_img,[self.model_config.input_size,self.model_config.input_size])
-        crop_img=self.aligner.align_image(crop_img)
+        crop_img=self.aligner.align((crop_img,))[0]


         if crop_img is not None:
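Because `align()` now works on whole batches, the recognition path could also align every detected crop in one call before feature extraction rather than once per crop. A rough sketch with illustrative stand-ins (the zero arrays replace real resized crops, and the commented-out line marks where the loaded Keras model would be used):

import numpy as np
from face_recognition.aligner import Aligner

input_size = 112  # stand-in for model_config.input_size
crops = [np.zeros((input_size, input_size, 3), dtype=np.uint8) for _ in range(3)]

aligner = Aligner(min_detection_confidence=0.5)

# One call for all crops; keep only those where a face was found.
aligned = [c for c in aligner.align(tuple(crops)) if c is not None]
if aligned:
    batch = np.stack(aligned).astype(np.float32)
    # embeddings = face_recognizer.feature_extractor.predict(batch)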