Spaces:

felixrosberg
/

face-swap

Running

App Files Files Community

felixrosberg committed on Feb 9, 2022

Commit

87d3df0

•

1 Parent(s): 1b7cc25

Update app.py

Browse files

Files changed (1) hide show

app.py +63 -59

app.py CHANGED Viewed

@@ -43,65 +43,69 @@ blend_mask_base = gaussian_filter(blend_mask_base, sigma=7)
 def run_inference(target, source):
-    source = np.array(source)
-    target = np.array(target)
-    # Prepare to load video
-    source_a = RetinaFace(np.expand_dims(source, axis=0)).numpy()[0]
-    source_h, source_w, _ = source.shape
-    source_lm = get_lm(source_a, source_w, source_h)
-    source_aligned = norm_crop(source, source_lm, image_size=256)
-    source_z = ArcFace.predict(np.expand_dims(tf.image.resize(source_aligned, [112, 112]) / 255.0, axis=0))
-    # read frame
-    im = target
-    im_h, im_w, _ = im.shape
-    im_shape = (im_w, im_h)
-    detection_scale = im_w // 640 if im_w > 640 else 1
-    faces = RetinaFace(np.expand_dims(cv2.resize(im,
-                                                 (im_w // detection_scale,
-                                                  im_h // detection_scale)), axis=0)).numpy()
-    total_img = im / 255.0
-    for annotation in faces:
-        lm_align = np.array([[annotation[4] * im_w, annotation[5] * im_h],
-                             [annotation[6] * im_w, annotation[7] * im_h],
-                             [annotation[8] * im_w, annotation[9] * im_h],
-                             [annotation[10] * im_w, annotation[11] * im_h],
-                             [annotation[12] * im_w, annotation[13] * im_h]],
-                            dtype=np.float32)
-        # align the detected face
-        M, pose_index = estimate_norm(lm_align, 256, "arcface", shrink_factor=1.0)
-        im_aligned = cv2.warpAffine(im, M, (256, 256), borderValue=0.0)
-        # face swap
-        changed_face_cage = G.predict([np.expand_dims((im_aligned - 127.5) / 127.5, axis=0),
-                                       source_z])
-        changed_face = (changed_face_cage[0] + 1) / 2
-        # get inverse transformation landmarks
-        transformed_lmk = transform_landmark_points(M, lm_align)
-        # warp image back
-        iM, _ = inverse_estimate_norm(lm_align, transformed_lmk, 256, "arcface", shrink_factor=1.0)
-        iim_aligned = cv2.warpAffine(changed_face, iM, im_shape, borderValue=0.0)
-        # blend swapped face with target image
-        blend_mask = cv2.warpAffine(blend_mask_base, iM, im_shape, borderValue=0.0)
-        blend_mask = np.expand_dims(blend_mask, axis=-1)
-        total_img = (iim_aligned * blend_mask + total_img * (1 - blend_mask))
-    if opt.compare:
-        total_img = np.concatenate((im / 255.0, total_img), axis=1)
-    total_img = np.clip(total_img, 0, 1)
-    total_img *= 255.0
-    total_img = total_img.astype('uint8')
-    return total_img
 description = "Performs subject agnostic identity transfer from a source face to all target faces."
 examples = [["elon_musk_example.jpg", "rick_astely_example.jpg"], ["10017.png", "9538.png"]]

 def run_inference(target, source):
+    try:
+        source = np.array(source)
+        target = np.array(target)
+        # Prepare to load video
+        source_a = RetinaFace(np.expand_dims(source, axis=0)).numpy()[0]
+        source_h, source_w, _ = source.shape
+        source_lm = get_lm(source_a, source_w, source_h)
+        source_aligned = norm_crop(source, source_lm, image_size=256)
+        source_z = ArcFace.predict(np.expand_dims(tf.image.resize(source_aligned, [112, 112]) / 255.0, axis=0))
+        # read frame
+        im = target
+        im_h, im_w, _ = im.shape
+        im_shape = (im_w, im_h)
+        detection_scale = im_w // 640 if im_w > 640 else 1
+        faces = RetinaFace(np.expand_dims(cv2.resize(im,
+                                                     (im_w // detection_scale,
+                                                      im_h // detection_scale)), axis=0)).numpy()
+        total_img = im / 255.0
+        for annotation in faces:
+            lm_align = np.array([[annotation[4] * im_w, annotation[5] * im_h],
+                                 [annotation[6] * im_w, annotation[7] * im_h],
+                                 [annotation[8] * im_w, annotation[9] * im_h],
+                                 [annotation[10] * im_w, annotation[11] * im_h],
+                                 [annotation[12] * im_w, annotation[13] * im_h]],
+                                dtype=np.float32)
+            # align the detected face
+            M, pose_index = estimate_norm(lm_align, 256, "arcface", shrink_factor=1.0)
+            im_aligned = cv2.warpAffine(im, M, (256, 256), borderValue=0.0)
+            # face swap
+            changed_face_cage = G.predict([np.expand_dims((im_aligned - 127.5) / 127.5, axis=0),
+                                           source_z])
+            changed_face = (changed_face_cage[0] + 1) / 2
+            # get inverse transformation landmarks
+            transformed_lmk = transform_landmark_points(M, lm_align)
+            # warp image back
+            iM, _ = inverse_estimate_norm(lm_align, transformed_lmk, 256, "arcface", shrink_factor=1.0)
+            iim_aligned = cv2.warpAffine(changed_face, iM, im_shape, borderValue=0.0)
+            # blend swapped face with target image
+            blend_mask = cv2.warpAffine(blend_mask_base, iM, im_shape, borderValue=0.0)
+            blend_mask = np.expand_dims(blend_mask, axis=-1)
+            total_img = (iim_aligned * blend_mask + total_img * (1 - blend_mask))
+        if opt.compare:
+            total_img = np.concatenate((im / 255.0, total_img), axis=1)
+        total_img = np.clip(total_img, 0, 1)
+        total_img *= 255.0
+        total_img = total_img.astype('uint8')
+        return total_img
+    except Exception as e:
+        print(e)
+        return None
 description = "Performs subject agnostic identity transfer from a source face to all target faces."
 examples = [["elon_musk_example.jpg", "rick_astely_example.jpg"], ["10017.png", "9538.png"]]