SwapFace2Pon

Running

App Files Files Community

Harisreedhar committed on Jul 1, 2023

Commit

7f475d2

•

1 Parent(s): 27c3130

Add soft erosion and fix face parsing video

Browse files

Files changed (4) hide show

app.py +40 -24
face_parsing/__init__.py +1 -1
face_parsing/swap.py +60 -17
swapper.py +3 -3

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ from moviepy.editor import VideoFileClip, ImageSequenceClip
 from face_analyser import detect_conditions, analyse_face
 from utils import trim_video, StreamerThread, ProcessBar, open_directory
-from face_parsing import init_parser, swap_regions, mask_regions, mask_regions_to_list
 from swapper import (
     swap_face,
     swap_face_with_condition,
@@ -59,8 +59,9 @@ MASK_INCLUDE = [
     "L-Lip",
     "U-Lip"
 ]
-MASK_EXCLUDE = ["R-Ear", "L-Ear", "Hair", "Hat"]
-MASK_BLUR = 25
 FACE_SWAPPER = None
 FACE_ANALYSER = None
@@ -84,6 +85,8 @@ else:
     USE_CUDA = False
     print("\n********** Running on CPU **********\n")
 ## ------------------------------ LOAD MODELS ------------------------------
@@ -114,7 +117,7 @@ def load_face_parser_model(name="./assets/pretrained_models/79999_iter.pth"):
     global FACE_PARSER
     path = os.path.join(os.path.abspath(os.path.dirname(__file__)), name)
     if FACE_PARSER is None:
-        FACE_PARSER = init_parser(name, use_cuda=USE_CUDA)
 load_face_analyser_model()
@@ -137,9 +140,10 @@ def process(
     distance,
     face_enhance,
     enable_face_parser,
-    mask_include,
-    mask_exclude,
-    mask_blur,
     *specifics,
 ):
     global WORKSPACE
@@ -196,14 +200,18 @@ def process(
     yield "### \n ⌛ Analysing Face...", *ui_before()
-    mi = mask_regions_to_list(mask_include)
-    me = mask_regions_to_list(mask_exclude)
     models = {
         "swap": FACE_SWAPPER,
         "enhance": FACE_ENHANCER,
         "enhance_sett": face_enhance,
         "face_parser": FACE_PARSER,
-        "face_parser_sett": (enable_face_parser, mi, me, int(mask_blur)),
     }
     ## ------------------------------ ANALYSE SOURCE & SPECIFIC ------------------------------
@@ -301,9 +309,9 @@ def process(
             if condition == "Specific Face":
                 swapped = swap_specific(
-                    frame,
-                    analysed_target,
                     analysed_source_specific,
                     models,
                     threshold=distance,
                 )
@@ -381,9 +389,9 @@ def process(
             if condition == "Specific Face":
                 swapped = swap_specific(
-                    target,
-                    analysed_target,
                     analysed_source_specific,
                     models,
                     threshold=distance,
                 )
@@ -636,16 +644,23 @@ with gr.Blocks(css=css) as interface:
                             label="Include",
                             interactive=True,
                         )
-                        mask_exclude = gr.Dropdown(
-                            mask_regions.keys(),
-                            value=MASK_EXCLUDE,
-                            multiselect=True,
-                            label="Exclude",
                             interactive=True,
                         )
-                        mask_blur = gr.Number(
-                            label="Blur Mask",
-                            value=MASK_BLUR,
                             minimum=0,
                             interactive=True,
                         )
@@ -827,8 +842,9 @@ with gr.Blocks(css=css) as interface:
         enable_face_enhance,
         enable_face_parser_mask,
         mask_include,
-        mask_exclude,
-        mask_blur,
         *src_specific_inputs,
     ]

 from face_analyser import detect_conditions, analyse_face
 from utils import trim_video, StreamerThread, ProcessBar, open_directory
+from face_parsing import init_parser, swap_regions, mask_regions, mask_regions_to_list, SoftErosion
 from swapper import (
     swap_face,
     swap_face_with_condition,
     "L-Lip",
     "U-Lip"
 ]
+MASK_SOFT_KERNEL = 17
+MASK_SOFT_ITERATIONS = 7
+MASK_BLUR_AMOUNT = 20
 FACE_SWAPPER = None
 FACE_ANALYSER = None
     USE_CUDA = False
     print("\n********** Running on CPU **********\n")
+device = "cuda" if USE_CUDA else "cpu"
 ## ------------------------------ LOAD MODELS ------------------------------
     global FACE_PARSER
     path = os.path.join(os.path.abspath(os.path.dirname(__file__)), name)
     if FACE_PARSER is None:
+        FACE_PARSER = init_parser(name, mode=device)
 load_face_analyser_model()
     distance,
     face_enhance,
     enable_face_parser,
+    mask_includes,
+    mask_soft_kernel,
+    mask_soft_iterations,
+    blur_amount,
     *specifics,
 ):
     global WORKSPACE
     yield "### \n ⌛ Analysing Face...", *ui_before()
+    includes = mask_regions_to_list(mask_includes)
+    if mask_soft_iterations > 0:
+        smooth_mask = SoftErosion(kernel_size=17, threshold=0.9, iterations=int(mask_soft_iterations)).to(device)
+    else:
+        smooth_mask = None
     models = {
         "swap": FACE_SWAPPER,
         "enhance": FACE_ENHANCER,
         "enhance_sett": face_enhance,
         "face_parser": FACE_PARSER,
+        "face_parser_sett": (enable_face_parser, includes, smooth_mask, int(blur_amount))
     }
     ## ------------------------------ ANALYSE SOURCE & SPECIFIC ------------------------------
             if condition == "Specific Face":
                 swapped = swap_specific(
                     analysed_source_specific,
+                    analysed_target,
+                    frame,
                     models,
                     threshold=distance,
                 )
             if condition == "Specific Face":
                 swapped = swap_specific(
                     analysed_source_specific,
+                    analysed_target,
+                    target,
                     models,
                     threshold=distance,
                 )
                             label="Include",
                             interactive=True,
                         )
+                        mask_soft_kernel = gr.Number(
+                            label="Soft Erode Kernel",
+                            value=MASK_SOFT_KERNEL,
+                            minimum=3,
                             interactive=True,
+                            visible = False
+                        )
+                        mask_soft_iterations = gr.Number(
+                            label="Soft Erode Iterations",
+                            value=MASK_SOFT_ITERATIONS,
+                            minimum=0,
+                            interactive=True,
                         )
+                        blur_amount = gr.Number(
+                            label="Mask Blur",
+                            value=MASK_BLUR_AMOUNT,
                             minimum=0,
                             interactive=True,
                         )
         enable_face_enhance,
         enable_face_parser_mask,
         mask_include,
+        mask_soft_kernel,
+        mask_soft_iterations,
+        blur_amount,
         *src_specific_inputs,
     ]

face_parsing/__init__.py CHANGED Viewed

	@@ -1 +1 @@
1	- from .swap import init_parser, swap_regions, mask_regions, mask_regions_to_list


1	+ from .swap import init_parser, swap_regions, mask_regions, mask_regions_to_list, SoftErosion

face_parsing/swap.py CHANGED Viewed

@@ -1,4 +1,6 @@
 import torch
 import torchvision.transforms as transforms
 import cv2
 import numpy as np
@@ -27,15 +29,44 @@ mask_regions = {
     "Hat":18
 }
-run_with_cuda = False
-def init_parser(pth_path, use_cuda=False):
-    global run_with_cuda
-    run_with_cuda = use_cuda
     n_classes = 19
     net = BiSeNet(n_classes=n_classes)
-    if run_with_cuda:
         net.cuda()
         net.load_state_dict(torch.load(pth_path))
     else:
@@ -55,8 +86,7 @@ def image_to_parsing(img, net):
     img = torch.unsqueeze(img, 0)
     with torch.no_grad():
-        if run_with_cuda:
-            img = img.cuda()
         out = net(img)[0]
         parsing = out.squeeze(0).cpu().numpy().argmax(0)
         return parsing
@@ -68,20 +98,33 @@ def get_mask(parsing, classes):
         res += parsing == val
     return res
-def swap_regions(source, target, net, includes=[1,2,3,4,5,10,11,12,13], excludes=[7,8], blur_size=25):
     parsing = image_to_parsing(source, net)
     if len(includes) == 0:
         return source, np.zeros_like(source)
     include_mask = get_mask(parsing, includes)
-    include_mask = np.repeat(np.expand_dims(include_mask.astype('float32'), axis=2), 3, 2)
-    if len(excludes) > 0:
-        exclude_mask = get_mask(parsing, excludes)
-        exclude_mask = np.repeat(np.expand_dims(exclude_mask.astype('float32'), axis=2), 3, 2)
-        include_mask -= exclude_mask
-    mask = 1 - cv2.GaussianBlur(include_mask.clip(0,1), (0, 0), blur_size)
-    result = (1 - mask) * cv2.resize(source, (512, 512)) + mask * cv2.resize(target, (512, 512))
-    result = cv2.resize(result.astype("float32"), (source.shape[1], source.shape[0]))
-    return result, mask.astype('float32')
 def mask_regions_to_list(values):
     out_ids = []

 import torch
+import torch.nn as nn
+import torch.nn.functional as F
 import torchvision.transforms as transforms
 import cv2
 import numpy as np
     "Hat":18
 }
+# Borrowed from simswap
+# https://github.com/neuralchen/SimSwap/blob/26c84d2901bd56eda4d5e3c5ca6da16e65dc82a6/util/reverse2original.py#L30
class SoftErosion(nn.Module):
    """Soften the edge of a mask by repeated convolution with a cone kernel.

    The kernel is a radially decreasing weight (largest at the centre,
    zero at the farthest corner) normalised to sum to one.

    Args:
        kernel_size: Side length of the square kernel; padding is
            ``kernel_size // 2``.
        threshold: Values at or above this after the final convolution are
            set to exactly 1.0.
        iterations: Number of convolution passes. All but the last pass take
            the element-wise minimum with the previous value.
    """

    def __init__(self, kernel_size=15, threshold=0.6, iterations=1):
        super().__init__()
        r = kernel_size // 2
        self.padding = r
        self.iterations = iterations
        self.threshold = threshold

        # Build the distance-from-centre grid by broadcasting instead of
        # torch.meshgrid, which warns when called without `indexing`.
        # The grid is symmetric, so the result is the same either way.
        offsets = torch.arange(0., kernel_size) - r
        dist = torch.sqrt(offsets[None, :] ** 2 + offsets[:, None] ** 2)
        kernel = dist.max() - dist
        kernel /= kernel.sum()
        kernel = kernel.view(1, 1, *kernel.shape)
        # A buffer follows the module across .to(device) without being a
        # trainable parameter.
        self.register_buffer('weight', kernel)

    def forward(self, x):
        """Return ``(soft_mask, hard_mask)`` for the input mask ``x``.

        ``soft_mask`` is 1.0 wherever the smoothed value reaches the
        threshold; the remaining values are rescaled by their maximum.
        ``hard_mask`` is the boolean ``smoothed >= threshold`` tensor.
        The kernel has a single channel, so ``x`` is expected to be
        ``(N, 1, H, W)`` -- TODO confirm against callers.
        """
        x = x.float()
        for _ in range(self.iterations - 1):
            x = torch.min(x, F.conv2d(x, weight=self.weight, groups=x.shape[1], padding=self.padding))
        x = F.conv2d(x, weight=self.weight, groups=x.shape[1], padding=self.padding)

        mask = x >= self.threshold
        x[mask] = 1.0

        # Rescale the sub-threshold values by their peak. Skip this when
        # there are none (max() of an empty tensor raises) or when the peak
        # is zero (an all-zero mask would otherwise become NaN via 0/0).
        soft = x[~mask]
        if soft.numel() > 0:
            peak = soft.max()
            if peak != 0:
                x[~mask] = soft / peak
        return x, mask
+device = "cpu"
+def init_parser(pth_path, mode="cpu"):
+    global device
+    device = mode
     n_classes = 19
     net = BiSeNet(n_classes=n_classes)
+    if device == "cuda":
         net.cuda()
         net.load_state_dict(torch.load(pth_path))
     else:
     img = torch.unsqueeze(img, 0)
     with torch.no_grad():
+        img = img.to(device)
         out = net(img)[0]
         parsing = out.squeeze(0).cpu().numpy().argmax(0)
         return parsing
         res += parsing == val
     return res
def swap_regions(source, target, net, smooth_mask, includes=[1,2,3,4,5,10,11,12,13], blur=10):
    """Blend the selected face-parsing regions of ``source`` over ``target``.

    Args:
        source: Image whose selected regions are kept (parsed with ``net``).
        target: Image used everywhere outside the selected regions.
        net: Face-parsing network passed to ``image_to_parsing``.
        smooth_mask: Optional callable (e.g. ``SoftErosion``) returning
            ``(soft_mask, hard_mask)``; ``None`` skips the softening step.
        includes: Parsing class ids to keep from ``source``. The default
            list is only read, never mutated.
        blur: Gaussian sigma applied to the mask; ``0`` disables blurring.

    Returns:
        A single ``uint8`` image with the size of ``source``. When
        ``includes`` is empty, ``source`` is returned unchanged.
    """
    # Nothing selected: return one image, as the normal path does. The
    # parsing network is not needed for this case.
    if len(includes) == 0:
        return source

    parsing = image_to_parsing(source, net)
    include_mask = get_mask(parsing, includes)
    mask = np.repeat(include_mask[:, :, np.newaxis], 3, axis=2).astype("float32")

    if smooth_mask is not None:
        mask_tensor = torch.from_numpy(mask.copy().transpose((2, 0, 1))).float().to(device)
        # The three channels are identical copies, so this doubles the mask
        # value before it is fed to the softening module.
        face_mask_tensor = mask_tensor[0] + mask_tensor[1]
        soft_face_mask_tensor, _ = smooth_mask(face_mask_tensor.unsqueeze_(0).unsqueeze_(0))
        soft_face_mask_tensor.squeeze_()
        mask = np.repeat(soft_face_mask_tensor.cpu().numpy()[:, :, np.newaxis], 3, axis=2)

    if blur > 0:
        mask = cv2.GaussianBlur(mask, (0, 0), blur)

    # Blend in [0, 1] float space at 512x512.
    # NOTE(review): assumes the parsing map is 512x512 so the mask lines up
    # with the resized images -- confirm against image_to_parsing.
    resized_source = cv2.resize((source/255).astype("float32"), (512, 512))
    resized_target = cv2.resize((target/255).astype("float32"), (512, 512))
    result = mask * resized_source + (1 - mask) * resized_target

    result = cv2.resize((result*255).astype("uint8"), (source.shape[1], source.shape[0]))
    return result
 def mask_regions_to_list(values):
     out_ids = []

swapper.py CHANGED Viewed

@@ -25,10 +25,10 @@ def swap_face(whole_img, target_face, source_face, models):
     aimg, _ = face_align.norm_crop2(whole_img, target_face.kps, image_size=image_size)
     if face_parser is not None:
-        fp_enable, mi, me, mb = models.get("face_parser_sett")
         if fp_enable:
-            bgr_fake, parsed_mask = swap_regions(
-                bgr_fake, aimg, face_parser, includes=mi, excludes=me, blur_size=mb
             )
     if fe_enable:

     aimg, _ = face_align.norm_crop2(whole_img, target_face.kps, image_size=image_size)
     if face_parser is not None:
+        fp_enable, includes, smooth_mask, blur_amount = models.get("face_parser_sett")
         if fp_enable:
+            bgr_fake = swap_regions(
+                bgr_fake, aimg, face_parser, smooth_mask, includes=includes, blur=blur_amount
             )
     if fe_enable: