sanket kheni commited on
Commit
e20f0de
1 Parent(s): 635c654
.gitattributes CHANGED
@@ -1,34 +1,27 @@
1
  *.7z filter=lfs diff=lfs merge=lfs -text
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
 
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
  *.onnx filter=lfs diff=lfs merge=lfs -text
17
  *.ot filter=lfs diff=lfs merge=lfs -text
18
  *.parquet filter=lfs diff=lfs merge=lfs -text
19
  *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
  *.pt filter=lfs diff=lfs merge=lfs -text
23
  *.pth filter=lfs diff=lfs merge=lfs -text
24
  *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
  *.tflite filter=lfs diff=lfs merge=lfs -text
29
  *.tgz filter=lfs diff=lfs merge=lfs -text
30
- *.wasm filter=lfs diff=lfs merge=lfs -text
31
  *.xz filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
- *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
  *.7z filter=lfs diff=lfs merge=lfs -text
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bin.* filter=lfs diff=lfs merge=lfs -text
5
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
 
11
  *.model filter=lfs diff=lfs merge=lfs -text
12
  *.msgpack filter=lfs diff=lfs merge=lfs -text
 
 
13
  *.onnx filter=lfs diff=lfs merge=lfs -text
14
  *.ot filter=lfs diff=lfs merge=lfs -text
15
  *.parquet filter=lfs diff=lfs merge=lfs -text
16
  *.pb filter=lfs diff=lfs merge=lfs -text
 
 
17
  *.pt filter=lfs diff=lfs merge=lfs -text
18
  *.pth filter=lfs diff=lfs merge=lfs -text
19
  *.rar filter=lfs diff=lfs merge=lfs -text
 
20
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
21
  *.tar.* filter=lfs diff=lfs merge=lfs -text
22
  *.tflite filter=lfs diff=lfs merge=lfs -text
23
  *.tgz filter=lfs diff=lfs merge=lfs -text
 
24
  *.xz filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
.gitignore.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ g_model
2
+ flagged
3
+ arcface_model
4
+ retina_model
.idea/.gitignore ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ # Default ignored files
2
+ /shelf/
3
+ /workspace.xml
.idea/AFFA-face-swap.iml ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <module type="PYTHON_MODULE" version="4">
3
+ <component name="NewModuleRootManager">
4
+ <content url="file://$MODULE_DIR$" />
5
+ <orderEntry type="jdk" jdkName="Python 3.8 (py38)" jdkType="Python SDK" />
6
+ <orderEntry type="sourceFolder" forTests="false" />
7
+ </component>
8
+ <component name="PyDocumentationSettings">
9
+ <option name="format" value="PLAIN" />
10
+ <option name="myDocStringFormat" value="Plain" />
11
+ </component>
12
+ <component name="TestRunnerService">
13
+ <option name="PROJECT_TEST_RUNNER" value="pytest" />
14
+ </component>
15
+ </module>
.idea/inspectionProfiles/Project_Default.xml ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <component name="InspectionProjectProfileManager">
2
+ <profile version="1.0">
3
+ <option name="myName" value="Project Default" />
4
+ <inspection_tool class="PyPackageRequirementsInspection" enabled="true" level="WARNING" enabled_by_default="true">
5
+ <option name="ignoredPackages">
6
+ <value>
7
+ <list size="3">
8
+ <item index="0" class="java.lang.String" itemvalue="ipython" />
9
+ <item index="1" class="java.lang.String" itemvalue="Cython" />
10
+ <item index="2" class="java.lang.String" itemvalue="tensorflow-gpu" />
11
+ </list>
12
+ </value>
13
+ </option>
14
+ </inspection_tool>
15
+ <inspection_tool class="PyPep8Inspection" enabled="true" level="WEAK WARNING" enabled_by_default="true">
16
+ <option name="ignoredErrors">
17
+ <list>
18
+ <option value="E402" />
19
+ </list>
20
+ </option>
21
+ </inspection_tool>
22
+ <inspection_tool class="PyPep8NamingInspection" enabled="true" level="WEAK WARNING" enabled_by_default="true">
23
+ <option name="ignoredErrors">
24
+ <list>
25
+ <option value="N806" />
26
+ <option value="N812" />
27
+ </list>
28
+ </option>
29
+ </inspection_tool>
30
+ <inspection_tool class="PyUnresolvedReferencesInspection" enabled="true" level="WARNING" enabled_by_default="true">
31
+ <option name="ignoredIdentifiers">
32
+ <list>
33
+ <option value="torch.backends.cudnn" />
34
+ </list>
35
+ </option>
36
+ </inspection_tool>
37
+ </profile>
38
+ </component>
.idea/inspectionProfiles/profiles_settings.xml ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ <component name="InspectionProjectProfileManager">
2
+ <settings>
3
+ <option name="USE_PROJECT_PROFILE" value="false" />
4
+ <version value="1.0" />
5
+ </settings>
6
+ </component>
.idea/misc.xml ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.8 (py38)" project-jdk-type="Python SDK" />
4
+ </project>
.idea/modules.xml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="ProjectModuleManager">
4
+ <modules>
5
+ <module fileurl="file://$PROJECT_DIR$/.idea/AFFA-face-swap.iml" filepath="$PROJECT_DIR$/.idea/AFFA-face-swap.iml" />
6
+ </modules>
7
+ </component>
8
+ </project>
.idea/vcs.xml ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="VcsDirectoryMappings">
4
+ <mapping directory="$PROJECT_DIR$" vcs="Git" />
5
+ <mapping directory="$PROJECT_DIR$/arcface_model" vcs="Git" />
6
+ <mapping directory="$PROJECT_DIR$/g_model" vcs="Git" />
7
+ <mapping directory="$PROJECT_DIR$/retina_model" vcs="Git" />
8
+ </component>
9
+ </project>
README.md CHANGED
@@ -1,12 +1,46 @@
1
  ---
2
- title: Powerswp
3
- emoji: 🌖
4
- colorFrom: red
5
- colorTo: yellow
6
  sdk: gradio
7
- sdk_version: 3.14.0
8
  app_file: app.py
9
  pinned: false
 
10
  ---
11
 
12
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ title: Face Swap
3
+ emoji: 🧙🧙🧙🧙🧙🧙🧙🧙
4
+ colorFrom: purple
5
+ colorTo: green
6
  sdk: gradio
 
7
  app_file: app.py
8
  pinned: false
9
+ license: cc-by-nc-sa-4.0
10
  ---
11
 
12
+ # Configuration
13
+
14
+ `title`: _string_
15
+ Display title for the Space
16
+
17
+ `emoji`: _string_
18
+ Space emoji (emoji-only character allowed)
19
+
20
+ `colorFrom`: _string_
21
+ Color for Thumbnail gradient (red, yellow, green, blue, indigo, purple, pink, gray)
22
+
23
+ `colorTo`: _string_
24
+ Color for Thumbnail gradient (red, yellow, green, blue, indigo, purple, pink, gray)
25
+
26
+ `sdk`: _string_
27
+ Can be either `gradio`, `streamlit`, or `static`
28
+
29
+ `sdk_version` : _string_
30
+ Only applicable for `streamlit` SDK.
31
+ See [doc](https://hf.co/docs/hub/spaces) for more info on supported versions.
32
+
33
+ `app_file`: _string_
34
+ Path to your main application file (which contains either `gradio` or `streamlit` Python code, or `static` html code).
35
+ Path is relative to the root of the repository.
36
+
37
+ `models`: _List[string]_
38
+ HF model IDs (like "gpt2" or "deepset/roberta-base-squad2") used in the Space.
39
+ Will be parsed automatically from your code if not specified here.
40
+
41
+ `datasets`: _List[string]_
42
+ HF dataset IDs (like "common_voice" or "oscar-corpus/OSCAR-2109") used in the Space.
43
+ Will be parsed automatically from your code if not specified here.
44
+
45
+ `pinned`: _boolean_
46
+ Whether the Space stays on top of your list.
app.py ADDED
@@ -0,0 +1,216 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio
2
+ from huggingface_hub import Repository
3
+ import os
4
+
5
+ from utils.utils import norm_crop, estimate_norm, inverse_estimate_norm, transform_landmark_points, get_lm
6
+ from networks.layers import AdaIN, AdaptiveAttention
7
+ from tensorflow_addons.layers import InstanceNormalization
8
+ import numpy as np
9
+ import cv2
10
+ from scipy.ndimage import gaussian_filter
11
+
12
+ from tensorflow.keras.models import load_model
13
+ from options.swap_options import SwapOptions
14
+
15
+ # .
16
+ token = os.environ['model_fetch']
17
+
18
+ opt = SwapOptions().parse()
19
+
20
+ retina_repo = Repository(local_dir="retina_model", clone_from="felixrosberg/retinaface_resnet50",
21
+ private=True, use_auth_token=token, git_user="felixrosberg")
22
+
23
+ from retina_model.models import *
24
+
25
+ RetinaFace = load_model("retina_model/retinaface_res50.h5",
26
+ custom_objects={"FPN": FPN,
27
+ "SSH": SSH,
28
+ "BboxHead": BboxHead,
29
+ "LandmarkHead": LandmarkHead,
30
+ "ClassHead": ClassHead})
31
+
32
+ arc_repo = Repository(local_dir="arcface_model", clone_from="felixrosberg/arcface_tf",
33
+ private=True, use_auth_token=token)
34
+ ArcFace = load_model("arcface_model/arc_res50.h5")
35
+ ArcFaceE = load_model("arcface_model/arc_res50e.h5")
36
+
37
+ g_repo = Repository(local_dir="g_model_c_hq", clone_from="felixrosberg/affa_config_c_hq",
38
+ private=True, use_auth_token=token)
39
+ G = load_model("g_model_c_hq/generator_t_28.h5", custom_objects={"AdaIN": AdaIN,
40
+ "AdaptiveAttention": AdaptiveAttention,
41
+ "InstanceNormalization": InstanceNormalization})
42
+
43
+ r_repo = Repository(local_dir="reconstruction_attack", clone_from="felixrosberg/reconstruction_attack",
44
+ private=True, use_auth_token=token)
45
+ R = load_model("reconstruction_attack/reconstructor_42.h5", custom_objects={"AdaIN": AdaIN,
46
+ "AdaptiveAttention": AdaptiveAttention,
47
+ "InstanceNormalization": InstanceNormalization})
48
+
49
+ permuter_repo = Repository(local_dir="identity_permuter", clone_from="felixrosberg/identitypermuter",
50
+ private=True, use_auth_token=token, git_user="felixrosberg")
51
+
52
+ from identity_permuter.id_permuter import identity_permuter
53
+
54
+ IDP = identity_permuter(emb_size=32, min_arg=False)
55
+ IDP.load_weights("identity_permuter/id_permuter.h5")
56
+
57
+ blend_mask_base = np.zeros(shape=(256, 256, 1))
58
+ blend_mask_base[80:244, 32:224] = 1
59
+ blend_mask_base = gaussian_filter(blend_mask_base, sigma=7)
60
+
61
+
62
def run_inference(target, source, slider, adv_slider, settings):
    """Run the face-swap / anonymization pipeline on a single target image.

    For every face detected in ``target``, aligns it to 256x256, builds an
    identity embedding (from ``source``, from the identity permuter, or from
    the encoder, depending on ``settings``), generates a swapped face and
    blends it back into the original frame.

    :param target: image whose faces get replaced (PIL image / array).
    :param source: image supplying the identity (ignored when "anonymize"
        is selected).
    :param slider: anonymization ratio in percent (0-100).
    :param adv_slider: adversarial defense strength in percent (0-100).
    :param settings: collection of option strings; recognized values are
        "compare", "anonymize", "reconstruction attack",
        "adversarial defense".
    :return: uint8 result image, or None if any exception occurred
        (errors are printed, not raised).
    """
    try:
        source = np.array(source)
        target = np.array(target)

        # Prepare to load video
        if "anonymize" not in settings:
            # Detect the source face and extract its ArcFace identity vector.
            source_a = RetinaFace(np.expand_dims(source, axis=0)).numpy()[0]
            source_h, source_w, _ = source.shape
            source_lm = get_lm(source_a, source_w, source_h)
            source_aligned = norm_crop(source, source_lm, image_size=256)
            source_z = ArcFace.predict(np.expand_dims(tf.image.resize(source_aligned, [112, 112]) / 255.0, axis=0))
        else:
            source_z = None

        # read frame
        im = target
        im_h, im_w, _ = im.shape
        im_shape = (im_w, im_h)

        # Downscale wide frames before detection to keep RetinaFace input near 640 px.
        detection_scale = im_w // 640 if im_w > 640 else 1

        faces = RetinaFace(np.expand_dims(cv2.resize(im,
                                                     (im_w // detection_scale,
                                                      im_h // detection_scale)), axis=0)).numpy()

        total_img = im / 255.0
        for annotation in faces:
            # Annotation slots 4..13 hold the five landmark (x, y) pairs in
            # normalized coordinates — scale back to pixel space.
            lm_align = np.array([[annotation[4] * im_w, annotation[5] * im_h],
                                 [annotation[6] * im_w, annotation[7] * im_h],
                                 [annotation[8] * im_w, annotation[9] * im_h],
                                 [annotation[10] * im_w, annotation[11] * im_h],
                                 [annotation[12] * im_w, annotation[13] * im_h]],
                                dtype=np.float32)

            # align the detected face; pixels are mapped to [-1, 1]
            M, pose_index = estimate_norm(lm_align, 256, "arcface", shrink_factor=1.0)
            im_aligned = (cv2.warpAffine(im, M, (256, 256), borderValue=0.0) - 127.5) / 127.5

            if "adversarial defense" in settings:
                # FGSM-style perturbation: one signed-gradient step that
                # degrades the reconstructor R's output on this face.
                eps = adv_slider / 200
                X = tf.convert_to_tensor(np.expand_dims(im_aligned, axis=0))
                with tf.GradientTape() as tape:
                    tape.watch(X)

                    X_z = ArcFaceE(tf.image.resize(X * 0.5 + 0.5, [112, 112]))
                    output = R([X, X_z])

                    loss = tf.reduce_mean(tf.abs(0 - output))

                gradient = tf.sign(tape.gradient(loss, X))

                adv_x = X + eps * gradient
                im_aligned = tf.clip_by_value(adv_x, -1, 1)[0]

            if "anonymize" in settings and "reconstruction attack" not in settings:
                """source_z = ArcFace.predict(np.expand_dims(tf.image.resize(im_aligned, [112, 112]) / 255.0, axis=0))
                anon_ratio = int(512 * (slider / 100))
                anon_vector = np.ones(shape=(1, 512))
                anon_vector[:, :anon_ratio] = -1
                np.random.shuffle(anon_vector)
                source_z *= anon_vector"""

                # Blend the permuted identity with the original one; slider
                # controls how far from the target identity we move.
                slider_weight = slider / 100

                target_z = ArcFace.predict(np.expand_dims(tf.image.resize(im_aligned, [112, 112]) * 0.5 + 0.5, axis=0))
                source_z = IDP.predict(target_z)

                source_z = slider_weight * source_z + (1 - slider_weight) * target_z

            if "reconstruction attack" in settings:
                source_z = ArcFaceE.predict(np.expand_dims(tf.image.resize(im_aligned, [112, 112]) * 0.5 + 0.5, axis=0))

            # face swap
            if "reconstruction attack" not in settings:
                # Generate the swapped face; outputs are in [-1, 1], map back to [0, 1].
                changed_face_cage = G.predict([np.expand_dims(im_aligned, axis=0),
                                               source_z])
                changed_face = changed_face_cage[0] * 0.5 + 0.5

                # get inverse transformation landmarks
                transformed_lmk = transform_landmark_points(M, lm_align)

                # warp image back
                iM, _ = inverse_estimate_norm(lm_align, transformed_lmk, 256, "arcface", shrink_factor=1.0)
                iim_aligned = cv2.warpAffine(changed_face, iM, im_shape, borderValue=0.0)

                # blend swapped face with target image
                blend_mask = cv2.warpAffine(blend_mask_base, iM, im_shape, borderValue=0.0)
                blend_mask = np.expand_dims(blend_mask, axis=-1)
                total_img = (iim_aligned * blend_mask + total_img * (1 - blend_mask))
            else:
                # Same warp-back/blend path, but using the reconstructor R
                # instead of the generator G.
                changed_face_cage = R.predict([np.expand_dims(im_aligned, axis=0),
                                               source_z])
                changed_face = changed_face_cage[0] * 0.5 + 0.5

                # get inverse transformation landmarks
                transformed_lmk = transform_landmark_points(M, lm_align)

                # warp image back
                iM, _ = inverse_estimate_norm(lm_align, transformed_lmk, 256, "arcface", shrink_factor=1.0)
                iim_aligned = cv2.warpAffine(changed_face, iM, im_shape, borderValue=0.0)

                # blend swapped face with target image
                blend_mask = cv2.warpAffine(blend_mask_base, iM, im_shape, borderValue=0.0)
                blend_mask = np.expand_dims(blend_mask, axis=-1)
                total_img = (iim_aligned * blend_mask + total_img * (1 - blend_mask))

        if "compare" in settings:
            # Show original and result side by side.
            total_img = np.concatenate((im / 255.0, total_img), axis=1)

        total_img = np.clip(total_img, 0, 1)
        total_img *= 255.0
        total_img = total_img.astype('uint8')

        return total_img
    except Exception as e:
        # Best-effort UI behavior: log the error and return None so gradio
        # shows an empty output instead of crashing.
        print(e)
        return None
180
+
181
+
182
+ description = "Performs subject agnostic identity transfer from a source face to all target faces. \n\n" \
183
+ "Implementation and demo of FaceDancer, accepted to WACV 2023. \n\n" \
184
+ "Pre-print: https://arxiv.org/abs/2210.10473 \n\n" \
185
+ "Code: https://github.com/felixrosberg/FaceDancer \n\n" \
186
+ "\n\n" \
187
+ "Options:\n\n" \
188
+ "-Compare returns the target image concatenated with the results.\n\n" \
189
+ "-Anonymize will ignore the source image and perform an identity permutation of target faces.\n\n" \
190
+ "-Reconstruction attack will attempt to invert the face swap or the anonymization.\n\n" \
191
+ "-Adversarial defense will add a permutation noise that disrupts the reconstruction attack.\n\n" \
192
+ "NOTE: There is no guarantees with the anonymization process currently.\n\n" \
193
+ "NOTE: source image with too high resolution may not work properly!"
194
+ examples = [["assets/rick.jpg", "assets/musk.jpg", 100, 10, ["compare"]],
195
+ ["assets/musk.jpg", "assets/musk.jpg", 100, 10, ["anonymize"]]]
196
+ article = """
197
+ Demo is based of recent research from my Ph.D work. Results expects to be published in the coming months.
198
+ """
199
+
200
+ iface = gradio.Interface(run_inference,
201
+ [gradio.inputs.Image(shape=None, label='Target'),
202
+ gradio.inputs.Image(shape=None, label='Source'),
203
+ gradio.inputs.Slider(0, 100, default=100, label="Anonymization ratio (%)"),
204
+ gradio.inputs.Slider(0, 100, default=100, label="Adversarial defense ratio (%)"),
205
+ gradio.inputs.CheckboxGroup(["compare",
206
+ "anonymize",
207
+ "reconstruction attack",
208
+ "adversarial defense"],
209
+ label='Options')],
210
+ gradio.outputs.Image(),
211
+ title="Face Swap",
212
+ description=description,
213
+ examples=examples,
214
+ article=article,
215
+ layout="vertical")
216
+ iface.launch()
assets/girl_0.png ADDED
assets/girl_1.png ADDED
assets/musk.jpg ADDED
assets/rick.jpg ADDED
networks/__pycache__/layers.cpython-37.pyc ADDED
Binary file (69.1 kB). View file
 
networks/__pycache__/layers.cpython-38.pyc ADDED
Binary file (2.12 kB). View file
 
networks/layers.py ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import tensorflow as tf
2
+ from tensorflow.keras.layers import Layer, Dense
3
+
4
+
5
def sin_activation(x, omega=30):
    """SIREN-style sine activation: element-wise sin(omega * x).

    :param x: input tensor.
    :param omega: frequency multiplier applied before the sine.
    """
    scaled = omega * x
    return tf.math.sin(scaled)
7
+
8
+
9
class AdaIN(Layer):
    """Adaptive modulation layer in the AdaIN style.

    Predicts a per-channel scale (``ys``) and bias (``yb``) from a style
    vector ``w`` via two Dense heads and applies ``ys * x + yb`` to the
    feature map ``x``. NOTE(review): despite the name, no normalization of
    ``x`` happens here — only the learned affine modulation.
    """

    def __init__(self, **kwargs):
        super(AdaIN, self).__init__(**kwargs)

    def build(self, input_shapes):
        # input_shapes: [shape of x, shape of w]; assumes x is
        # channels-last and w is (batch, w_dim) — confirm with callers.
        x_shape = input_shapes[0]
        w_shape = input_shapes[1]

        self.w_channels = w_shape[-1]
        self.x_channels = x_shape[-1]

        # Two dense heads: one for the scale, one for the bias.
        self.dense_1 = Dense(self.x_channels)
        self.dense_2 = Dense(self.x_channels)

    def call(self, inputs):
        x, w = inputs
        # Reshape to (batch, 1, 1, C) so the modulation broadcasts over
        # the spatial dimensions of x.
        ys = tf.reshape(self.dense_1(w), (-1, 1, 1, self.x_channels))
        yb = tf.reshape(self.dense_2(w), (-1, 1, 1, self.x_channels))
        return ys * x + yb

    def get_config(self):
        # Channel counts are re-derived in build(), so they are not
        # serialized here (kept commented out intentionally).
        config = {
            #'w_channels': self.w_channels,
            #'x_channels': self.x_channels
        }
        base_config = super(AdaIN, self).get_config()
        return dict(list(base_config.items()) + list(config.items()))
36
+
37
+
38
class AdaptiveAttention(Layer):
    """Mask-driven blend of two feature maps.

    Given inputs ``[m, a, i]``, returns the per-element convex combination
    ``(1 - m) * a + m * i``: where the mask ``m`` is 1 the ``i`` branch is
    taken, where it is 0 the ``a`` branch is taken.
    """

    def __init__(self, **kwargs):
        super(AdaptiveAttention, self).__init__(**kwargs)

    def call(self, inputs):
        mask, attributes, identity = inputs
        blended = (1 - mask) * attributes + mask * identity
        return blended

    def get_config(self):
        # Stateless layer: nothing beyond the base config to serialize.
        return super(AdaptiveAttention, self).get_config()
options/__pycache__/swap_options.cpython-37.pyc ADDED
Binary file (6.21 kB). View file
 
options/__pycache__/swap_options.cpython-38.pyc ADDED
Binary file (1.65 kB). View file
 
options/swap_options.py ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import argparse
2
+
3
+
4
class SwapOptions:
    """Command-line options for the face-swap demo.

    Typical usage: ``opt = SwapOptions().parse()``. Argument registration
    is lazy — it happens on the first ``parse()`` call.
    """

    def __init__(self):
        self.parser = argparse.ArgumentParser()
        self.initialized = False

    def initialize(self):
        """Register all command-line arguments on the parser."""
        # paths (data, models, etc...)
        self.parser.add_argument('--arcface_path', type=str,
                                 default="arcface_model/arcface/arc_res50.h5",
                                 help='path to arcface model. Used to extract identity from source.')

        # Video/Image necessary models
        self.parser.add_argument('--retina_path', type=str,
                                 default="retinaface/retinaface_res50.h5",
                                 help='path to retinaface model.')
        # NOTE(review): argparse `type=bool` treats ANY non-empty string
        # (including "False") as True; use action='store_true' if this flag
        # ever needs to be toggled from the command line.
        self.parser.add_argument('--compare', type=bool,
                                 default=True,
                                 help='If true, concatenates the frame with the manipulated frame')

        self.parser.add_argument('--load', type=int,
                                 default=30,
                                 help='int of number to load checkpoint weights.')
        self.parser.add_argument('--device_id', type=int, default=0,
                                 help='which device to use')

        # logging and checkpointing
        self.parser.add_argument('--log_dir', type=str, default='logs/runs/',
                                 help='logging directory')
        self.parser.add_argument('--log_name', type=str, default='affa_f',
                                 help='name of the run, change this to track several experiments')

        self.parser.add_argument('--chkp_dir', type=str, default='checkpoints/',
                                 help='checkpoint directory (will use same name as log_name!)')
        self.initialized = True

    def parse(self, args=None):
        """Parse options and return the populated namespace.

        :param args: optional list of argument strings. Defaults to None,
            which makes argparse read ``sys.argv[1:]`` — identical to the
            original behavior. Passing an explicit list makes the class
            usable inside host processes (tests, notebooks, gradio) whose
            own argv would otherwise break parsing.
        :return: the parsed ``argparse.Namespace`` (also stored on
            ``self.opt``).
        """
        if not self.initialized:
            self.initialize()
        self.opt = self.parser.parse_args(args)
        return self.opt
requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ tensorflow
2
+ tensorflow-addons
3
+ opencv-python-headless
4
+ scipy
5
+ pillow
6
+ scikit-image
7
+ huggingface_hub
utils/__pycache__/utils.cpython-38.pyc ADDED
Binary file (11.6 kB). View file
 
utils/utils.py ADDED
@@ -0,0 +1,377 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import json
2
+ from tensorflow.keras.models import model_from_json
3
+ from networks.layers import AdaIN, AdaptiveAttention
4
+ import tensorflow as tf
5
+
6
+ import numpy as np
7
+ import cv2
8
+ import math
9
+ from skimage import transform as trans
10
+ from scipy.signal import convolve2d
11
+ from skimage.color import rgb2yuv, yuv2rgb
12
+
13
+ from PIL import Image
14
+
15
+
16
def save_model_internal(model, path, name, num):
    """Save a Keras model as architecture JSON plus a numbered weight file.

    Writes ``<path><name>.json`` (architecture only) and
    ``<path><name>_<num>.h5`` (weights). ``path`` is concatenated as a raw
    string, so it must already end with a path separator.

    :param model: Keras model to save.
    :param path: directory prefix (including trailing separator).
    :param name: base file name.
    :param num: checkpoint number appended to the weight file name.
    """
    json_model = model.to_json()
    with open(path + name + '.json', "w") as json_file:
        json_file.write(json_model)

    model.save_weights(path + name + '_' + str(num) + '.h5')
22
+
23
+
24
def load_model_internal(path, name, num):
    """Load a model previously written by ``save_model_internal``.

    Rebuilds the architecture from ``<path><name>.json`` — registering the
    custom AdaIN / AdaptiveAttention layers — and loads the checkpoint
    weights ``<path><name>_<num>.h5``.

    :param path: directory prefix (including trailing separator).
    :param name: base file name.
    :param num: checkpoint number of the weight file to load.
    :return: the reconstructed Keras model with weights loaded.
    """
    with open(path + name + '.json', 'r') as json_file:
        model_dict = json_file.read()

    mod = model_from_json(model_dict, custom_objects={'AdaIN': AdaIN, 'AdaptiveAttention': AdaptiveAttention})
    mod.load_weights(path + name + '_' + str(num) + '.h5')

    return mod
32
+
33
+
34
def save_training_meta(state_dict, path, num):
    """Serialize a training-state dict to ``<path><num>.json`` (2-space indent)."""
    target = path + str(num) + '.json'
    with open(target, 'w') as fh:
        json.dump(state_dict, fh, indent=2)
37
+
38
+
39
def load_training_meta(path, num):
    """Read back a training-state dict from ``<path><num>.json``."""
    meta_file = path + str(num) + '.json'
    with open(meta_file, 'r') as fh:
        return json.load(fh)
43
+
44
+
45
def log_info(sw, results_dict, iteration):
    """Write every entry of ``results_dict`` as a TensorBoard scalar.

    :param sw: summary writer used as the default writer (``as_default``).
    :param results_dict: mapping of tag name -> scalar value.
    :param iteration: global step the scalars are logged against.
    """
    with sw.as_default():
        for key in results_dict.keys():
            tf.summary.scalar(key, results_dict[key], step=iteration)
49
+
50
+
51
+ src1 = np.array([[51.642, 50.115], [57.617, 49.990], [35.740, 69.007],
52
+ [51.157, 89.050], [57.025, 89.702]],
53
+ dtype=np.float32)
54
+ # <--left
55
+ src2 = np.array([[45.031, 50.118], [65.568, 50.872], [39.677, 68.111],
56
+ [45.177, 86.190], [64.246, 86.758]],
57
+ dtype=np.float32)
58
+
59
+ # ---frontal
60
+ src3 = np.array([[39.730, 51.138], [72.270, 51.138], [56.000, 68.493],
61
+ [42.463, 87.010], [69.537, 87.010]],
62
+ dtype=np.float32)
63
+
64
+ # -->right
65
+ src4 = np.array([[46.845, 50.872], [67.382, 50.118], [72.737, 68.111],
66
+ [48.167, 86.758], [67.236, 86.190]],
67
+ dtype=np.float32)
68
+
69
+ # -->right profile
70
+ src5 = np.array([[54.796, 49.990], [60.771, 50.115], [76.673, 69.007],
71
+ [55.388, 89.702], [61.257, 89.050]],
72
+ dtype=np.float32)
73
+
74
+ src = np.array([src1, src2, src3, src4, src5])
75
+ src_map = {112: src, 224: src * 2}
76
+
77
+ # Left eye, right eye, nose, left mouth, right mouth
78
+ arcface_src = np.array(
79
+ [[38.2946, 51.6963], [73.5318, 51.5014], [56.0252, 71.7366],
80
+ [41.5493, 92.3655], [70.7299, 92.2041]],
81
+ dtype=np.float32)
82
+
83
+ arcface_src = np.expand_dims(arcface_src, axis=0)
84
+
85
+
86
def extract_face(img, bb, absolute_center, mode='arcface', extention_rate=0.05, debug=False):
    """Extract a square face crop from ``img`` given a bounding box.

    The image is zero-padded by 60 px on every side so boxes that extend
    past the frame can still be cropped. The box is squared to the mean of
    its side lengths, grown by ``extention_rate``, re-centered on
    ``absolute_center``, and that region of the padded image is returned.

    NOTE(review): the fixed 248x248 padded buffer (128 + 2*60) implies the
    input image is expected to be 128x128 — confirm with callers.

    :param img: input image array.
    :param bb: bounding box [x1, y1, x2, y2] as a numpy array (the
        ``bb + 60`` shift relies on array broadcasting).
    :param absolute_center: (x, y) point the crop is re-centered on.
    :param mode: 'arcface' biases the square box upwards (towards the
        forehead); any other value biases it downwards.
    :param extention_rate: fraction of the side length added as margin.
    :param debug: if True, draws boxes/centers and shows the images.
    :return: cropped region of the padded image.
    """
    # bbox, shifted into padded-image coordinates
    x1, y1, x2, y2 = bb + 60
    adjusted_absolute_center = (absolute_center[0] + 60, absolute_center[1] + 60)
    if debug:
        print(bb + 60)
        x1, y1, x2, y2 = bb
        cv2.rectangle(img, (x1, y1), (x2, y2), (0, 255, 0), 3)
        cv2.circle(img, absolute_center, 1, (255, 0, 255), 2)
        Image.fromarray(img).show()
        x1, y1, x2, y2 = bb + 60
    # Pad image in case face is out of frame
    padded_img = np.zeros(shape=(248, 248, 3), dtype=np.uint8)
    padded_img[60:-60, 60:-60, :] = img

    if debug:
        cv2.rectangle(padded_img, (x1, y1), (x2, y2), (0, 255, 255), 3)
        cv2.circle(padded_img, adjusted_absolute_center, 1, (255, 255, 255), 2)
        Image.fromarray(padded_img).show()

    y_len = abs(y1 - y2)
    x_len = abs(x1 - x2)

    # Square the box using the mean of the two side lengths.
    new_len = (y_len + x_len) // 2

    extension = int(new_len * extention_rate)

    x_adjust = (x_len - new_len) // 2
    y_adjust = (y_len - new_len) // 2

    x_1_adjusted = x1 + x_adjust - extension
    x_2_adjusted = x2 - x_adjust + extension

    if mode == 'arcface':
        # Keep the top edge; pull the bottom edge up (favors the forehead).
        y_1_adjusted = y1 - extension
        y_2_adjusted = y2 - 2 * y_adjust + extension
    else:
        # Keep the bottom edge; push the top edge down.
        y_1_adjusted = y1 + 2 * y_adjust - extension
        y_2_adjusted = y2 + extension

    # Shift the squared box so its center lands on the adjusted center.
    move_x = adjusted_absolute_center[0] - (x_1_adjusted + x_2_adjusted) // 2
    move_y = adjusted_absolute_center[1] - (y_1_adjusted + y_2_adjusted) // 2

    x_1_adjusted = x_1_adjusted + move_x
    x_2_adjusted = x_2_adjusted + move_x
    y_1_adjusted = y_1_adjusted + move_y
    y_2_adjusted = y_2_adjusted + move_y

    # print(y_1_adjusted, y_2_adjusted, x_1_adjusted, x_2_adjusted)

    return padded_img[y_1_adjusted:y_2_adjusted, x_1_adjusted:x_2_adjusted]
138
+
139
+
140
def distance(a, b):
    """Euclidean distance between two 2-D points ``a`` and ``b``."""
    dx = a[0] - b[0]
    dy = a[1] - b[1]
    return np.sqrt(dx ** 2 + dy ** 2)
142
+
143
+
144
def euclidean_distance(a, b):
    """Euclidean distance between points ``a`` and ``b`` given as (x, y) pairs."""
    x1, y1 = a[0], a[1]
    x2, y2 = b[0], b[1]
    return np.sqrt((x2 - x1) * (x2 - x1) + (y2 - y1) * (y2 - y1))
148
+
149
+
150
def align_face(img, landmarks, debug=False):
    """Rotate a face image so the eye line is horizontal.

    Derives the tilt angle from the right triangle formed by the two eyes
    and an auxiliary point, rotates the image about (64, 64) — i.e. the
    rotation is hard-coded for 128x128 input — and returns the rotated
    image plus an approximate face center in rotated coordinates (x of the
    eye midpoint, y halfway between eye midpoint and nose).

    :param img: face image (expected 128x128 given the fixed constants).
    :param landmarks: iterable unpacked as (nose, right_eye, left_eye).
    :param debug: if True, draws the construction points and lines.
    :return: tuple ``(rotated_image, absolute_center)``.
    """
    nose, right_eye, left_eye = landmarks

    left_eye_x = left_eye[0]
    left_eye_y = left_eye[1]

    right_eye_x = right_eye[0]
    right_eye_y = right_eye[1]

    center_eye = ((left_eye[0] + right_eye[0]) // 2, (left_eye[1] + right_eye[1]) // 2)

    # Auxiliary point completes a right triangle with the two eyes;
    # `direction` records the sign of the rotation.
    if left_eye_y < right_eye_y:
        point_3rd = (right_eye_x, left_eye_y)
        direction = -1
    else:
        point_3rd = (left_eye_x, right_eye_y)
        direction = 1

    if debug:
        cv2.circle(img, point_3rd, 1, (255, 0, 0), 1)
        cv2.circle(img, center_eye, 1, (255, 0, 0), 1)

        cv2.line(img, right_eye, left_eye, (0, 0, 0), 1)
        cv2.line(img, left_eye, point_3rd, (0, 0, 0), 1)
        cv2.line(img, right_eye, point_3rd, (0, 0, 0), 1)

    # Law of cosines on the eye triangle gives the tilt angle.
    a = euclidean_distance(left_eye, point_3rd)
    b = euclidean_distance(right_eye, left_eye)
    c = euclidean_distance(right_eye, point_3rd)

    cos_a = (b * b + c * c - a * a) / (2 * b * c)

    angle = np.arccos(cos_a)

    # Radians -> degrees (cv2.getRotationMatrix2D expects degrees).
    angle = (angle * 180) / np.pi

    if direction == -1:
        angle = 90 - angle
        ang = math.radians(direction * angle)
    else:
        ang = math.radians(direction * angle)
        angle = 0 - angle

    M = cv2.getRotationMatrix2D((64, 64), angle, 1)
    new_img = cv2.warpAffine(img, M, (128, 128),
                             flags=cv2.INTER_CUBIC)

    # Rotate the nose and eye-midpoint by the same angle (manual 2-D
    # rotation about the image center) so the face center can be reported
    # in the rotated image's coordinates.
    rotated_nose = (int((nose[0] - 64) * np.cos(ang) - (nose[1] - 64) * np.sin(ang) + 64),
                    int((nose[0] - 64) * np.sin(ang) + (nose[1] - 64) * np.cos(ang) + 64))

    rotated_center_eye = (int((center_eye[0] - 64) * np.cos(ang) - (center_eye[1] - 64) * np.sin(ang) + 64),
                          int((center_eye[0] - 64) * np.sin(ang) + (center_eye[1] - 64) * np.cos(ang) + 64))

    abolute_center = (rotated_center_eye[0], (rotated_nose[1] + rotated_center_eye[1]) // 2)

    if debug:
        cv2.circle(new_img, rotated_nose, 1, (0, 0, 255), 1)
        cv2.circle(new_img, rotated_center_eye, 1, (0, 0, 255), 1)
        cv2.circle(new_img, abolute_center, 1, (0, 0, 255), 1)

    return new_img, abolute_center
211
+
212
+
213
def estimate_norm(lmk, image_size=112, mode='arcface', shrink_factor=1.0):
    """Estimate the 2x3 similarity transform aligning five facial
    landmarks to canonical template coordinates.

    Fits a similarity transform against every template in the source set
    and keeps the one with the smallest total landmark reprojection error.

    :param lmk: (5, 2) array of landmark coordinates.
    :param image_size: output resolution the templates are scaled to.
    :param mode: 'arcface' uses the single ArcFace template (optionally
        shrunk towards the center); any other value selects the
        pose-specific template set from ``src_map`` (keys 112 and 224).
    :param shrink_factor: 1.0 gives exact ArcFace alignment; lower values
        pull template points towards (56, 56), keeping more border.
    :return: tuple ``(M, index)`` — the best 2x3 affine matrix and the
        index of the winning template.
    """
    assert lmk.shape == (5, 2)
    tform = trans.SimilarityTransform()
    # Homogeneous coordinates, used to reproject landmarks for scoring.
    lmk_tran = np.insert(lmk, 2, values=np.ones(5), axis=1)
    min_M = []
    min_index = []
    min_error = float('inf')
    src_factor = image_size / 112
    if mode == 'arcface':
        src = arcface_src * shrink_factor + (1 - shrink_factor) * 56
        src = src * src_factor
    else:
        src = src_map[image_size] * src_factor
    for i in np.arange(src.shape[0]):
        tform.estimate(lmk, src[i])
        M = tform.params[0:2, :]
        results = np.dot(M, lmk_tran.T)
        results = results.T
        # Sum of per-landmark Euclidean reprojection errors.
        error = np.sum(np.sqrt(np.sum((results - src[i])**2, axis=1)))
        # print(error)
        if error < min_error:
            min_error = error
            min_M = M
            min_index = i
    return min_M, min_index
238
+
239
+
240
def inverse_estimate_norm(lmk, t_lmk, image_size=112, mode='arcface', shrink_factor=1.0):
    """Estimate the 2x3 similarity transform mapping transformed landmarks
    ``t_lmk`` back onto the original landmarks ``lmk``.

    NOTE(review): this looks like copied code from ``estimate_norm`` — the
    loop re-estimates the identical (t_lmk -> lmk) transform on every
    iteration, so the returned matrix is the same for every template and
    only the error/index bookkeeping varies. Confirm intended before
    simplifying.

    :param lmk: (5, 2) original landmark coordinates.
    :param t_lmk: (5, 2) transformed landmark coordinates.
    :param image_size: template scale factor base (templates scaled by
        ``image_size / 112``).
    :param mode: 'arcface' uses the ArcFace template for error scoring;
        otherwise the ``src_map`` template set.
    :param shrink_factor: same semantics as in ``estimate_norm``.
    :return: tuple ``(M, index)`` — inverse 2x3 affine matrix and template
        index with minimal reprojection error against the templates.
    """
    assert lmk.shape == (5, 2)
    tform = trans.SimilarityTransform()
    lmk_tran = np.insert(lmk, 2, values=np.ones(5), axis=1)
    min_M = []
    min_index = []
    min_error = float('inf')
    src_factor = image_size / 112
    if mode == 'arcface':
        src = arcface_src * shrink_factor + (1 - shrink_factor) * 56
        src = src * src_factor
    else:
        src = src_map[image_size] * src_factor
    for i in np.arange(src.shape[0]):
        # Estimate the transform from the transformed points back to the
        # originals (inverse direction of estimate_norm).
        tform.estimate(t_lmk, lmk)
        M = tform.params[0:2, :]
        results = np.dot(M, lmk_tran.T)
        results = results.T
        error = np.sum(np.sqrt(np.sum((results - src[i])**2, axis=1)))
        # print(error)
        if error < min_error:
            min_error = error
            min_M = M
            min_index = i
    return min_M, min_index
265
+
266
+
267
def norm_crop(img, landmark, image_size=112, mode='arcface', shrink_factor=1.0):
    """
    Align and crop the image based on the facial landmarks in the image. The alignment is done with
    a similarity transformation based on source coordinates.
    :param img: Image to transform.
    :param landmark: Five landmark coordinates in the image.
    :param image_size: Desired output size after transformation.
    :param mode: 'arcface' aligns the face for the use of the Arcface facial recognition model. Useful for
    both facial recognition tasks and face swapping tasks.
    :param shrink_factor: Shrink factor that shrinks the source landmark coordinates. This will include more border
    information around the face. Useful when you want to include more background information when performing face swaps.
    The lower the shrink factor the more of the face is included. Default value 1.0 will align the image to be ready
    for the Arcface recognition model, but usually omits part of the chin. Value of 0.0 would transform all source points
    to the middle of the image, probably rendering the alignment procedure useless.

    If you process the image with a shrink factor of 0.85 and then want to extract the identity embedding with arcface,
    you simply do a central crop of factor 0.85 to yield the same cropped result as using shrink factor 1.0. This will
    reduce the resolution; the recommendation is to process images to output resolutions higher than 112 when using
    Arcface. This will make sure no information is lost by resampling the image after the central crop.
    :return: Returns the transformed image.
    """
    # Pick the best similarity transform across templates, then warp.
    M, pose_index = estimate_norm(landmark, image_size, mode, shrink_factor=shrink_factor)
    warped = cv2.warpAffine(img, M, (image_size, image_size), borderValue=0.0)
    return warped
291
+
292
+
293
def transform_landmark_points(M, points):
    """Apply a 2x3 affine transform to a set of 2-D points.

    Generalized from the original, which hard-coded ``np.ones(5)`` and so
    only accepted exactly five points; any (N, 2) array now works.

    :param M: (2, 3) affine transformation matrix.
    :param points: (N, 2) array of point coordinates.
    :return: (N, 2) array of transformed coordinates.
    """
    points = np.asarray(points)
    # Homogeneous coordinates so M's translation column applies in one dot.
    lmk_tran = np.insert(points, 2, values=np.ones(points.shape[0]), axis=1)
    transformed_lmk = np.dot(M, lmk_tran.T)
    transformed_lmk = transformed_lmk.T

    return transformed_lmk
299
+
300
+
301
def multi_convolver(image, kernel, iterations):
    """Convolve a single-channel image repeatedly with a named kernel.

    :param image: 2-D array (single channel).
    :param kernel: Kernel name: 'Sharpen', 'Unsharp_mask' or 'Blur'.
    :param iterations: Number of times the kernel is applied.
    :return: The convolved image; borders are zero-padded on each pass.
    :raises ValueError: If *kernel* is not a recognised name (the original
        silently passed the string through to convolve2d).
    """
    if kernel == "Sharpen":
        kernel = np.array([[0, -1, 0],
                           [-1, 5, -1],
                           [0, -1, 0]])
    elif kernel == "Unsharp_mask":
        # Standard 5x5 unsharp-masking kernel: negated Gaussian with a
        # boosted centre, scaled by -1/256 so it sums to exactly 1.
        # BUGFIX: the original's last column read 1/1/1 instead of 4/6/4,
        # breaking the kernel's symmetry and its unit DC gain (a constant
        # image was scaled by ~267/256 instead of being preserved).
        kernel = np.array([[1, 4, 6, 4, 1],
                           [4, 16, 24, 16, 4],
                           [6, 24, -476, 24, 6],
                           [4, 16, 24, 16, 4],
                           [1, 4, 6, 4, 1]]) * (-1 / 256)
    elif kernel == "Blur":
        kernel = (1 / 16.0) * np.array([[1., 2., 1.],
                                        [2., 4., 2.],
                                        [1., 2., 1.]])
    else:
        raise ValueError(f"Unknown kernel name: {kernel!r}")
    for _ in range(iterations):
        # 'same' output size; zero fill at the borders, as before.
        image = convolve2d(image, kernel, 'same', boundary='fill', fillvalue=0)
    return image
319
+
320
+
321
def convolve_rgb(image, kernel, iterations=1):
    """Filter only the luminance of an RGB image with a named kernel.

    The image is converted to YUV, the Y (luma) channel is run through
    ``multi_convolver``, and the result is converted back to RGB — the
    chrominance channels are untouched, so colours are preserved.

    :param image: RGB image array.
    :param kernel: Kernel name accepted by ``multi_convolver``.
    :param iterations: Number of convolution passes on the luma channel.
    :return: Filtered RGB image as float32.
    """
    yuv = rgb2yuv(image)
    yuv[:, :, 0] = multi_convolver(yuv[:, :, 0], kernel, iterations)
    return yuv2rgb(yuv).astype('float32')
328
+
329
+
330
def generate_mask_from_landmarks(lms, im_size):
    """Paint a rough face mask (white blobs on black) from five landmarks.

    Thick circles are drawn over the eyes, between the eyes, on the nose
    and around the mouth, approximating the facial region.

    :param lms: Five (x, y) landmarks ordered left eye, right eye, nose,
        left mouth corner, right mouth corner — presumably; ordering is
        inferred from the comments in the original (TODO confirm vs caller).
    :param im_size: Side length of the square output mask.
    :return: (im_size, im_size, 3) float32 mask with 255-valued blobs.
    """
    mask = np.zeros(shape=(im_size, im_size, 3), dtype='float32')
    white = (255, 255, 255)

    eye_mid = (int((lms[0][0] + lms[1][0]) / 2), int((lms[0][1] + lms[1][1]) / 2))
    nose_bridge = (int((lms[0][0] + lms[1][0]) / 2), int(lms[2][1]))
    mouth_mid = (int((lms[3][0] + lms[4][0]) / 2), int((lms[3][1] + lms[4][1]) / 2))

    # (centre, radius, thickness) for each blob, drawn in the original order.
    blobs = [
        # eyes
        ((int(lms[0][0]), int(lms[0][1])), 12, 30),
        ((int(lms[1][0]), int(lms[1][1])), 12, 30),
        (eye_mid, 16, 65),
        # nose
        ((int(lms[2][0]), int(lms[2][1])), 5, 5),
        (nose_bridge, 16, 100),
        # mouth
        ((int(lms[3][0]), int(lms[3][1])), 6, 30),
        ((int(lms[4][0]), int(lms[4][1])), 6, 30),
        (mouth_mid, 16, 40),
    ]
    for center, radius, thickness in blobs:
        mask = cv2.circle(mask, center, radius, white, thickness)
    return mask
358
+
359
+
360
def display_distance_text(im, distance, lms, im_w, im_h, scale=2):
    """Draw the distance value as two-tone text anchored near a landmark.

    The text is rendered twice at the same spot: a thicker dark-green pass
    underneath and a thinner light-green pass on top, giving an outline.

    :param im: Image to draw on.
    :param distance: Value to display; truncated to four characters.
    :param lms: Normalised landmark array; lms[4]/lms[5] anchor the text.
    :param im_w: Image width used to denormalise the x position.
    :param im_h: Image height used to denormalise the y position.
    :param scale: Controls both font size and stroke thickness.
    :return: The image with the text drawn in.
    """
    text = str(distance)[:4]
    position = (int(lms[4] * im_w * 0.5), int(lms[5] * im_h * 0.8))
    font = cv2.FONT_HERSHEY_SIMPLEX
    blended_insert = cv2.putText(im, text, position, font,
                                 scale * 0.5, (0.08, 0.16, 0.08), int(scale * 2))
    blended_insert = cv2.putText(blended_insert, text, position, font,
                                 scale * 0.5, (0.3, 0.7, 0.32), int(scale * 1))
    return blended_insert
368
+
369
+
370
def get_lm(annotation, im_w, im_h):
    """Scale the five normalised landmark pairs in *annotation* to pixels.

    Entries 4..13 of *annotation* hold five (x, y) pairs in image-relative
    coordinates; each x is multiplied by *im_w* and each y by *im_h*.

    :param annotation: Indexable sequence with landmarks at positions 4-13.
    :param im_w: Image width in pixels.
    :param im_h: Image height in pixels.
    :return: (5, 2) float32 array of pixel-space landmark coordinates.
    """
    # Multiply in double precision first, then cast — matches the original,
    # which built Python-float products before the float32 conversion.
    pairs = np.asarray(annotation[4:14], dtype=np.float64).reshape(5, 2)
    scaled = pairs * np.array([im_w, im_h], dtype=np.float64)
    return scaled.astype(np.float32)