Spaces:

Norod78
/

PumpkinHeads

Build error

App Files Files Community

Doron Adler committed on Oct 24, 2022

Commit

d98412d

1 Parent(s): c63f589

Head Pumpkinizer

Browse files

Files changed (11) hide show

.gitattributes +2 -0
Example00001.jpg +0 -0
Example00002.jpg +0 -0
Example00003.jpg +0 -0
Example00004.jpg +0 -0
README.md +33 -7
app.py +102 -0
face_detection.py +140 -0
ffhq2pumpkinheads_pix2pixHD_e03_itr4500-simp.onnx +3 -0
requirements.txt +7 -0
shape_predictor_5_face_landmarks.dat +3 -0

.gitattributes CHANGED Viewed

@@ -31,3 +31,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+ffhq2pumpkinheads_pix2pixHD_e03_itr4500-simp.onnx filter=lfs diff=lfs merge=lfs -text
+shape_predictor_5_face_landmarks.dat filter=lfs diff=lfs merge=lfs -text

Example00001.jpg ADDED Viewed

Example00002.jpg ADDED Viewed

Example00003.jpg ADDED Viewed

Example00004.jpg ADDED Viewed

README.md CHANGED Viewed

@@ -1,13 +1,39 @@
 ---
-title: PumpkinHeads
-emoji: 🐨
-colorFrom: purple
-colorTo: indigo
 sdk: gradio
-sdk_version: 3.6
 app_file: app.py
 pinned: false
-license: mit
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Pumpkin heads
+emoji: 🎃
+colorFrom: orange
+colorTo: yellow
 sdk: gradio
 app_file: app.py
 pinned: false
 ---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+# Configuration
+`title`: _string_
+Display title for the Space
+`emoji`: _string_
+Space emoji (only emoji characters are allowed)
+`colorFrom`: _string_
+Color for Thumbnail gradient (red, yellow, green, blue, indigo, purple, pink, gray)
+`colorTo`: _string_
+Color for Thumbnail gradient (red, yellow, green, blue, indigo, purple, pink, gray)
+`sdk`: _string_
+Can be either `gradio` or `streamlit`
+`sdk_version`: _string_
+Version of the selected SDK (`gradio` or `streamlit`).
+See [doc](https://hf.co/docs/hub/spaces) for more info on supported versions.
+`app_file`: _string_
+Path to your main application file (which contains either `gradio` or `streamlit` Python code).
+Path is relative to the root of the repository.
+`pinned`: _boolean_
+Whether the Space stays on top of your list.

app.py ADDED Viewed

	@@ -0,0 +1,102 @@

+import os
+import onnxruntime as rt
+import sys
+import PIL
+from PIL import Image, ImageOps, ImageFile
+import numpy as np
+from pathlib import Path
+import collections
+from typing import Union, List
+import scipy.ndimage
+import requests
+MODEL_FILE = "ffhq2pumpkinheads_pix2pixHD_e03_itr4500-simp.onnx"
+so = rt.SessionOptions()
+so.inter_op_num_threads = 4
+so.intra_op_num_threads = 4
+session = rt.InferenceSession(MODEL_FILE, sess_options=so)
+input_name = session.get_inputs()[0].name
+print("input_name = " + str(input_name))
+output_name = session.get_outputs()[0].name
+print("output_name = " + str(output_name))
+import os
+os.system("pip install dlib")
+import face_detection
+def array_to_image(array_in):
+    array_in = np.squeeze(255*(array_in + 1)/2)
+    array_in = np.transpose(array_in, (1, 2, 0))
+    im = Image.fromarray(array_in.astype(np.uint8))
+    return im
+def image_as_array(image_in):
+    im_array = np.array(image_in, np.float32)
+    im_array = (im_array/255)*2 - 1
+    im_array = np.transpose(im_array, (2, 0, 1))
+    im_array = np.expand_dims(im_array, 0)
+    return im_array
+def find_aligned_face(image_in, size=1024):
+    aligned_image, n_faces, quad = face_detection.align(image_in, face_index=0, output_size=size)
+    return aligned_image, n_faces, quad
+def align_first_face(image_in, size=1024):
+    aligned_image, n_faces, quad = find_aligned_face(image_in,size=size)
+    if n_faces == 0:
+        try:
+            image_in = ImageOps.exif_transpose(image_in)
+        except:
+            print("exif problem, not rotating")
+        image_in = image_in.resize((size, size))
+        im_array = image_as_array(image_in)
+    else:
+        im_array = image_as_array(aligned_image)
+    return im_array
+def img_concat_h(im1, im2):
+    dst = Image.new('RGB', (im1.width + im2.width, im1.height))
+    dst.paste(im1, (0, 0))
+    dst.paste(im2, (im1.width, 0))
+    return dst
+import gradio as gr
+def face2vintage(
+    img: Image.Image,
+    size: int
+) -> Image.Image:
+    aligned_img = align_first_face(img)
+    if aligned_img is None:
+        output=None
+    else:
+        output = session.run([output_name], {input_name: aligned_img})[0]
+        output = array_to_image(output)
+        aligned_img = array_to_image(aligned_img).resize((output.width, output.height))
+        output = img_concat_h(aligned_img, output)
+    return output
+def inference(img):
+    out = face2vintage(img, 1024)
+    return out
+# Static text shown by the Gradio interface built below.
+title = "Pumpkin head Pix2PixHD"
+description = "Pumpkinize your head. Upload an image with a face, or click on one of the examples below. If a face could not be detected, an image will still be created."
+# HTML footer with credits (rendered as the interface "article").
+article = "<hr><p style='text-align: center'>See the <a href='https://github.com/justinpinkney/pix2pixHD' target='_blank'>Github Repo</a></p><p>The \"Pumpkin Head\" Pix2PixHD model was trained by <a href='https://linktr.ee/Norod78' target='_blank'>Doron Adler</a></p>"
+# One single-element row per example because the interface has one input.
+examples=[['Example00001.jpg'],['Example00002.jpg'],['Example00003.jpg'],['Example00004.jpg']]
+gr.Interface(
+    inference,
+    gr.inputs.Image(type="pil", label="Input"),
+    gr.outputs.Image(type="pil", label="Output"),
+    title=title,
+    description=description,
+    article=article,
+    examples=examples,
+    enable_queue=True,
+    allow_flagging=False
+    ).launch()

face_detection.py ADDED Viewed

	@@ -0,0 +1,140 @@

+# Copyright (c) 2021 Justin Pinkney
+import dlib
+import numpy as np
+import os
+from PIL import Image
+from PIL import ImageOps
+from scipy.ndimage import gaussian_filter
+import cv2
+# Landmark model file passed to dlib.shape_predictor in get_landmarks.
+MODEL_PATH = "shape_predictor_5_face_landmarks.dat"
+# Face detector created once at import time and reused by get_landmarks.
+detector = dlib.get_frontal_face_detector()
+def align(image_in, face_index=0, output_size=256):
+    try:
+        image_in = ImageOps.exif_transpose(image_in)
+    except:
+        print("exif problem, not rotating")
+    landmarks = list(get_landmarks(image_in))
+    n_faces = len(landmarks)
+    face_index = min(n_faces-1, face_index)
+    if n_faces == 0:
+        aligned_image = image_in
+        quad = None
+    else:
+        aligned_image, quad = image_align(image_in, landmarks[face_index], output_size=output_size)
+    return aligned_image, n_faces, quad
+def composite_images(quad, img, output):
+    """Composite an image into and output canvas according to transformed co-ords"""
+    output = output.convert("RGBA")
+    img = img.convert("RGBA")
+    input_size = img.size
+    src = np.array(((0, 0), (0, input_size[1]), input_size, (input_size[0], 0)), dtype=np.float32)
+    dst = np.float32(quad)
+    mtx = cv2.getPerspectiveTransform(dst, src)
+    img = img.transform(output.size, Image.PERSPECTIVE, mtx.flatten(), Image.BILINEAR)
+    output.alpha_composite(img)
+    return output.convert("RGB")
+def get_landmarks(image):
+    """Get landmarks from PIL image"""
+    shape_predictor = dlib.shape_predictor(MODEL_PATH)
+    max_size = max(image.size)
+    reduction_scale = int(max_size/512)
+    if reduction_scale == 0:
+        reduction_scale = 1
+    downscaled = image.reduce(reduction_scale)
+    img = np.array(downscaled)
+    detections = detector(img, 0)
+    for detection in detections:
+        try:
+            face_landmarks = [(reduction_scale*item.x, reduction_scale*item.y) for item in shape_predictor(img, detection).parts()]
+            yield face_landmarks
+        except Exception as e:
+            print(e)
+def image_align(src_img, face_landmarks, output_size=512, transform_size=2048, enable_padding=True, x_scale=1, y_scale=1, em_scale=0.1, alpha=False):
+        # Align function modified from ffhq-dataset
+        # See https://github.com/NVlabs/ffhq-dataset for license
+        lm = np.array(face_landmarks)
+        lm_eye_left      = lm[2:3]  # left-clockwise
+        lm_eye_right     = lm[0:1]  # left-clockwise
+        # Calculate auxiliary vectors.
+        eye_left     = np.mean(lm_eye_left, axis=0)
+        eye_right    = np.mean(lm_eye_right, axis=0)
+        eye_avg      = (eye_left + eye_right) * 0.5
+        eye_to_eye   = 0.71*(eye_right - eye_left)
+        mouth_avg    = lm[4]
+        eye_to_mouth = 1.35*(mouth_avg - eye_avg)
+        # Choose oriented crop rectangle.
+        x = eye_to_eye.copy()
+        x /= np.hypot(*x)
+        x *= max(np.hypot(*eye_to_eye) * 2.0, np.hypot(*eye_to_mouth) * 1.8)
+        x *= x_scale
+        y = np.flipud(x) * [-y_scale, y_scale]
+        c = eye_avg + eye_to_mouth * em_scale
+        quad = np.stack([c - x - y, c - x + y, c + x + y, c + x - y])
+        quad_orig = quad.copy()
+        qsize = np.hypot(*x) * 2
+        img = src_img.convert('RGBA').convert('RGB')
+        # Shrink.
+        shrink = int(np.floor(qsize / output_size * 0.5))
+        if shrink > 1:
+            rsize = (int(np.rint(float(img.size[0]) / shrink)), int(np.rint(float(img.size[1]) / shrink)))
+            img = img.resize(rsize, Image.ANTIALIAS)
+            quad /= shrink
+            qsize /= shrink
+        # Crop.
+        border = max(int(np.rint(qsize * 0.1)), 3)
+        crop = (int(np.floor(min(quad[:,0]))), int(np.floor(min(quad[:,1]))), int(np.ceil(max(quad[:,0]))), int(np.ceil(max(quad[:,1]))))
+        crop = (max(crop[0] - border, 0), max(crop[1] - border, 0), min(crop[2] + border, img.size[0]), min(crop[3] + border, img.size[1]))
+        if crop[2] - crop[0] < img.size[0] or crop[3] - crop[1] < img.size[1]:
+            img = img.crop(crop)
+            quad -= crop[0:2]
+        # Pad.
+        pad = (int(np.floor(min(quad[:,0]))), int(np.floor(min(quad[:,1]))), int(np.ceil(max(quad[:,0]))), int(np.ceil(max(quad[:,1]))))
+        pad = (max(-pad[0] + border, 0), max(-pad[1] + border, 0), max(pad[2] - img.size[0] + border, 0), max(pad[3] - img.size[1] + border, 0))
+        if enable_padding and max(pad) > border - 4:
+            pad = np.maximum(pad, int(np.rint(qsize * 0.3)))
+            img = np.pad(np.float32(img), ((pad[1], pad[3]), (pad[0], pad[2]), (0, 0)), 'reflect')
+            h, w, _ = img.shape
+            y, x, _ = np.ogrid[:h, :w, :1]
+            mask = np.maximum(1.0 - np.minimum(np.float32(x) / pad[0], np.float32(w-1-x) / pad[2]), 1.0 - np.minimum(np.float32(y) / pad[1], np.float32(h-1-y) / pad[3]))
+            blur = qsize * 0.02
+            img += (gaussian_filter(img, [blur, blur, 0]) - img) * np.clip(mask * 3.0 + 1.0, 0.0, 1.0)
+            img += (np.median(img, axis=(0,1)) - img) * np.clip(mask, 0.0, 1.0)
+            img = np.uint8(np.clip(np.rint(img), 0, 255))
+            if alpha:
+                mask = 1-np.clip(3.0 * mask, 0.0, 1.0)
+                mask = np.uint8(np.clip(np.rint(mask*255), 0, 255))
+                img = np.concatenate((img, mask), axis=2)
+                img = Image.fromarray(img, 'RGBA')
+            else:
+                img = Image.fromarray(img, 'RGB')
+            quad += pad[:2]
+        # Transform.
+        img = img.transform((transform_size, transform_size), Image.QUAD, (quad + 0.5).flatten(), Image.BILINEAR)
+        if output_size < transform_size:
+            img = img.resize((output_size, output_size), Image.ANTIALIAS)
+        return img, quad_orig

ffhq2pumpkinheads_pix2pixHD_e03_itr4500-simp.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3dc9bc6902dbc85c7168adf07ed999d4f5f7638bafa23166a5b8c17166851a9
+size 729804826

requirements.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+numpy
+opencv-python-headless
+Pillow
+scikit-image
+onnxruntime
+scipy
+cmake

shape_predictor_5_face_landmarks.dat ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4b1e9804792707d3a405c2c16a80a20269e6675021f64a41d30fffafbc41888
+size 9150489