Spaces:
Build error
Build error
Merge branch 'main' of https://huggingface.co/spaces/SophieDC/SofaStyler into main
Browse files- box_ops.py +88 -0
- segmentation.py +72 -0
box_ops.py
ADDED
@@ -0,0 +1,88 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved
|
2 |
+
"""
|
3 |
+
Utilities for bounding box manipulation and GIoU.
|
4 |
+
"""
|
5 |
+
import torch
|
6 |
+
from torchvision.ops.boxes import box_area
|
7 |
+
|
8 |
+
|
9 |
+
def box_cxcywh_to_xyxy(x):
    """Convert boxes from (center_x, center_y, width, height) to
    (x0, y0, x1, y1) corner format.

    Works on any tensor whose last dimension is 4; returns a tensor of
    the same shape.
    """
    cx, cy, w, h = x.unbind(-1)
    half_w = 0.5 * w
    half_h = 0.5 * h
    corners = (cx - half_w, cy - half_h, cx + half_w, cy + half_h)
    return torch.stack(corners, dim=-1)
|
14 |
+
|
15 |
+
|
16 |
+
def box_xyxy_to_cxcywh(x):
    """Convert boxes from (x0, y0, x1, y1) corner format to
    (center_x, center_y, width, height) format.

    Inverse of `box_cxcywh_to_xyxy`; operates on the last dimension.
    """
    x0, y0, x1, y1 = x.unbind(-1)
    center_and_size = ((x0 + x1) / 2, (y0 + y1) / 2, x1 - x0, y1 - y0)
    return torch.stack(center_and_size, dim=-1)
|
21 |
+
|
22 |
+
|
23 |
+
# modified from torchvision to also return the union
def box_iou(boxes1, boxes2):
    """Pairwise IoU between two sets of boxes in (x0, y0, x1, y1) format.

    Returns a tuple (iou, union), each of shape [N, M] where
    N = len(boxes1) and M = len(boxes2).
    """
    # Per-box areas (equivalent to torchvision.ops.boxes.box_area).
    area1 = (boxes1[:, 2] - boxes1[:, 0]) * (boxes1[:, 3] - boxes1[:, 1])
    area2 = (boxes2[:, 2] - boxes2[:, 0]) * (boxes2[:, 3] - boxes2[:, 1])

    # Intersection rectangle for every (box1, box2) pair.
    top_left = torch.max(boxes1[:, None, :2], boxes2[:, :2])      # [N,M,2]
    bottom_right = torch.min(boxes1[:, None, 2:], boxes2[:, 2:])  # [N,M,2]

    inter_wh = (bottom_right - top_left).clamp(min=0)  # [N,M,2]
    inter = inter_wh[..., 0] * inter_wh[..., 1]        # [N,M]

    union = area1[:, None] + area2 - inter
    return inter / union, union
|
38 |
+
|
39 |
+
|
40 |
+
def generalized_box_iou(boxes1, boxes2):
    """
    Generalized IoU from https://giou.stanford.edu/

    The boxes should be in [x0, y0, x1, y1] format

    Returns a [N, M] pairwise matrix, where N = len(boxes1)
    and M = len(boxes2)
    """
    # Degenerate boxes (x1 < x0 or y1 < y0) give inf / nan results,
    # so validate up front before doing any arithmetic.
    assert (boxes1[:, 2:] >= boxes1[:, :2]).all()
    assert (boxes2[:, 2:] >= boxes2[:, :2]).all()
    iou, union = box_iou(boxes1, boxes2)

    # Smallest axis-aligned rectangle enclosing each pair of boxes.
    enclosing_tl = torch.min(boxes1[:, None, :2], boxes2[:, :2])
    enclosing_br = torch.max(boxes1[:, None, 2:], boxes2[:, 2:])

    enclosing_wh = (enclosing_br - enclosing_tl).clamp(min=0)  # [N,M,2]
    enclosing_area = enclosing_wh[..., 0] * enclosing_wh[..., 1]

    # GIoU = IoU - (enclosing_area - union) / enclosing_area
    return iou - (enclosing_area - union) / enclosing_area
|
62 |
+
|
63 |
+
|
64 |
+
def masks_to_boxes(masks):
    """Compute the bounding boxes around the provided masks.

    The masks should be in format [N, H, W] where N is the number of
    masks and (H, W) are the spatial dimensions.

    Returns a [N, 4] tensor, with the boxes in xyxy format. An empty
    input yields an empty [0, 4] tensor on the same device.
    """
    if masks.numel() == 0:
        return torch.zeros((0, 4), device=masks.device)

    h, w = masks.shape[-2:]

    # Fix: create the coordinate grids on the same device as `masks`
    # (the original always allocated on CPU, which breaks CUDA inputs).
    # `indexing="ij"` pins the historical meshgrid behavior and silences
    # the deprecation warning in recent PyTorch.
    y = torch.arange(0, h, dtype=torch.float, device=masks.device)
    x = torch.arange(0, w, dtype=torch.float, device=masks.device)
    y, x = torch.meshgrid(y, x, indexing="ij")

    # Max/min of the per-pixel column index over each mask's support;
    # empty pixels are pushed to 1e8 before taking the min.
    x_mask = (masks * x.unsqueeze(0))
    x_max = x_mask.flatten(1).max(-1)[0]
    x_min = x_mask.masked_fill(~(masks.bool()), 1e8).flatten(1).min(-1)[0]

    # Same for the row index.
    y_mask = (masks * y.unsqueeze(0))
    y_max = y_mask.flatten(1).max(-1)[0]
    y_min = y_mask.masked_fill(~(masks.bool()), 1e8).flatten(1).min(-1)[0]

    return torch.stack([x_min, y_min, x_max, y_max], 1)
|
segmentation.py
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Import libraries
|
2 |
+
|
3 |
+
import cv2
|
4 |
+
from tensorflow import keras
|
5 |
+
import numpy as np
|
6 |
+
import matplotlib.pyplot as plt
|
7 |
+
from PIL import Image
|
8 |
+
import segmentation_models as sm
|
9 |
+
|
10 |
+
# Cached segmentation model: building the U-Net and loading its .h5
# weights is expensive, so do it once per process instead of on every
# get_mask() call (the original rebuilt and reloaded everything per call).
_seg_model = None


def _build_seg_model():
    """Build the sofa-segmentation U-Net and load its checkpoint weights."""
    model_path = "Segmentation/model_checkpoint.h5"
    CLASSES = ['sofa']
    BACKBONE = 'resnet50'

    # define network parameters
    n_classes = 1 if len(CLASSES) == 1 else (len(CLASSES) + 1)  # case for binary and multiclass segmentation
    activation = 'sigmoid' if n_classes == 1 else 'softmax'
    sm.set_framework('tf.keras')
    LR = 0.0001

    # create model architecture
    model = sm.Unet(BACKBONE, classes=n_classes, activation=activation)
    # define optimizer
    optim = keras.optimizers.Adam(LR)
    # Segmentation models losses can be combined together by '+' and scaled by integer or float factor
    dice_loss = sm.losses.DiceLoss()
    focal_loss = sm.losses.BinaryFocalLoss() if n_classes == 1 else sm.losses.CategoricalFocalLoss()
    total_loss = dice_loss + (1 * focal_loss)
    metrics = [sm.metrics.IOUScore(threshold=0.5), sm.metrics.FScore(threshold=0.5)]
    # compile keras model with defined optimizer, loss and metrics
    model.compile(optim, total_loss, metrics)

    # load trained weights
    model.load_weights(model_path)
    return model


def get_mask(image):
    """Segment the sofa in `image` and return its binary mask.

    The input is converted with np.array(), resized to 640x640 and fed
    to the cached U-Net; the rounded prediction is saved to
    "masks/sofa.jpg" (the directory must exist — NOTE(review): confirm)
    and returned as a uint8 numpy array (0/255, L mode).
    """
    global _seg_model
    if _seg_model is None:
        _seg_model = _build_seg_model()

    # Model expects a BGR 640x640 batch of one image.
    test_img = np.array(image)
    test_img = cv2.resize(test_img, (640, 640))
    test_img = cv2.cvtColor(test_img, cv2.COLOR_RGB2BGR)
    test_img = np.expand_dims(test_img, axis=0)

    prediction = _seg_model.predict(test_img).round()
    mask = Image.fromarray(prediction[..., 0].squeeze() * 255).convert("L")
    mask.save("masks/sofa.jpg")
    return np.array(mask)
|
49 |
+
|
50 |
+
def replace_sofa(image, mask, styled_sofa):
    """Composite the styled sofa into the original scene.

    Pixels where `mask` is on are taken from `styled_sofa` (converted
    BGR->RGB); every other pixel keeps the original `image` value.
    Returns the combined image as a numpy array.
    """
    image = np.array(image)
    styled_sofa = cv2.cvtColor(styled_sofa, cv2.COLOR_BGR2RGB)

    # Binarize the mask (anything above 10 counts as sofa), then split the
    # scene into background (mask off) and foreground (mask on).
    _, binary_mask = cv2.threshold(mask, 10, 255, cv2.THRESH_BINARY)
    inverted_mask = cv2.bitwise_not(binary_mask)
    background = cv2.bitwise_and(image, image, mask=inverted_mask)
    foreground = cv2.bitwise_and(styled_sofa, styled_sofa, mask=binary_mask)

    return cv2.add(background, foreground)
|
64 |
+
|
65 |
+
# image = cv2.imread('input/sofa.jpg')
|
66 |
+
# mask = cv2.imread('masks/sofa.jpg')
|
67 |
+
# styled_sofa = cv2.imread('output/sofa_stylized_style.jpg')
|
68 |
+
|
69 |
+
# #get_mask(image)
|
70 |
+
|
71 |
+
# plt.imshow(replace_sofa(image,mask,styled_sofa))
|
72 |
+
# plt.show()
|