Spaces:
Paused
Paused
import json | |
import cv2 | |
import numpy as np | |
import os | |
from torch.utils.data import Dataset | |
from PIL import Image | |
import cv2 | |
from .data_utils import * | |
from .base import BaseDataset | |
class DreamBoothDataset(BaseDataset): | |
def __init__(self, fg_dir, bg_dir): | |
self.bg_dir = bg_dir | |
bg_data = os.listdir(self.bg_dir) | |
self.bg_data = [i for i in bg_data if 'mask' in i] | |
self.image_dir = fg_dir | |
self.data = os.listdir(self.image_dir) | |
self.size = (512,512) | |
self.clip_size = (224,224) | |
''' | |
Dynamic: | |
0: Static View, High Quality | |
1: Multi-view, Low Quality | |
2: Multi-view, High Quality | |
''' | |
self.dynamic = 1 | |
def __len__(self): | |
return len(self.data) | |
def __getitem__(self, idx): | |
idx = np.random.randint(0, len(self.data)-1) | |
item = self.get_sample(idx) | |
return item | |
def check_region_size(self, image, yyxx, ratio, mode = 'max'): | |
pass_flag = True | |
H,W = image.shape[0], image.shape[1] | |
H,W = H * ratio, W * ratio | |
y1,y2,x1,x2 = yyxx | |
h,w = y2-y1,x2-x1 | |
if mode == 'max': | |
if h > H and w > W: | |
pass_flag = False | |
elif mode == 'min': | |
if h < H and w < W: | |
pass_flag = False | |
return pass_flag | |
def get_alpha_mask(self, mask_path): | |
image = cv2.imread( mask_path, cv2.IMREAD_UNCHANGED) | |
mask = (image[:,:,-1] > 128).astype(np.uint8) | |
return mask | |
def get_sample(self, idx): | |
dir_name = self.data[idx] | |
dir_path = os.path.join(self.image_dir, dir_name) | |
images = os.listdir(dir_path) | |
image_name = [i for i in images if '.png' in i][0] | |
image_path = os.path.join(dir_path, image_name) | |
image = cv2.imread( image_path, cv2.IMREAD_UNCHANGED) | |
mask = (image[:,:,-1] > 128).astype(np.uint8) | |
image = image[:,:,:-1] | |
image = cv2.cvtColor(image.copy(), cv2.COLOR_BGR2RGB) | |
ref_image = image | |
ref_mask = mask | |
ref_image, ref_mask = expand_image_mask(image, mask, ratio=1.4) | |
bg_idx = np.random.randint(0, len(self.bg_data)-1) | |
tar_mask_name = self.bg_data[bg_idx] | |
tar_mask_path = os.path.join(self.bg_dir, tar_mask_name) | |
tar_image_path = tar_mask_path.replace('_mask','_GT') | |
tar_image = cv2.imread(tar_image_path).astype(np.uint8) | |
tar_image = cv2.cvtColor(tar_image, cv2.COLOR_BGR2RGB) | |
tar_mask = (cv2.imread(tar_mask_path) > 128).astype(np.uint8)[:,:,0] | |
item_with_collage = self.process_pairs(ref_image, ref_mask, tar_image, tar_mask) | |
sampled_time_steps = self.sample_timestep() | |
item_with_collage['time_steps'] = sampled_time_steps | |
return item_with_collage | |