mangaaa / dataset /datasets.py
Keiser41's picture
Update dataset/datasets.py
a78fa78
raw
history blame contribute delete
No virus
4.4 kB
import torch
import os
import torchvision.transforms as transforms
import matplotlib.pyplot as plt
import numpy as np
from utils.utils import generate_mask
class TrainDataset(torch.utils.data.Dataset):
def __init__(self, data_path, transform=None, mults_amount=1):
self.data = os.listdir(os.path.join(data_path, "color"))
self.data_path = data_path
self.transform = transform
self.mults_amount = mults_amount
self.ToTensor = transforms.ToTensor()
def __len__(self):
return len(self.data)
def __getitem__(self, idx):
image_name = self.data[idx]
try:
color_img = plt.imread(os.path.join(self.data_path, 'color', image_name))
except SyntaxError:
print(f"Archivo {image_name} no es un PNG válido. Saltando...")
return None # O alguna otra acción que prefieras
if self.mults_amount > 1:
mult_number = np.random.choice(range(self.mults_amount))
bw_name = (
image_name[: image_name.rfind(".")] + "_" + str(mult_number) + ".png"
)
dfm_name = (
image_name[: image_name.rfind(".")]
+ "_"
+ str(mult_number)
+ "_dfm.png"
)
else:
bw_name = self.data[idx]
dfm_name = os.path.splitext(self.data[idx])[0] + "0_dfm.png"
bw_img = np.expand_dims(
plt.imread(os.path.join(self.data_path, "bw", bw_name)), 2
)
dfm_img = np.expand_dims(
plt.imread(os.path.join(self.data_path, "bw", dfm_name)), 2
)
bw_img = np.concatenate([bw_img, dfm_img], axis=2)
if self.transform:
result = self.transform(image=color_img, mask=bw_img)
color_img = result["image"]
bw_img = result["mask"]
dfm_img = bw_img[:, :, 1]
bw_img = bw_img[:, :, 0]
color_img = self.ToTensor(color_img)
bw_img = self.ToTensor(bw_img)
dfm_img = self.ToTensor(dfm_img)
color_img = (color_img - 0.5) / 0.5
mask = generate_mask(bw_img.shape[1], bw_img.shape[2])
hint = torch.cat((color_img * mask, mask), 0)
return bw_img, color_img, hint, dfm_img
class FineTuningDataset(torch.utils.data.Dataset):
def __init__(self, data_path, transform=None, mult_amount=1):
self.data = [
x
for x in os.listdir(os.path.join(data_path, "real_manga"))
if x.find("_dfm") == -1
]
self.color_data = [x for x in os.listdir(os.path.join(data_path, "color"))]
self.data_path = data_path
self.transform = transform
self.mults_amount = mult_amount
np.random.shuffle(self.color_data)
self.ToTensor = transforms.ToTensor()
def __len__(self):
return len(self.data)
def __getitem__(self, idx):
color_img = plt.imread(
os.path.join(self.data_path, "color", self.color_data[idx])
)
image_name = self.data[idx]
if self.mults_amount > 1:
mult_number = np.random.choice(range(self.mults_amount))
bw_name = (
image_name[: image_name.rfind(".")]
+ "_"
+ str(self.mults_amount)
+ ".png"
)
dfm_name = (
image_name[: image_name.rfind(".")]
+ "_"
+ str(self.mults_amount)
+ "_dfm.png"
)
else:
bw_name = self.data[idx]
dfm_name = os.path.splitext(self.data[idx])[0] + "_dfm.png"
bw_img = np.expand_dims(
plt.imread(os.path.join(self.data_path, "real_manga", image_name)), 2
)
dfm_img = np.expand_dims(
plt.imread(os.path.join(self.data_path, "real_manga", dfm_name)), 2
)
if self.transform:
result = self.transform(image=color_img)
color_img = result["image"]
result = self.transform(image=bw_img, mask=dfm_img)
bw_img = result["image"]
dfm_img = result["mask"]
color_img = self.ToTensor(color_img)
bw_img = self.ToTensor(bw_img)
dfm_img = self.ToTensor(dfm_img)
color_img = (color_img - 0.5) / 0.5
return bw_img, dfm_img, color_img