SAFMN / app.py
Meloo's picture
Update app.py
54d5611 verified
raw
history blame
7.39 kB
import os
import cv2
import argparse
import glob
import numpy as np
import os
import torch
import torch.nn.functional as F
import gradio as gr
from PIL import Image
from utils.download_url import load_file_from_url
from utils.color_fix import wavelet_reconstruction
from models.safmn_arch import SAFMN
from gradio_imageslider import ImageSlider
pretrain_model_url = {
'safmn_x2': 'https://github.com/sunny2109/SAFMN/releases/download/v0.1.0/SAFMN_L_Real_LSDIR_x2-v2.pth',
'safmn_x4': 'https://github.com/sunny2109/SAFMN/releases/download/v0.1.0/SAFMN_L_Real_LSDIR_x4-v2.pth',
}
# download weights
if not os.path.exists('pretrained_models/SAFMN_L_Real_LSDIR_x2-v2.pth'):
load_file_from_url(url=pretrain_model_url['safmn_x2'], model_dir='./pretrained_models/', progress=True, file_name=None)
if not os.path.exists('pretrained_models/SAFMN_L_Real_LSDIR_x4-v2.pth'):
load_file_from_url(url=pretrain_model_url['safmn_x4'], model_dir='./pretrained_models/', progress=True, file_name=None)
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
def set_safmn(upscale):
model = SAFMN(dim=128, n_blocks=16, ffn_scale=2.0, upscaling_factor=upscale)
if upscale == 2:
model_path = 'pretrained_models/SAFMN_L_Real_LSDIR_x2-v2.pth'
elif upscale == 4:
model_path = 'pretrained_models/SAFMN_L_Real_LSDIR_x4-v2.pth'
else:
raise NotImplementedError('Only support x2/x4 upscaling!')
model.load_state_dict(torch.load(model_path, weights_only=True)['params'], strict=True)
model.eval()
return model.to(device)
def img2patch(lq, scale=4, crop_size=512):
b, c, hl, wl = lq.size()
h, w = hl*scale, wl*scale
sr_size = (b, c, h, w)
assert b == 1
crop_size_h, crop_size_w = crop_size // scale * scale, crop_size // scale * scale
#adaptive step_i, step_j
num_row = (h - 1) // crop_size_h + 1
num_col = (w - 1) // crop_size_w + 1
import math
step_j = crop_size_w if num_col == 1 else math.ceil((w - crop_size_w) / (num_col - 1) - 1e-8)
step_i = crop_size_h if num_row == 1 else math.ceil((h - crop_size_h) / (num_row - 1) - 1e-8)
step_i = step_i // scale * scale
step_j = step_j // scale * scale
parts = []
idxes = []
i = 0 # 0~h-1
last_i = False
while i < h and not last_i:
j = 0
if i + crop_size_h >= h:
i = h - crop_size_h
last_i = True
last_j = False
while j < w and not last_j:
if j + crop_size_w >= w:
j = w - crop_size_w
last_j = True
parts.append(lq[:, :, i // scale :(i + crop_size_h) // scale, j // scale:(j + crop_size_w) // scale])
idxes.append({'i': i, 'j': j})
j = j + step_j
i = i + step_i
return torch.cat(parts, dim=0), idxes, sr_size
def patch2img(outs, idxes, sr_size, scale=4, crop_size=512):
preds = torch.zeros(sr_size).to(outs.device)
b, c, h, w = sr_size
count_mt = torch.zeros((b, 1, h, w)).to(outs.device)
crop_size_h, crop_size_w = crop_size // scale * scale, crop_size // scale * scale
for cnt, each_idx in enumerate(idxes):
i = each_idx['i']
j = each_idx['j']
preds[0, :, i: i + crop_size_h, j: j + crop_size_w] += outs[cnt]
count_mt[0, 0, i: i + crop_size_h, j: j + crop_size_w] += 1.
return (preds / count_mt).to(outs.device)
def inference(image, upscale, large_input_flag, color_fix):
if upscale is None or not isinstance(upscale, (int, float)) or upscale == 3.:
upscale = 2
upscale = int(upscale)
model = set_safmn(upscale)
# img2tensor
y = np.array(image).astype(np.float32) / 255.
y = torch.from_numpy(np.transpose(y[:, :, [2, 1, 0]], (2, 0, 1))).float()
y = y.unsqueeze(0).to(device)
# inference
if large_input_flag:
patches, idx, size = img2patch(y, scale=upscale)
with torch.no_grad():
n = len(patches)
outs = []
m = 1
i = 0
while i < n:
j = i + m
if j >= n:
j = n
pred = output = model(patches[i:j])
if isinstance(pred, list):
pred = pred[-1]
outs.append(pred.detach())
i = j
output = torch.cat(outs, dim=0)
output = patch2img(output, idx, size, scale=upscale)
else:
with torch.no_grad():
output = model(y)
# color fix
if color_fix:
y = F.interpolate(y, scale_factor=upscale, mode='bilinear')
output = wavelet_reconstruction(output, y)
# tensor2img
output = output.data.squeeze().float().cpu().clamp_(0, 1).numpy()
if output.ndim == 3:
output = np.transpose(output[[2, 1, 0], :, :], (1, 2, 0))
output = (output * 255.0).round().astype(np.uint8)
# save results
save_path = './out.png'
cv2.imwrite(save_path, output[:, :, ::-1])
return (image, Image.fromarray(output)), save_path
title = "SAFMN for Real-world SR (running on CPU)"
description = ''' ### Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution - ICCV 2023
### [Long Sun](https://github.com/sunny2109), [Jiangxin Dong](https://scholar.google.com/citations?user=ruebFVEAAAAJ&hl=zh-CN&oi=ao), [Jinhui Tang](https://scholar.google.com/citations?user=ByBLlEwAAAAJ&hl=zh-CN), and [Jinshan Pan](https://jspan.github.io/)
### [IMAG Lab](https://imag-njust.net/), Nanjing University of Science and Technology
### Drag the slider on the super-resolution image left and right to see the changes in the image details.
### SAFMN performs x2/x4 upscaling on the input image. If the input image is larger than 720P, it is recommended to use Memory-efficient inference.
### If our work is useful for your research, please consider citing:
<br>
<code>
@inproceedings{sun2023safmn,
title={Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution},
author={Sun, Long and Dong, Jiangxin and Tang, Jinhui and Pan, Jinshan},
booktitle={ICCV},
year={2023}
}
</code>
<br>
'''
article = "<p style='text-align: center'><a href='https://github.com/sunny2109/SAFMN/tree/main' target='_blank'>Spatially-Adaptive Feature Modulation for Efficient Image Super-Resolution</a></p>"
#### Image examples
examples = [
['real_testdata/060.png'],
['real_testdata/004.png'],
['real_testdata/013.png'],
['real_testdata/014.png'],
['real_testdata/015.png'],
['real_testdata/021.png'],
['real_testdata/032.png'],
['real_testdata/045.png'],
['real_testdata/036.png'],
['real_testdata/058.png'],
]
css = """
.image-frame img, .image-container img {
width: auto;
height: auto;
max-width: none;
}
"""
demo = gr.Interface(
fn=inference,
inputs=[
gr.Image(value="real_testdata/060.png", type="pil", label="Input"),
gr.Number(minimum=2, maximum=4, label="Upscaling factor (up to 4)"),
gr.Checkbox(value=False, label="Memory-efficient inference"),
gr.Checkbox(value=False, label="Color correction"),
],
outputs = [
ImageSlider(label="Super-Resolved Image",
type="pil",
show_download_button=True,
),
gr.File(label="Download Output")
# gr.Image(
# label="Download Output",
# type='filepath',
# ),
],
title=title,
description=description,
article=article,
examples=examples,
css=css,
)
if __name__ == "__main__":
demo.launch()