Spaces:
Sleeping
Sleeping
File size: 3,372 Bytes
a1739b9 0297809 a1739b9 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 |
from PIL import Image
import cv2
import numpy as np
import os
import tempfile
def resize(img, size):
assert img.dtype == np.uint8
pil_image = Image.fromarray(img)
pil_image = pil_image.resize(size, Image.LANCZOS)
resized_img = np.array(pil_image)
return resized_img
def crop(img, start_h, start_w, crop_h, crop_w):
img_src = np.zeros((crop_h, crop_w, *img.shape[2:]), dtype=img.dtype)
hsize, wsize = crop_h, crop_w
dh, dw, sh, sw = start_h, start_w, 0, 0
if dh < 0:
sh = -dh
hsize += dh
dh = 0
if dh + hsize > img.shape[0]:
hsize = img.shape[0] - dh
if dw < 0:
sw = -dw
wsize += dw
dw = 0
if dw + wsize > img.shape[1]:
wsize = img.shape[1] - dw
img_src[sh : sh + hsize, sw : sw + wsize] = img[dh : dh + hsize, dw : dw + wsize]
return img_src
def imresize_max(img, size, min_side=False):
new_img = []
for i, _img in enumerate(img):
h, w = _img.shape[:2]
ori_size = min(h, w) if min_side else max(h, w)
_resize = min(size / ori_size, 1.0)
new_size = (int(w * _resize), int(h * _resize))
new_img.append(resize(_img, new_size))
return new_img
def imcrop_multi(img, multiple=32):
new_img = []
for i, _img in enumerate(img):
crop_size = (
_img.shape[0] // multiple * multiple,
_img.shape[1] // multiple * multiple,
)
start_h = int(0.5 * max(0, _img.shape[0] - crop_size[0]))
start_w = int(0.5 * max(0, _img.shape[1] - crop_size[1]))
_img_src = crop(_img, start_h, start_w, crop_size[0], crop_size[1])
new_img.append(_img_src)
return new_img
def read_video(video_path, max_frames=None):
cap = cv2.VideoCapture(video_path)
fps = cap.get(cv2.CAP_PROP_FPS)
frames = []
count = 0
while True:
ret, frame = cap.read()
if not ret:
break
frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
frames.append(frame)
count += 1
if max_frames is not None and count >= max_frames:
break
cap.release()
# (N, H, W, 3)
return frames, fps
def read_image(image_path):
frame = cv2.imread(image_path)
frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
# (1, H, W, 3)
return [frame]
def write_video(video_path, frames, fps):
# tmp_dir = os.path.join(os.path.dirname(video_path), "tmp")
# os.makedirs(tmp_dir, exist_ok=True)
# for i, frame in enumerate(frames):
# write_image(os.path.join(tmp_dir, f"{i:06d}.png"), frame)
# # it will cause visual compression artifacts
# ffmpeg_command = [
# "ffmpeg",
# "-f",
# "image2",
# "-framerate",
# f"{fps}",
# "-i",
# os.path.join(tmp_dir, "%06d.png"),
# "-b:v",
# "5626k",
# "-y",
# video_path,
# ]
# os.system(" ".join(ffmpeg_command))
# os.system(f"rm -rf {tmp_dir}")
h, w = frames[0].shape[:2]
fourcc = cv2.VideoWriter_fourcc(*"mp4v")
out = cv2.VideoWriter(video_path, fourcc, fps, (w, h))
for frame in frames:
frame = cv2.cvtColor(frame, cv2.COLOR_RGB2BGR)
out.write(frame)
out.release()
def write_image(image_path, frame):
frame = cv2.cvtColor(frame, cv2.COLOR_RGB2BGR)
cv2.imwrite(image_path, frame)
|