IOPaint/lama_cleaner/helper.py

125 lines
3.4 KiB
Python
Raw Normal View History

2021-11-15 08:22:34 +01:00
import os
import sys
2022-03-23 03:02:01 +01:00
from typing import List
2021-11-15 08:22:34 +01:00
from urllib.parse import urlparse
import cv2
import numpy as np
import torch
from torch.hub import download_url_to_file, get_dir
2022-03-04 06:44:53 +01:00
def download_model(url):
    """Return the local path of the model at *url*, downloading it if needed.

    The file is cached under ``<torch hub dir>/checkpoints`` using the last
    path component of the URL as the file name. If a file with that name is
    already present, no download takes place.

    Args:
        url: Location of the model file.

    Returns:
        Path of the cached model file.
    """
    parts = urlparse(url)
    model_dir = os.path.join(get_dir(), "checkpoints")
    # Create exactly the checkpoint directory. The previous code created
    # "<model_dir>/hub/checkpoints", leaving a stray nested tree in the cache.
    # exist_ok also covers the directory appearing between check and create.
    os.makedirs(model_dir, exist_ok=True)

    filename = os.path.basename(parts.path)
    cached_file = os.path.join(model_dir, filename)
    if not os.path.exists(cached_file):
        sys.stderr.write('Downloading: "{}" to {}\n'.format(url, cached_file))
        # No hash prefix is supplied, so the download is not checksum-verified.
        download_url_to_file(url, cached_file, hash_prefix=None, progress=True)
    return cached_file
def ceil_modulo(x, mod):
    """Round *x* up to the nearest multiple of *mod*.

    Values that are already a multiple of *mod* are returned unchanged.
    """
    quotient, remainder = divmod(x, mod)
    if remainder:
        return (quotient + 1) * mod
    return x
2022-04-09 01:23:33 +02:00
def numpy_to_bytes(image_numpy: np.ndarray, ext: str) -> bytes:
    """Encode an image array into the bytes of an image file.

    Args:
        image_numpy: Image array handed to ``cv2.imencode``.
        ext: Target file extension without the leading dot (e.g. ``"png"``).

    Returns:
        The encoded image as raw bytes.
    """
    # Both settings are always passed: JPEG quality 100, PNG compression 0.
    encode_params = [
        int(cv2.IMWRITE_JPEG_QUALITY), 100,
        int(cv2.IMWRITE_PNG_COMPRESSION), 0,
    ]
    _, encoded = cv2.imencode(f".{ext}", image_numpy, encode_params)
    return encoded.tobytes()
def load_img(img_bytes, gray: bool = False):
    """Decode encoded image bytes into a numpy array.

    Args:
        img_bytes: Encoded image file content (bytes-like).
        gray: When true, decode as a single-channel grayscale image.

    Returns:
        A tuple ``(np_img, alpha_channel)``. With ``gray=True`` the image is
        the 2-D grayscale array from ``cv2.imdecode``. Otherwise it is
        converted to RGB channel order. ``alpha_channel`` is the last channel
        of a 4-channel image, or ``None`` when the image has no alpha channel
        or ``gray`` is set.

    Raises:
        ValueError: If the bytes cannot be decoded as an image.
    """
    alpha_channel = None
    nparr = np.frombuffer(img_bytes, np.uint8)
    read_flag = cv2.IMREAD_GRAYSCALE if gray else cv2.IMREAD_UNCHANGED
    np_img = cv2.imdecode(nparr, read_flag)
    if np_img is None:
        # imdecode signals undecodable data by returning None; fail with a
        # clear message instead of an AttributeError further down.
        raise ValueError("Failed to decode image bytes")

    if gray:
        return np_img, alpha_channel

    if np_img.ndim == 2:
        # IMREAD_UNCHANGED keeps single-channel files 2-D; BGR2RGB would
        # reject them, so expand gray to three channels explicitly.
        np_img = cv2.cvtColor(np_img, cv2.COLOR_GRAY2RGB)
    elif np_img.shape[2] == 4:
        # Keep the alpha plane before the colour conversion drops it.
        alpha_channel = np_img[:, :, -1]
        np_img = cv2.cvtColor(np_img, cv2.COLOR_BGRA2RGB)
    else:
        np_img = cv2.cvtColor(np_img, cv2.COLOR_BGR2RGB)
    return np_img, alpha_channel
2021-11-15 08:22:34 +01:00
def norm_img(np_img):
    """Convert an image array to channel-first float32 scaled by 1/255.

    A 2-D input gets a trailing channel axis first, so the result always has
    three dimensions ordered (channel, row, column).
    """
    hwc = np_img[:, :, np.newaxis] if len(np_img.shape) == 2 else np_img
    chw = np.transpose(hwc, (2, 0, 1))
    return chw.astype("float32") / 255
def resize_max_size(
    np_img, size_limit: int, interpolation=cv2.INTER_CUBIC
) -> np.ndarray:
    """Shrink an image so that its longer side is at most *size_limit*.

    Args:
        np_img: Image array whose first two dimensions are height and width.
        size_limit: Maximum allowed length of the longer side, in pixels.
        interpolation: OpenCV interpolation flag passed to ``cv2.resize``.

    Returns:
        The input array unchanged when its longer side is already within
        *size_limit*; otherwise a resized copy with the aspect ratio kept
        (up to rounding).
    """
    h, w = np_img.shape[:2]
    longer_side = max(h, w)
    if longer_side <= size_limit:
        return np_img

    ratio = size_limit / longer_side
    # Round to nearest, but never below one pixel: for very elongated images
    # the shorter side would otherwise round to 0 and cv2.resize would fail.
    new_w = max(1, int(w * ratio + 0.5))
    new_h = max(1, int(h * ratio + 0.5))
    return cv2.resize(np_img, dsize=(new_w, new_h), interpolation=interpolation)
2022-04-15 18:11:51 +02:00
def pad_img_to_modulo(img: np.ndarray, mod: int):
    """Pad an image so that height and width are multiples of *mod*.

    Args:
        img: Image of shape [H, W, C]; a 2-D [H, W] array gets a trailing
            channel axis added first.
        mod: Value that the padded height and width must be divisible by.

    Returns:
        The image padded at the bottom and right edges using numpy's
        "symmetric" mode; the channel axis is not padded.
    """
    if len(img.shape) == 2:
        img = img[:, :, np.newaxis]
    height, width = img.shape[:2]
    pad_bottom = ceil_modulo(height, mod) - height
    pad_right = ceil_modulo(width, mod) - width
    pad_widths = ((0, pad_bottom), (0, pad_right), (0, 0))
    return np.pad(img, pad_widths, mode="symmetric")
2022-03-23 03:02:01 +01:00
def boxes_from_mask(mask: np.ndarray) -> List[np.ndarray]:
    """Compute bounding boxes of the connected regions in a mask.

    Args:
        mask: (h, w, 1) 0~255

    Returns:
        One integer array ``[x_min, y_min, x_max, y_max]`` per external
        contour found in the mask after thresholding at 127, with the
        coordinates clipped to the mask width and height.
    """
    height, width = mask.shape[:2]
    _, thresh = cv2.threshold(mask, 127, 255, cv2.THRESH_BINARY)
    contours, _ = cv2.findContours(thresh, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

    boxes = []
    for cnt in contours:
        x, y, w, h = cv2.boundingRect(cnt)
        # Builtin int instead of the np.int alias, which was removed in
        # NumPy 1.24 and raises AttributeError there.
        box = np.array([x, y, x + w, y + h]).astype(int)
        box[::2] = np.clip(box[::2], 0, width)    # x coordinates
        box[1::2] = np.clip(box[1::2], 0, height)  # y coordinates
        boxes.append(box)
    return boxes