IOPaint/iopaint/model/anytext/utils.py

import os
import datetime
import cv2
import numpy as np
from PIL import Image, ImageDraw


def save_images(img_list, folder):
    if not os.path.exists(folder):
        os.makedirs(folder)
    now = datetime.datetime.now()
    date_str = now.strftime("%Y-%m-%d")
    folder_path = os.path.join(folder, date_str)
    if not os.path.exists(folder_path):
        os.makedirs(folder_path)
    time_str = now.strftime("%H_%M_%S")
    for idx, img in enumerate(img_list):
        image_number = idx + 1
        filename = f"{time_str}_{image_number}.jpg"
        save_path = os.path.join(folder_path, filename)
        cv2.imwrite(save_path, img[..., ::-1])


def check_channels(image):
    channels = image.shape[2] if len(image.shape) == 3 else 1
    if channels == 1:
        image = cv2.cvtColor(image, cv2.COLOR_GRAY2BGR)
    elif channels > 3:
        image = image[:, :, :3]
    return image


def resize_image(img, max_length=768):
    height, width = img.shape[:2]
    max_dimension = max(height, width)

    if max_dimension > max_length:
        scale_factor = max_length / max_dimension
        new_width = int(round(width * scale_factor))
        new_height = int(round(height * scale_factor))
        new_size = (new_width, new_height)
        img = cv2.resize(img, new_size)
    height, width = img.shape[:2]
    img = cv2.resize(img, (width - (width % 64), height - (height % 64)))
    return img


def insert_spaces(string, nSpace):
    if nSpace == 0:
        return string
    new_string = ""
    for char in string:
        new_string += char + " " * nSpace
    return new_string[:-nSpace]


def draw_glyph(font, text):
    g_size = 50
    W, H = (512, 80)
    new_font = font.font_variant(size=g_size)
    img = Image.new(mode="1", size=(W, H), color=0)
    draw = ImageDraw.Draw(img)
    left, top, right, bottom = new_font.getbbox(text)
    text_width = max(right - left, 5)
    text_height = max(bottom - top, 5)
    ratio = min(W * 0.9 / text_width, H * 0.9 / text_height)
    new_font = font.font_variant(size=int(g_size * ratio))

    text_width, text_height = new_font.getsize(text)
    offset_x, offset_y = new_font.getoffset(text)
    x = (img.width - text_width) // 2
    y = (img.height - text_height) // 2 - offset_y // 2
    draw.text((x, y), text, font=new_font, fill="white")
    img = np.expand_dims(np.array(img), axis=2).astype(np.float64)
    return img


def draw_glyph2(
    font, text, polygon, vertAng=10, scale=1, width=512, height=512, add_space=True
):
    enlarge_polygon = polygon * scale
    rect = cv2.minAreaRect(enlarge_polygon)
    box = cv2.boxPoints(rect)
    box = np.int0(box)
    w, h = rect[1]
    angle = rect[2]
    if angle < -45:
        angle += 90
    angle = -angle
    if w < h:
        angle += 90

    vert = False
    if abs(angle) % 90 < vertAng or abs(90 - abs(angle) % 90) % 90 < vertAng:
        _w = max(box[:, 0]) - min(box[:, 0])
        _h = max(box[:, 1]) - min(box[:, 1])
        if _h >= _w:
            vert = True
            angle = 0

    img = np.zeros((height * scale, width * scale, 3), np.uint8)
    img = Image.fromarray(img)

    # infer font size
    image4ratio = Image.new("RGB", img.size, "white")
    draw = ImageDraw.Draw(image4ratio)
    _, _, _tw, _th = draw.textbbox(xy=(0, 0), text=text, font=font)
    text_w = min(w, h) * (_tw / _th)
    if text_w <= max(w, h):
        # add space
        if len(text) > 1 and not vert and add_space:
            for i in range(1, 100):
                text_space = insert_spaces(text, i)
                _, _, _tw2, _th2 = draw.textbbox(xy=(0, 0), text=text_space, font=font)
                if min(w, h) * (_tw2 / _th2) > max(w, h):
                    break
            text = insert_spaces(text, i - 1)
        font_size = min(w, h) * 0.80
    else:
        shrink = 0.75 if vert else 0.85
        font_size = min(w, h) / (text_w / max(w, h)) * shrink
    new_font = font.font_variant(size=int(font_size))

    left, top, right, bottom = new_font.getbbox(text)
    text_width = right - left
    text_height = bottom - top

    layer = Image.new("RGBA", img.size, (0, 0, 0, 0))
    draw = ImageDraw.Draw(layer)
    if not vert:
        draw.text(
            (rect[0][0] - text_width // 2, rect[0][1] - text_height // 2 - top),
            text,
            font=new_font,
            fill=(255, 255, 255, 255),
        )
    else:
        x_s = min(box[:, 0]) + _w // 2 - text_height // 2
        y_s = min(box[:, 1])
        for c in text:
            draw.text((x_s, y_s), c, font=new_font, fill=(255, 255, 255, 255))
            _, _t, _, _b = new_font.getbbox(c)
            y_s += _b

    rotated_layer = layer.rotate(angle, expand=1, center=(rect[0][0], rect[0][1]))

    x_offset = int((img.width - rotated_layer.width) / 2)
    y_offset = int((img.height - rotated_layer.height) / 2)
    img.paste(rotated_layer, (x_offset, y_offset), rotated_layer)
    img = np.expand_dims(np.array(img.convert("1")), axis=2).astype(np.float64)
    return img
anytext init 2024-01-21 05:30:49 +01:00			`import os`
			`import datetime`
			`import cv2`
			`import numpy as np`
			`from PIL import Image, ImageDraw`


			`def save_images(img_list, folder):`
			`if not os.path.exists(folder):`
			`os.makedirs(folder)`
			`now = datetime.datetime.now()`
			`date_str = now.strftime("%Y-%m-%d")`
			`folder_path = os.path.join(folder, date_str)`
			`if not os.path.exists(folder_path):`
			`os.makedirs(folder_path)`
			`time_str = now.strftime("%H_%M_%S")`
			`for idx, img in enumerate(img_list):`
			`image_number = idx + 1`
			`filename = f"{time_str}_{image_number}.jpg"`
			`save_path = os.path.join(folder_path, filename)`
			`cv2.imwrite(save_path, img[..., ::-1])`


			`def check_channels(image):`
			`channels = image.shape[2] if len(image.shape) == 3 else 1`
			`if channels == 1:`
			`image = cv2.cvtColor(image, cv2.COLOR_GRAY2BGR)`
			`elif channels > 3:`
			`image = image[:, :, :3]`
			`return image`


			`def resize_image(img, max_length=768):`
			`height, width = img.shape[:2]`
			`max_dimension = max(height, width)`

			`if max_dimension > max_length:`
			`scale_factor = max_length / max_dimension`
			`new_width = int(round(width * scale_factor))`
			`new_height = int(round(height * scale_factor))`
			`new_size = (new_width, new_height)`
			`img = cv2.resize(img, new_size)`
			`height, width = img.shape[:2]`
			`img = cv2.resize(img, (width - (width % 64), height - (height % 64)))`
			`return img`


			`def insert_spaces(string, nSpace):`
			`if nSpace == 0:`
			`return string`
			`new_string = ""`
			`for char in string:`
			`new_string += char + " " * nSpace`
			`return new_string[:-nSpace]`


			`def draw_glyph(font, text):`
			`g_size = 50`
			`W, H = (512, 80)`
			`new_font = font.font_variant(size=g_size)`
			`img = Image.new(mode="1", size=(W, H), color=0)`
			`draw = ImageDraw.Draw(img)`
			`left, top, right, bottom = new_font.getbbox(text)`
			`text_width = max(right - left, 5)`
			`text_height = max(bottom - top, 5)`
			`ratio = min(W * 0.9 / text_width, H * 0.9 / text_height)`
			`new_font = font.font_variant(size=int(g_size * ratio))`

			`text_width, text_height = new_font.getsize(text)`
			`offset_x, offset_y = new_font.getoffset(text)`
			`x = (img.width - text_width) // 2`
			`y = (img.height - text_height) // 2 - offset_y // 2`
			`draw.text((x, y), text, font=new_font, fill="white")`
			`img = np.expand_dims(np.array(img), axis=2).astype(np.float64)`
			`return img`


			`def draw_glyph2(`
			`font, text, polygon, vertAng=10, scale=1, width=512, height=512, add_space=True`
			`):`
			`enlarge_polygon = polygon * scale`
			`rect = cv2.minAreaRect(enlarge_polygon)`
			`box = cv2.boxPoints(rect)`
			`box = np.int0(box)`
			`w, h = rect[1]`
			`angle = rect[2]`
			`if angle < -45:`
			`angle += 90`
			`angle = -angle`
			`if w < h:`
			`angle += 90`

			`vert = False`
			`if abs(angle) % 90 < vertAng or abs(90 - abs(angle) % 90) % 90 < vertAng:`
			`_w = max(box[:, 0]) - min(box[:, 0])`
			`_h = max(box[:, 1]) - min(box[:, 1])`
			`if _h >= _w:`
			`vert = True`
			`angle = 0`

			`img = np.zeros((height * scale, width * scale, 3), np.uint8)`
			`img = Image.fromarray(img)`

			`# infer font size`
			`image4ratio = Image.new("RGB", img.size, "white")`
			`draw = ImageDraw.Draw(image4ratio)`
			`_, _, _tw, _th = draw.textbbox(xy=(0, 0), text=text, font=font)`
			`text_w = min(w, h) * (_tw / _th)`
			`if text_w <= max(w, h):`
			`# add space`
			`if len(text) > 1 and not vert and add_space:`
			`for i in range(1, 100):`
			`text_space = insert_spaces(text, i)`
			`_, _, _tw2, _th2 = draw.textbbox(xy=(0, 0), text=text_space, font=font)`
			`if min(w, h) * (_tw2 / _th2) > max(w, h):`
			`break`
			`text = insert_spaces(text, i - 1)`
			`font_size = min(w, h) * 0.80`
			`else:`
			`shrink = 0.75 if vert else 0.85`
			`font_size = min(w, h) / (text_w / max(w, h)) * shrink`
			`new_font = font.font_variant(size=int(font_size))`

			`left, top, right, bottom = new_font.getbbox(text)`
			`text_width = right - left`
			`text_height = bottom - top`

			`layer = Image.new("RGBA", img.size, (0, 0, 0, 0))`
			`draw = ImageDraw.Draw(layer)`
			`if not vert:`
			`draw.text(`
			`(rect[0][0] - text_width // 2, rect[0][1] - text_height // 2 - top),`
			`text,`
			`font=new_font,`
			`fill=(255, 255, 255, 255),`
			`)`
			`else:`
			`x_s = min(box[:, 0]) + _w // 2 - text_height // 2`
			`y_s = min(box[:, 1])`
			`for c in text:`
			`draw.text((x_s, y_s), c, font=new_font, fill=(255, 255, 255, 255))`
			`_, _t, _, _b = new_font.getbbox(c)`
			`y_s += _b`

			`rotated_layer = layer.rotate(angle, expand=1, center=(rect[0][0], rect[0][1]))`

			`x_offset = int((img.width - rotated_layer.width) / 2)`
			`y_offset = int((img.height - rotated_layer.height) / 2)`
			`img.paste(rotated_layer, (x_offset, y_offset), rotated_layer)`
			`img = np.expand_dims(np.array(img.convert("1")), axis=2).astype(np.float64)`
			`return img`