Spaces:
Running
on
T4
Running
on
T4
from PIL import Image, ImageFont, ImageDraw | |
import random | |
# Resize so the height equals image_height first, then shrink or pad the width to image_width.
def resize_and_pad_image(pil_image, image_size):
    """Fit ``pil_image`` onto a canvas of exactly ``image_size``.

    The image is first scaled so its height matches the target height
    (aspect ratio preserved). If the result is wider than the target width
    it is squeezed horizontally to fit; if it is narrower it is pasted,
    horizontally centred, onto a white RGB canvas of the target size.

    Args:
        pil_image: Source image; it must expose ``size`` and ``resize`` the
            way ``PIL.Image.Image`` does.
        image_size: Either a single int (square target) or a two-element
            ``(width, height)`` list/tuple.

    Returns:
        The resized (and possibly padded) image.

    Raises:
        ValueError: If ``image_size`` is neither an int nor a two-element
            list/tuple, or if a target dimension is not positive.
    """
    if isinstance(image_size, (tuple, list)) and len(image_size) == 2:
        image_width, image_height = image_size
    elif isinstance(image_size, int):
        image_width = image_height = image_size
    else:
        raise ValueError(f"Image size should be int or list/tuple of int not {image_size}")

    # Fail fast: a zero/negative target would otherwise surface later as an
    # unrelated error from inside the resize calls.
    if image_width <= 0 or image_height <= 0:
        raise ValueError(f"Image size must be positive, got {image_size}")

    # Cheap box-filter halving while the source is at least twice too tall.
    # The width is clamped to 1 so very narrow images never hit a 0-px resize.
    while pil_image.size[1] >= 2 * image_height:
        pil_image = pil_image.resize(
            tuple(max(1, x // 2) for x in pil_image.size), resample=Image.BOX
        )

    # Final bicubic pass that brings the height to exactly image_height.
    scale = image_height / pil_image.size[1]
    pil_image = pil_image.resize(
        tuple(max(1, round(x * scale)) for x in pil_image.size),
        resample=Image.BICUBIC,
    )

    current_width = pil_image.size[0]
    if current_width > image_width:
        # Too wide: squeeze horizontally (aspect ratio is not preserved here).
        pil_image = pil_image.resize((image_width, image_height), resample=Image.BICUBIC)
    elif current_width < image_width:
        # Too narrow: centre on a white canvas of the target size.
        canvas = Image.new(mode="RGB", size=(image_width, image_height), color="white")
        canvas.paste(pil_image, ((image_width - current_width) // 2, 0))
        pil_image = canvas
    return pil_image
def _split_into_rows(text, num_rows):
    """Break ``text`` into at most ``num_rows`` lines at random word boundaries."""
    words = text.split()
    if num_rows <= 1 or not words:
        return text
    num_words = len(words)
    if num_words > num_rows:
        # Pick num_rows - 1 interior cut points and always finish on the last
        # word, so every word is kept and exactly num_rows lines are produced.
        cuts = sorted(random.sample(range(1, num_words), num_rows - 1))
        cuts.append(num_words)
    else:
        # Not enough words to fill the rows: one word per line.
        cuts = list(range(1, num_words + 1))
    return "\n".join(
        " ".join(words[start:stop]) for start, stop in zip([0, *cuts], cuts)
    )


def render_text_image_custom(image_size, bboxes, rendered_txt_values, num_rows_values, align = "center"):
    """Render black text onto a white image, one text per entry in ``bboxes``.

    Each text is drawn with the Calibri font ("calibri.ttf"), fitted to its
    box via ``resize_and_pad_image``, rotated and pasted onto the background.

    Args:
        image_size: ``(width, height)`` of the output image, passed to
            ``Image.new``.
        bboxes: One mapping per text with keys ``'width'``, ``'top_left_x'``,
            ``'top_left_y'``, ``'yaw'`` and optionally ``'ratio'``
            (width / height of the box). The position and width values are
            multiplied by the image dimensions, so they are presumably
            fractions of the image size. ``'yaw'`` is negated and passed to
            ``Image.rotate``.
        rendered_txt_values: The texts to render; entries that are empty
            after stripping whitespace are skipped.
        num_rows_values: Number of lines per text. Values other than 1 break
            the text at randomly chosen word boundaries.
        align: Multi-line alignment forwarded to ``ImageDraw.text``
            ("center", "left" or "right").

    Returns:
        The RGB background image with all texts pasted on it.
    """
    print(image_size, bboxes, rendered_txt_values, num_rows_values, align)
    background = Image.new("RGB", image_size, "white")
    font = ImageFont.truetype("calibri.ttf", encoding='utf-8', size=512)
    # Scratch drawing context used only to measure text.
    measure = ImageDraw.Draw(Image.new("RGB", (1, 1), "white"))

    for text, bbox, num_rows in zip(rendered_txt_values, bboxes, num_rows_values):
        # Strip before the emptiness check so whitespace-only text is skipped
        # instead of producing a zero-sized bounding box further down.
        text = text.strip()
        if not text:
            continue
        text = _split_into_rows(text, num_rows)

        left, top, right, bottom = measure.textbbox(xy=(0, 0), text=text, font=font)
        if right <= 0 or bottom <= 0:
            # Nothing measurable to draw.
            continue

        # Use the box's own aspect ratio when it is given and non-degenerate,
        # otherwise fall back to the ratio of the rendered text.
        if 'ratio' in bbox and bbox['ratio'] >= 1e-4:
            ratio = bbox['ratio']
        else:
            ratio = right / bottom

        # NOTE(review): the width is scaled by image_size[1] (the height)
        # while top_left_x uses image_size[0]; identical for square images -
        # confirm this is intended for non-square ones.
        width = int(bbox['width'] * image_size[1])
        height = int(width / ratio)
        if width <= 0 or height <= 0:
            # A zero-area box cannot show any text; skip it rather than abort
            # the whole render.
            continue
        top_left_x = int(bbox['top_left_x'] * image_size[0])
        top_left_y = int(bbox['top_left_y'] * image_size[1])
        yaw = bbox['yaw']

        # The canvas spans (0, 0)..(right, bottom); shifting the text by half
        # of the bbox offset splits that offset evenly between both sides.
        text_image = Image.new("RGB", (right, bottom), "white")
        ImageDraw.Draw(text_image).text(
            (-left / 2, -top / 2), text, "black", font=font, align=align
        )
        text_image = resize_and_pad_image(text_image, (width, height))
        text_image = text_image.rotate(angle=-yaw, expand=True, fillcolor="white")

        background.paste(text_image, (top_left_x, top_left_y))

    return background