GlyphControl / annotator /render_images.py
yyk19's picture
first trial
0902a5f
raw
history blame
3.88 kB
from PIL import Image, ImageFont, ImageDraw
import random
# resize height to image_height first, then shrink or pad to image_width
def resize_and_pad_image(pil_image, image_size):
if isinstance(image_size, (tuple, list)) and len(image_size) == 2:
image_width, image_height = image_size
elif isinstance(image_size, int):
image_width = image_height = image_size
else:
raise ValueError(f"Image size should be int or list/tuple of int not {image_size}")
while pil_image.size[1] >= 2 * image_height:
pil_image = pil_image.resize(
tuple(x // 2 for x in pil_image.size), resample=Image.BOX
)
scale = image_height / pil_image.size[1]
pil_image = pil_image.resize(tuple(round(x * scale) for x in pil_image.size),resample=Image.BICUBIC)
# shrink
if pil_image.size[0] > image_width:
pil_image = pil_image.resize((image_width, image_height),resample=Image.BICUBIC)
# padding
if pil_image.size[0] < image_width:
img = Image.new(mode="RGB",size=(image_width,image_height), color="white")
width, _ = pil_image.size
img.paste(pil_image,((image_width - width)//2, 0))
pil_image = img
return pil_image
def render_text_image_custom(image_size, bboxes, rendered_txt_values, num_rows_values, align = "center"):
# aligns = ["center", "left", "right"]
"""Render text image based on the list of bbox called `bboxes`.
Support font that can be choosed.
"""
print(image_size, bboxes, rendered_txt_values, num_rows_values, align)
background = Image.new("RGB", image_size, "white")
font = ImageFont.truetype("calibri.ttf", encoding='utf-8', size=512)
for text, bbox, num_rows in zip(rendered_txt_values, bboxes, num_rows_values):
if len(text) == 0:
continue
text = text.strip()
if num_rows != 1:
word_tokens = text.split()
num_tokens = len(word_tokens)
index_list = range(1, num_tokens + 1)
if num_tokens > num_rows:
index_list = random.sample(index_list, num_rows)
index_list.sort()
line_list = []
start_idx = 0
for index in index_list:
line_list.append(
" ".join(word_tokens
[start_idx: index]
)
)
start_idx = index
text = "\n".join(line_list)
if 'ratio' not in bbox or bbox['ratio'] == 0 or bbox['ratio'] < 1e-4:
image4ratio = Image.new("RGB", (512, 512), "white")
draw = ImageDraw.Draw(image4ratio)
_, _ , w, h = draw.textbbox(xy=(0,0),text = text, font=font)
ratio = w / h
else:
ratio = bbox['ratio']
width = int(bbox['width'] * image_size[1])
height = int(width / ratio)
top_left_x = int(bbox['top_left_x'] * image_size[0])
top_left_y = int(bbox['top_left_y'] * image_size[1])
yaw = bbox['yaw']
text_image = Image.new("RGB", (512, 512), "white")
draw = ImageDraw.Draw(text_image)
x,y,w,h = draw.textbbox(xy=(0,0),text = text, font=font)
text_image = Image.new("RGB", (w, h), "white")
draw = ImageDraw.Draw(text_image)
draw.text((-x/2,-y/2), text, "black", font=font, align=align)
text_image = resize_and_pad_image(text_image, (width, height))
text_image = text_image.rotate(angle=-yaw, expand=True, fillcolor="white")
# image = Image.new("RGB", (w, h), "white")
# draw = ImageDraw.Draw(image)
background.paste(text_image, (top_left_x, top_left_y))
return background