| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778 |
- # copyright (c) 2024 PaddlePaddle Authors. All Rights Reserve.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import math
- import random
- from pathlib import Path
- import numpy as np
- import cv2
- import PIL
- from PIL import Image, ImageDraw, ImageFont
- from ....utils.fonts import PINGFANG_FONT_FILE_PATH, create_font
- from ...common.result import BaseCVResult
- class DocPreprocessorResult(BaseCVResult):
- """doc preprocessor result"""
- def save_to_img(self, save_path: str, *args, **kwargs) -> None:
- """
- Save the image to the specified path.
- Args:
- save_path (str): The path to save the image.
- If the path does not end with '.jpg' or '.png', it appends '_res_doc_preprocess_<img_id>.jpg'
- to the path where <img_id> is retrieved from the object's 'img_id' attribute.
- *args: Variable length argument list.
- **kwargs: Arbitrary keyword arguments.
- Returns:
- None
- """
- if not str(save_path).lower().endswith((".jpg", ".png")):
- img_id = self["img_id"]
- save_path = Path(save_path) / f"res_doc_preprocess_{img_id}.jpg"
- super().save_to_img(save_path, *args, **kwargs)
- def _to_img(self) -> PIL.Image:
- """
- Generate an image combining the original, rotated, and unwarping images.
- Returns:
- PIL.Image: A new image that displays the original, rotated, and unwarping images side by side.
- """
- image = self["input_image"][:, :, ::-1]
- angle = self["angle"]
- rot_img = self["rot_img"][:, :, ::-1]
- output_img = self["output_img"][:, :, ::-1]
- h1, w1 = image.shape[0:2]
- h2, w2 = rot_img.shape[0:2]
- h3, w3 = output_img.shape[0:2]
- h = max(max(h1, h2), h3)
- img_show = Image.new("RGB", (w1 + w2 + w3, h + 25), (255, 255, 255))
- img_show.paste(Image.fromarray(image), (0, 0, w1, h1))
- img_show.paste(Image.fromarray(rot_img), (w1, 0, w1 + w2, h2))
- img_show.paste(Image.fromarray(output_img), (w1 + w2, 0, w1 + w2 + w3, h3))
- draw_text = ImageDraw.Draw(img_show)
- txt_list = ["Original Image", "Rotated Image", "Unwarping Image"]
- region_w_list = [w1, w2, w3]
- beg_w_list = [0, w1, w1 + w2]
- for tno in range(len(txt_list)):
- txt = txt_list[tno]
- font = create_font(txt, (region_w_list[tno], 20), PINGFANG_FONT_FILE_PATH)
- draw_text.text(
- [10 + beg_w_list[tno], h + 2], txt, fill=(0, 0, 0), font=font
- )
- return img_show
|