| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108 |
- # copyright (c) 2024 PaddlePaddle Authors. All Rights Reserve.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import cv2
- import numpy as np
- from pathlib import Path
- import PIL
- from PIL import Image, ImageDraw, ImageFont
- from ...common.result import BaseResult, BaseCVResult, HtmlMixin, XlsxMixin
class TableRecResult(BaseCVResult):
    """Table recognition result that can draw its boxes on the input image.

    The visualisation reads two entries of the result: ``"input_img"`` (the
    image to draw on) and ``"bbox"`` (the boxes to draw).
    """

    def __init__(self, data):
        """Forward ``data`` unchanged to the base result constructor."""
        super().__init__(data)

    def _to_img(self):
        """Return a copy of the input image with every box drawn on it.

        Boxes made of exactly four values are drawn as axis-aligned
        rectangles; any other layout is handed to :meth:`draw_bbox`, which
        interprets each box as a flat sequence of polygon vertices.
        """
        image = self["input_img"]
        bbox_res = self["bbox"]
        # Only the first box is inspected: all boxes are assumed to share
        # the same layout.
        if len(bbox_res) > 0 and len(bbox_res[0]) == 4:
            return self.draw_rectangle(image, bbox_res)
        return self.draw_bbox(image, bbox_res)

    def draw_rectangle(self, image, boxes):
        """Draw ``(x1, y1, x2, y2)`` boxes on a copy of ``image``.

        Args:
            image: Image exposing ``copy()``; it is never modified.
            boxes: Sequence of four-value boxes; values are truncated to int.

        Returns:
            The copy of ``image`` with one rectangle per box, drawn with
            colour ``(255, 0, 0)`` and thickness 2.
        """
        img_show = image.copy()
        # ``tolist()`` yields plain Python ints, so OpenCV never has to
        # parse NumPy scalar types as point coordinates.
        for x1, y1, x2, y2 in np.array(boxes).astype(int).tolist():
            cv2.rectangle(img_show, (x1, y1), (x2, y2), (255, 0, 0), 2)
        return img_show

    def draw_bbox(self, image, boxes):
        """Draw closed polygons on a copy of ``image``.

        Args:
            image: Anything ``np.array`` can convert; it is never modified.
            boxes: Iterable of boxes, each reshaped to ``(-1, 1, 2)`` and
                therefore read as a sequence of ``(x, y)`` vertices.

        Returns:
            A new ``numpy.ndarray`` with one closed polyline per box, drawn
            with colour ``(255, 0, 0)`` and thickness 2. An array copy is
            returned even when ``boxes`` is empty.
        """
        # Copy once up front instead of once per box: the caller's image
        # stays untouched and the per-box cost no longer includes a full
        # image copy.
        canvas = np.array(image)
        for box in boxes:
            points = np.reshape(np.array(box), [-1, 1, 2]).astype(np.int64)
            canvas = cv2.polylines(canvas, [points], True, (255, 0, 0), 2)
        return canvas
class StructureTableResult(TableRecResult, HtmlMixin, XlsxMixin):
    """Table recognition result that also carries the HTML/XLSX mixins."""

    def __init__(self, data):
        """Initialise the result with ``data``, then each export mixin."""
        super().__init__(data)
        # The mixins are initialised explicitly, in the same order as before:
        # HTML first, then XLSX.
        for mixin in (HtmlMixin, XlsxMixin):
            mixin.__init__(self)

    def _to_html(self):
        """Return the value stored under the ``"html"`` key of this result."""
        html = self["html"]
        return html
class TableResult(BaseCVResult, HtmlMixin, XlsxMixin):
    """Aggregate result that delegates saving to the results it contains.

    The save methods read ``"table_result"`` (an iterable of per-table
    results), ``"layout_result"``, ``"ocr_result"`` and ``"input_path"``
    from this result.
    """

    def __init__(self, data):
        """Initialise the result with ``data``, then each export mixin."""
        super().__init__(data)
        HtmlMixin.__init__(self)
        XlsxMixin.__init__(self)

    def _resolve_save_prefix(self, save_path, suffixes):
        """Turn ``save_path`` into an extension-less output prefix.

        Args:
            save_path: ``str`` or ``pathlib.Path`` naming either an output
                file or an output directory.
            suffixes: Tuple of lower-case file suffixes (leading dot
                included) that mark ``save_path`` as a file.

        Returns:
            A ``pathlib.Path``: ``save_path`` without its suffix when it
            names a file, otherwise ``save_path / <stem of input_path>``.
        """
        target = str(save_path)  # accept Path objects as well as strings
        if target.lower().endswith(suffixes):
            # Strip only the extension. ``Path.stem`` would also discard
            # the parent directory and redirect output to the current
            # working directory.
            return Path(target).with_suffix("")
        return Path(target) / Path(self["input_path"]).stem

    def save_to_html(self, save_path):
        """Ask every table result to save itself as HTML.

        Args:
            save_path: A path ending in ``.html`` (case-insensitive), or a
                directory under which the input file's stem is used.
        """
        prefix = self._resolve_save_prefix(save_path, (".html",))
        # NOTE(review): every table result receives the same prefix; whether
        # their outputs collide depends on the sub-result implementation -
        # confirm.
        for table_result in self["table_result"]:
            table_result.save_to_html(prefix)

    def save_to_xlsx(self, save_path):
        """Ask every table result to save itself as XLSX.

        Args:
            save_path: A path ending in ``.xlsx`` (case-insensitive), or a
                directory under which the input file's stem is used.
        """
        prefix = self._resolve_save_prefix(save_path, (".xlsx",))
        # NOTE(review): same shared-prefix caveat as in save_to_html.
        for table_result in self["table_result"]:
            table_result.save_to_xlsx(prefix)

    def save_to_img(self, save_path):
        """Save the layout, OCR and per-table visualisations as JPEG files.

        The outputs are named ``<prefix>_layout.jpg``, ``<prefix>_ocr.jpg``
        and ``<prefix>_table_<idx>.jpg``.

        Args:
            save_path: A path ending in ``.jpg`` or ``.png``
                (case-insensitive), or a directory under which the input
                file's stem is used.
        """
        prefix = self._resolve_save_prefix(save_path, (".jpg", ".png"))
        self["layout_result"].save_to_img(f"{prefix}_layout.jpg")
        self["ocr_result"].save_to_img(f"{prefix}_ocr.jpg")
        for idx, table_result in enumerate(self["table_result"]):
            table_result.save_to_img(f"{prefix}_table_{idx}.jpg")
|