topk.py 3.2 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586
  1. # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. import PIL
  15. from PIL import ImageDraw, ImageFont
  16. import numpy as np
  17. from ...utils.fonts import PINGFANG_FONT_FILE_PATH
  18. from ..utils.color_map import get_colormap
  19. from .base import BaseResult
  20. class TopkResult(BaseResult):
  21. def __init__(self, data):
  22. super().__init__(data)
  23. self._img_reader.set_backend("pillow")
  24. self._img_writer.set_backend("pillow")
  25. def _get_res_img(self):
  26. """Draw label on image"""
  27. labels = self.get("label_names", self["class_ids"])
  28. label_str = f"{labels[0]} {self['scores'][0]:.2f}"
  29. image = self._img_reader.read(self["img_path"])
  30. image = image.convert("RGB")
  31. image_size = image.size
  32. draw = ImageDraw.Draw(image)
  33. min_font_size = int(image_size[0] * 0.02)
  34. max_font_size = int(image_size[0] * 0.05)
  35. for font_size in range(max_font_size, min_font_size - 1, -1):
  36. font = ImageFont.truetype(
  37. PINGFANG_FONT_FILE_PATH, font_size, encoding="utf-8"
  38. )
  39. if tuple(map(int, PIL.__version__.split("."))) <= (10, 0, 0):
  40. text_width_tmp, text_height_tmp = draw.textsize(label_str, font)
  41. else:
  42. left, top, right, bottom = draw.textbbox((0, 0), label_str, font)
  43. text_width_tmp, text_height_tmp = right - left, bottom - top
  44. if text_width_tmp <= image_size[0]:
  45. break
  46. else:
  47. font = ImageFont.truetype(PINGFANG_FONT_FILE_PATH, min_font_size)
  48. color_list = get_colormap(rgb=True)
  49. color = tuple(color_list[0])
  50. font_color = tuple(self._get_font_colormap(3))
  51. if tuple(map(int, PIL.__version__.split("."))) <= (10, 0, 0):
  52. text_width, text_height = draw.textsize(label_str, font)
  53. else:
  54. left, top, right, bottom = draw.textbbox((0, 0), label_str, font)
  55. text_width, text_height = right - left, bottom - top
  56. rect_left = 3
  57. rect_top = 3
  58. rect_right = rect_left + text_width + 3
  59. rect_bottom = rect_top + text_height + 6
  60. draw.rectangle([(rect_left, rect_top), (rect_right, rect_bottom)], fill=color)
  61. text_x = rect_left + 3
  62. text_y = rect_top
  63. draw.text((text_x, text_y), label_str, fill=font_color, font=font)
  64. return image
  65. def _get_font_colormap(self, color_index):
  66. """
  67. Get font colormap
  68. """
  69. dark = np.array([0x14, 0x0E, 0x35])
  70. light = np.array([0xFF, 0xFF, 0xFF])
  71. light_indexs = [0, 3, 4, 8, 9, 13, 14, 18, 19]
  72. if color_index in light_indexs:
  73. return light.astype("int32")
  74. else:
  75. return dark.astype("int32")