| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223 |
- # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import numpy as np
- import PIL
- from PIL import Image, ImageDraw, ImageFont
- from ......utils import logging
- from ......utils.deps import function_requires_deps, is_dep_available
- from ......utils.fonts import PINGFANG_FONT
- if is_dep_available("pycocotools"):
- from pycocotools.coco import COCO
def colormap(rgb=False):
    """
    Build the fixed 20-color palette used when drawing annotations.

    Per the original authors, this helper is adapted from Detectron's
    ``detectron/utils/colormap.py``
    (https://github.com/facebookresearch/Detectron).

    Args:
        rgb: If true, every row is ordered (R, G, B). Otherwise the channel
            order of every row is reversed, giving (B, G, R).

    Returns:
        An ``int32`` numpy array of shape ``(20, 3)`` with values in 0..255.
    """
    # One (R, G, B) triple per palette entry.
    palette = np.array(
        [
            (0xFF, 0x00, 0x00),
            (0xCC, 0xFF, 0x00),
            (0x00, 0xFF, 0x66),
            (0x00, 0x66, 0xFF),
            (0xCC, 0x00, 0xFF),
            (0xFF, 0x4D, 0x00),
            (0x80, 0xFF, 0x00),
            (0x00, 0xFF, 0xB2),
            (0x00, 0x1A, 0xFF),
            (0xFF, 0x00, 0xE5),
            (0xFF, 0x99, 0x00),
            (0x33, 0xFF, 0x00),
            (0x00, 0xFF, 0xFF),
            (0x33, 0x00, 0xFF),
            (0xFF, 0x00, 0x99),
            (0xFF, 0xE5, 0x00),
            (0x00, 0xFF, 0x1A),
            (0x00, 0xB2, 0xFF),
            (0x80, 0x00, 0xFF),
            (0xFF, 0x00, 0x4D),
        ],
        dtype=np.float32,
    )
    # A step of -1 flips the channel axis (RGB -> BGR); +1 leaves it alone.
    channel_step = 1 if rgb else -1
    return palette[:, ::channel_step].astype("int32")
def font_colormap(color_index):
    """
    Select the label text color that goes with a palette entry.

    Args:
        color_index: Index of the background color inside the palette.

    Returns:
        An ``int32`` numpy array with three channel values: white
        (255, 255, 255) when ``color_index`` is one of the listed indexes,
        otherwise the dark color (20, 14, 53).
    """
    # Palette indexes that get white text (presumably the darker backgrounds).
    white_text_indexes = (0, 3, 4, 8, 9, 13, 14, 18, 19)
    channels = (
        [0xFF, 0xFF, 0xFF]
        if color_index in white_text_indexes
        else [0x14, 0x0E, 0x35]
    )
    return np.array(channels).astype("int32")
@function_requires_deps("pycocotools")
def draw_bbox(image, coco_info: "COCO", img_id):
    """
    Draw the bounding boxes and category labels of one COCO image.

    Categories are colored by frequency: the most common category on the image
    gets the first palette color, the next one the second, and so on (wrapping
    around when there are more categories than palette entries).

    Args:
        image: PIL image to annotate. It is converted to RGB before drawing.
        coco_info: Loaded COCO dataset object providing ``loadImgs``,
            ``getAnnIds``, ``loadAnns`` and ``loadCats``.
        img_id: Id of the image inside ``coco_info``.

    Returns:
        The RGB PIL image with boxes and labels drawn on it.

    Notes:
        A ``bbox`` with 4 values is read as ``[xmin, ymin, w, h]``; one with 8
        values is read as four corner points ``[x1, y1, ..., x4, y4]``.
        Annotations with any other bbox length are logged and skipped.
    """
    # Scale the font with the recorded image width; fall back to a fixed size
    # when the image record is missing or malformed (best effort).
    try:
        image_info = coco_info.loadImgs(img_id)[0]
        font_size = int(0.024 * int(image_info["width"])) + 2
    except Exception:
        font_size = 12
    font = ImageFont.truetype(PINGFANG_FONT.path, font_size, encoding="utf-8")

    image = image.convert("RGB")
    draw = ImageDraw.Draw(image)
    width = int(max(image.size) * 0.005)

    # `ImageDraw.textsize` was removed in Pillow 10.0.0. Detect the method
    # instead of parsing `PIL.__version__`, which mis-handled 10.0.0 itself and
    # fails on suffixed versions such as "10.1.0.dev0".
    has_textsize = hasattr(draw, "textsize")

    color_list = colormap(rgb=True)
    annotations = coco_info.loadAnns(coco_info.getAnnIds(imgIds=img_id))

    # Count how many annotations each category has on this image.
    catid_num_dict = {}
    for ann in annotations:
        catid = ann["category_id"]
        catid_num_dict[catid] = catid_num_dict.get(catid, 0) + 1

    # Assign colors in descending frequency order. Values are converted to
    # plain Python ints so PIL receives ordinary integer tuples.
    catid2color = {}
    catid2fontcolor = {}
    ranked = sorted(catid_num_dict.items(), key=lambda x: x[1], reverse=True)
    for i, (catid, _) in enumerate(ranked):
        color_index = i % len(color_list)
        catid2color[catid] = tuple(int(c) for c in color_list[color_index])
        catid2fontcolor[catid] = tuple(int(c) for c in font_colormap(color_index))

    for ann in annotations:
        catid, bbox = ann["category_id"], ann["bbox"]
        color = catid2color[catid]
        font_color = catid2fontcolor[catid]

        if len(bbox) == 4:
            # Axis-aligned box given as top-left corner plus size.
            xmin, ymin, w, h = bbox
            xmax = xmin + w
            ymax = ymin + h
            draw.line(
                [(xmin, ymin), (xmin, ymax), (xmax, ymax), (xmax, ymin), (xmin, ymin)],
                width=width,
                fill=color,
            )
        elif len(bbox) == 8:
            # Quadrilateral given as four corner points.
            x1, y1, x2, y2, x3, y3, x4, y4 = bbox
            draw.line(
                [(x1, y1), (x2, y2), (x3, y3), (x4, y4), (x1, y1)],
                width=width,
                fill=color,
            )
            xmin = min(x1, x2, x3, x4)
            ymin = min(y1, y2, y3, y4)
        else:
            logging.info("Error: The shape of bbox must be [M, 4] or [M, 8]!")
            # No usable anchor point exists for the label, so skip it rather
            # than reuse coordinates left over from a previous annotation.
            continue

        # Draw the label on a filled background anchored at the box corner.
        label = coco_info.loadCats(catid)[0]["name"]
        text = str(label)
        if has_textsize:
            tw, th = draw.textsize(text, font=font)
        else:
            left, top, right, bottom = draw.textbbox((0, 0), text, font)
            tw, th = right - left, bottom - top

        if ymin < th:
            # Not enough room above the box: place the label inside it.
            draw.rectangle([(xmin, ymin), (xmin + tw + 4, ymin + th + 1)], fill=color)
            draw.text((xmin + 2, ymin - 2), text, fill=font_color, font=font)
        else:
            draw.rectangle([(xmin, ymin - th), (xmin + tw + 4, ymin + 1)], fill=color)
            draw.text((xmin + 2, ymin - th - 2), text, fill=font_color, font=font)

    return image
@function_requires_deps("pycocotools")
def draw_mask(image, coco_info: "COCO", img_id):
    """
    Blend the segmentation masks of one COCO image onto the image.

    Each annotation that has a segmentation gets the next palette color
    (lightened towards white) and is alpha-blended over the pixels it covers.

    Args:
        image: Image to annotate. A PIL image is converted to RGB first so the
            blending always operates on three channels.
        coco_info: Loaded COCO dataset object providing ``getAnnIds`` and
            ``loadAnns``.
        img_id: Id of the image inside ``coco_info``.

    Returns:
        A new PIL image (``uint8``) with the masks blended in.
    """
    # Imported lazily because pycocotools is an optional dependency.
    import pycocotools.mask as mask_util

    w_ratio = 0.4  # how far each palette color is pulled towards white
    alpha = 0.6  # opacity of the mask color over the image

    if isinstance(image, Image.Image):
        # Grayscale/palette/RGBA inputs would break the 3-channel blending.
        image = image.convert("RGB")
    img_array = np.array(image).astype("float32")
    h, w = img_array.shape[:2]

    # Lighten the whole palette once into a separate array. Doing this on a
    # view of the palette inside the loop would lighten a color again every
    # time its index is reused (i.e. with more masks than palette entries).
    mask_colors = (colormap(rgb=True) * (1 - w_ratio) + w_ratio * 255).astype(
        "int32"
    )

    mask_color_id = 0
    annotations = coco_info.loadAnns(coco_info.getAnnIds(imgIds=img_id))
    for ann in annotations:
        segm = ann.get("segmentation")
        if not segm:
            continue

        # Same dispatch as pycocotools' COCO.annToRLE: polygon lists are
        # rasterized and merged, uncompressed RLE dicts are compressed, and
        # compressed RLE dicts are used as they are.
        if isinstance(segm, list):
            rle = mask_util.merge(mask_util.frPyObjects(segm, h, w))
        elif isinstance(segm["counts"], list):
            rle = mask_util.frPyObjects(segm, h, w)
        else:
            rle = segm
        mask = mask_util.decode(rle)

        color_mask = mask_colors[mask_color_id % len(mask_colors)]
        mask_color_id += 1

        rows, cols = np.nonzero(mask)
        img_array[rows, cols, :] *= 1.0 - alpha
        img_array[rows, cols, :] += alpha * color_mask

    return Image.fromarray(img_array.astype("uint8"))
|