draw_bbox.py 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778
  1. from magic_pdf.libs.commons import fitz # PyMuPDF
  2. from magic_pdf.libs.ocr_content_type import ContentType
  3. def draw_bbox_without_number(i, bbox_list, page, rgb_config):
  4. new_rgb = []
  5. for item in rgb_config:
  6. item = float(item) / 255
  7. new_rgb.append(item)
  8. page_data = bbox_list[i]
  9. for bbox in page_data:
  10. x0, y0, x1, y1 = bbox
  11. rect_coords = fitz.Rect(x0, y0, x1, y1) # Define the rectangle
  12. page.draw_rect(rect_coords, color=new_rgb, fill=None, width=0.5, overlay=True) # Draw the rectangle
  13. def draw_bbox_with_number(i, bbox_list, page, rgb_config):
  14. new_rgb = []
  15. for item in rgb_config:
  16. item = float(item) / 255
  17. new_rgb.append(item)
  18. page_data = bbox_list[i]
  19. for j, bbox in enumerate(page_data):
  20. x0, y0, x1, y1 = bbox
  21. rect_coords = fitz.Rect(x0, y0, x1, y1) # Define the rectangle
  22. page.draw_rect(rect_coords, color=new_rgb, fill=None, width=0.5, overlay=True) # Draw the rectangle
  23. page.insert_text((x0, y0), str(j + 1), fontsize=10, color=new_rgb) # Insert the index at the top left corner of the rectangle
  24. def draw_layout_bbox(pdf_info_dict, pdf_bytes, out_path):
  25. layout_bbox_list = []
  26. dropped_bbox_list = []
  27. for page in pdf_info_dict.values():
  28. page_layout_list = []
  29. page_dropped_list = []
  30. for layout in page['layout_bboxes']:
  31. page_layout_list.append(layout['layout_bbox'])
  32. layout_bbox_list.append(page_layout_list)
  33. for drop_tag, dropped_bboxes in page['droped_bboxes'].items():
  34. for dropped_bbox in dropped_bboxes:
  35. page_dropped_list.append(dropped_bbox)
  36. dropped_bbox_list.append(page_dropped_list)
  37. pdf_docs = fitz.open("pdf", pdf_bytes)
  38. for i, page in enumerate(pdf_docs):
  39. draw_bbox_with_number(i, layout_bbox_list, page, [255, 0, 0])
  40. draw_bbox_without_number(i, dropped_bbox_list, page, [0, 255, 0])
  41. # Save the PDF
  42. pdf_docs.save(f"{out_path}/layout.pdf")
  43. def draw_text_bbox(pdf_info_dict, pdf_bytes, out_path):
  44. text_list = []
  45. inline_equation_list = []
  46. interline_equation_list = []
  47. for page in pdf_info_dict.values():
  48. page_text_list = []
  49. page_inline_equation_list = []
  50. page_interline_equation_list = []
  51. for block in page['preproc_blocks']:
  52. for line in block['lines']:
  53. for span in line['spans']:
  54. if span['type'] == ContentType.Text:
  55. page_text_list.append(span['bbox'])
  56. elif span['type'] == ContentType.InlineEquation:
  57. page_inline_equation_list.append(span['bbox'])
  58. elif span['type'] == ContentType.InterlineEquation:
  59. page_interline_equation_list.append(span['bbox'])
  60. text_list.append(page_text_list)
  61. inline_equation_list.append(page_inline_equation_list)
  62. interline_equation_list.append(page_interline_equation_list)
  63. pdf_docs = fitz.open("pdf", pdf_bytes)
  64. for i, page in enumerate(pdf_docs):
  65. # 获取当前页面的数据
  66. draw_bbox_without_number(i, text_list, page, [255, 0, 0])
  67. draw_bbox_without_number(i, inline_equation_list, page, [0, 255, 0])
  68. draw_bbox_without_number(i, interline_equation_list, page, [0, 0, 255])
  69. # Save the PDF
  70. pdf_docs.save(f"{out_path}/text.pdf")