| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116 |
- from magic_pdf.libs.commons import fitz # PyMuPDF
- from magic_pdf.libs.ocr_content_type import ContentType, BlockType
- def draw_bbox_without_number(i, bbox_list, page, rgb_config, fill_config):
- new_rgb = []
- for item in rgb_config:
- item = float(item) / 255
- new_rgb.append(item)
- page_data = bbox_list[i]
- for bbox in page_data:
- x0, y0, x1, y1 = bbox
- rect_coords = fitz.Rect(x0, y0, x1, y1) # Define the rectangle
- if fill_config:
- page.draw_rect(rect_coords, color=None, fill=new_rgb, fill_opacity=0.3, width=0.5, overlay=True) # Draw the rectangle
- else:
- page.draw_rect(rect_coords, color=new_rgb, fill=None, fill_opacity=1, width=0.5, overlay=True) # Draw the rectangle
- def draw_bbox_with_number(i, bbox_list, page, rgb_config, fill_config):
- new_rgb = []
- for item in rgb_config:
- item = float(item) / 255
- new_rgb.append(item)
- page_data = bbox_list[i]
- for j, bbox in enumerate(page_data):
- x0, y0, x1, y1 = bbox
- rect_coords = fitz.Rect(x0, y0, x1, y1) # Define the rectangle
- if fill_config:
- page.draw_rect(rect_coords, color=None, fill=new_rgb, fill_opacity=0.3, width=0.5, overlay=True) # Draw the rectangle
- else:
- page.draw_rect(rect_coords, color=new_rgb, fill=None, fill_opacity=1, width=0.5, overlay=True) # Draw the rectangle
- page.insert_text((x0, y0+10), str(j + 1), fontsize=10, color=new_rgb) # Insert the index at the top left corner of the rectangle
- def draw_layout_bbox(pdf_info, pdf_bytes, out_path):
- layout_bbox_list = []
- blocks_bbox_list = []
- dropped_bbox_list = []
- for page in pdf_info:
- page_layout_list = []
- page_dropped_list = []
- page_blocks_bbox_list = []
- for layout in page['layout_bboxes']:
- page_layout_list.append(layout['layout_bbox'])
- layout_bbox_list.append(page_layout_list)
- for dropped_bbox in page['discarded_blocks']:
- page_dropped_list.append(dropped_bbox['bbox'])
- dropped_bbox_list.append(page_dropped_list)
- for block in page['para_blocks']:
- page_blocks_bbox_list.append(block['bbox'])
- blocks_bbox_list.append(page_blocks_bbox_list)
- pdf_docs = fitz.open("pdf", pdf_bytes)
- for i, page in enumerate(pdf_docs):
- draw_bbox_with_number(i, layout_bbox_list, page, [255, 0, 0], False)
- draw_bbox_without_number(i, dropped_bbox_list, page, [0, 255, 0], True)
- draw_bbox_without_number(i, blocks_bbox_list, page, [0, 0, 255], True)
- # Save the PDF
- pdf_docs.save(f"{out_path}/layout.pdf")
- def draw_span_bbox(pdf_info, pdf_bytes, out_path):
- text_list = []
- inline_equation_list = []
- interline_equation_list = []
- image_list = []
- table_list = []
- for page in pdf_info:
- page_text_list = []
- page_inline_equation_list = []
- page_interline_equation_list = []
- page_image_list = []
- page_table_list = []
- for block in page['para_blocks']:
- if block['type'] in [BlockType.Text, BlockType.Title, BlockType.InterlineEquation]:
- for line in block['lines']:
- for span in line['spans']:
- if span['type'] == ContentType.Text:
- page_text_list.append(span['bbox'])
- elif span['type'] == ContentType.InlineEquation:
- page_inline_equation_list.append(span['bbox'])
- elif span['type'] == ContentType.InterlineEquation:
- page_interline_equation_list.append(span['bbox'])
- elif span['type'] == ContentType.Image:
- page_image_list.append(span['bbox'])
- elif span['type'] == ContentType.Table:
- page_table_list.append(span['bbox'])
- elif block['type'] in [BlockType.Image, BlockType.Table]:
- for sub_block in block["blocks"]:
- for line in sub_block['lines']:
- for span in line['spans']:
- if span['type'] == ContentType.Text:
- page_text_list.append(span['bbox'])
- elif span['type'] == ContentType.InlineEquation:
- page_inline_equation_list.append(span['bbox'])
- elif span['type'] == ContentType.InterlineEquation:
- page_interline_equation_list.append(span['bbox'])
- elif span['type'] == ContentType.Image:
- page_image_list.append(span['bbox'])
- elif span['type'] == ContentType.Table:
- page_table_list.append(span['bbox'])
- text_list.append(page_text_list)
- inline_equation_list.append(page_inline_equation_list)
- interline_equation_list.append(page_interline_equation_list)
- image_list.append(page_image_list)
- table_list.append(page_table_list)
- pdf_docs = fitz.open("pdf", pdf_bytes)
- for i, page in enumerate(pdf_docs):
- # 获取当前页面的数据
- draw_bbox_without_number(i, text_list, page, [255, 0, 0], False)
- draw_bbox_without_number(i, inline_equation_list, page, [0, 255, 0], False)
- draw_bbox_without_number(i, interline_equation_list, page, [0, 0, 255], False)
- draw_bbox_without_number(i, image_list, page, [255, 204, 0], False)
- draw_bbox_without_number(i, table_list, page, [204, 0, 255], False)
- # Save the PDF
- pdf_docs.save(f"{out_path}/spans.pdf")
|