draw_bbox.py 3.21 KB
Newer Older
1
from magic_pdf.libs.commons import fitz  # PyMuPDF
赵小蒙's avatar
赵小蒙 committed
2

赵小蒙's avatar
赵小蒙 committed
3
def draw_bbox_without_number(i, bbox_list, page, rgb_config):
4
5
6
7
8
9
10
    new_rgb = []
    for item in rgb_config:
        item = float(item) / 255
        new_rgb.append(item)
    page_data = bbox_list[i]
    for bbox in page_data:
        x0, y0, x1, y1 = bbox
赵小蒙's avatar
赵小蒙 committed
11
        rect_coords = fitz.Rect(x0, y0, x1, y1)  # Define the rectangle
12
        page.draw_rect(rect_coords, color=new_rgb, fill=None, width=0.5, overlay=True)  # Draw the rectangle
赵小蒙's avatar
赵小蒙 committed
13

14

赵小蒙's avatar
赵小蒙 committed
15
16
17
18
19
20
21
22
23
24
25
26
27
def draw_bbox_with_number(i, bbox_list, page, rgb_config):
    new_rgb = []
    for item in rgb_config:
        item = float(item) / 255
        new_rgb.append(item)
    page_data = bbox_list[i]
    for j, bbox in enumerate(page_data):
        x0, y0, x1, y1 = bbox
        rect_coords = fitz.Rect(x0, y0, x1, y1)  # Define the rectangle
        page.draw_rect(rect_coords, color=new_rgb, fill=None, width=0.5, overlay=True)  # Draw the rectangle
        page.insert_text((x0, y0), str(j + 1), fontsize=10, color=new_rgb)  # Insert the index at the top left corner of the rectangle


28
29
def draw_layout_bbox(pdf_info_dict, input_path, out_path):
    layout_bbox_list = []
赵小蒙's avatar
赵小蒙 committed
30
    dropped_bbox_list = []
31
    for page in pdf_info_dict.values():
赵小蒙's avatar
赵小蒙 committed
32
33
        page_layout_list = []
        page_dropped_list = []
34
        for layout in page['layout_bboxes']:
赵小蒙's avatar
赵小蒙 committed
35
36
37
38
39
40
            page_layout_list.append(layout['layout_bbox'])
        layout_bbox_list.append(page_layout_list)
        for drop_tag, dropped_bboxes in page['dropped_bboxes'].items():
            for dropped_bbox in dropped_bboxes:
                page_dropped_list.append(dropped_bbox)
        dropped_bbox_list.append(page_dropped_list)
41
42
43

    doc = fitz.open(input_path)
    for i, page in enumerate(doc):
赵小蒙's avatar
赵小蒙 committed
44
        draw_bbox_with_number(i, layout_bbox_list, page, [255, 0, 0])
赵小蒙's avatar
赵小蒙 committed
45
        draw_bbox_without_number(i, dropped_bbox_list, page, [0, 255, 0])
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
    # Save the PDF
    doc.save(f"{out_path}/layout.pdf")

def draw_text_bbox(pdf_info_dict, input_path, out_path):
    text_list = []
    inline_equation_list = []
    displayed_equation_list = []
    for page in pdf_info_dict.values():
        page_text_list = []
        page_inline_equation_list = []
        page_displayed_equation_list = []
        for block in page['preproc_blocks']:
            for line in block['lines']:
                for span in line['spans']:
                    if span['type'] == 'text':
                        page_text_list.append(span['bbox'])
                    elif span['type'] == 'inline_equation':
                        page_inline_equation_list.append(span['bbox'])
                    elif span['type'] == 'displayed_equation':
                        page_displayed_equation_list.append(span['bbox'])
        text_list.append(page_text_list)
        inline_equation_list.append(page_inline_equation_list)
        displayed_equation_list.append(page_displayed_equation_list)

    doc = fitz.open(input_path)
    for i, page in enumerate(doc):
        # 获取当前页面的数据
赵小蒙's avatar
赵小蒙 committed
73
74
75
        draw_bbox_without_number(i, text_list, page, [255, 0, 0])
        draw_bbox_without_number(i, inline_equation_list, page, [0, 255, 0])
        draw_bbox_without_number(i, displayed_equation_list, page, [0, 0, 255])
76
77
78

    # Save the PDF
    doc.save(f"{out_path}/text.pdf")