"src/targets/vscode:/vscode.git/clone" did not exist on "602924d4fef24fee79a861e229e40e90bbd1fcd4"
pdf_parse_by_txt.py 540 Bytes
Newer Older
1
from magic_pdf.pdf_parse_union_core_v2 import pdf_parse_union
赵小蒙's avatar
赵小蒙 committed
2

赵小蒙's avatar
赵小蒙 committed
3
4
5
6
7
8
9
10
11

def parse_pdf_by_txt(
    pdf_bytes,
    model_list,
    imageWriter,
    start_page_id=0,
    end_page_id=None,
    debug_mode=False,
):
    """Delegate to ``pdf_parse_union`` with ``"txt"`` as its fourth argument.

    This is a thin wrapper: every argument is forwarded unchanged and the
    literal string ``"txt"`` is inserted after ``imageWriter``.

    Args:
        pdf_bytes: Forwarded as the first positional argument.
        model_list: Forwarded as the second positional argument.
        imageWriter: Forwarded as the third positional argument.
        start_page_id: Forwarded by keyword; defaults to ``0``.
        end_page_id: Forwarded by keyword; defaults to ``None``.
        debug_mode: Forwarded by keyword; defaults to ``False``.

    Returns:
        Whatever ``pdf_parse_union`` returns for these arguments.
    """
    # Options passed through by keyword, exactly as the caller supplied them.
    forwarded_options = {
        "start_page_id": start_page_id,
        "end_page_id": end_page_id,
        "debug_mode": debug_mode,
    }
    return pdf_parse_union(
        pdf_bytes, model_list, imageWriter, "txt", **forwarded_options
    )