Commit d5dbed73 authored by 赵小蒙
Browse files

目录重构

parent 7c7910e4
...@@ -10,7 +10,7 @@ import spacy ...@@ -10,7 +10,7 @@ import spacy
import en_core_web_sm import en_core_web_sm
import zh_core_web_sm import zh_core_web_sm
from pdf_tools.libs.language import detect_lang from magic_pdf.libs.language import detect_lang
class NLPModels: class NLPModels:
......
...@@ -4,9 +4,9 @@ from typing import Tuple ...@@ -4,9 +4,9 @@ from typing import Tuple
import io import io
# from app.common.s3 import get_s3_client # from app.common.s3 import get_s3_client
from pdf_tools.libs.commons import fitz from magic_pdf.libs.commons import fitz
from loguru import logger from loguru import logger
from pdf_tools.libs.commons import parse_bucket_key, join_path from magic_pdf.libs.commons import parse_bucket_key, join_path
def cut_image(bbox: Tuple, page_num: int, page: fitz.Page, save_parent_path: str, s3_return_path=None, img_s3_client=None, upload_switch=True): def cut_image(bbox: Tuple, page_num: int, page: fitz.Page, save_parent_path: str, s3_return_path=None, img_s3_client=None, upload_switch=True):
......
from pdf_tools.libs.commons import fitz from magic_pdf.libs.commons import fitz
import os import os
......
import os import os
import unicodedata import unicodedata
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
if sys.version_info[0] >= 3: if sys.version_info[0] >= 3:
......
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
if sys.version_info[0] >= 3: if sys.version_info[0] >= 3:
......
import sys import sys
from pdf_tools.libs.commons import fitz from magic_pdf.libs.commons import fitz
from termcolor import cprint from termcolor import cprint
......
import math import math
from collections import defaultdict from collections import defaultdict
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
if sys.version_info[0] >= 3: if sys.version_info[0] >= 3:
sys.stdout.reconfigure(encoding="utf-8") # type: ignore sys.stdout.reconfigure(encoding="utf-8") # type: ignore
......
from pdf_tools.libs.commons import fitz from magic_pdf.libs.commons import fitz
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
if sys.version_info[0] >= 3: if sys.version_info[0] >= 3:
......
import math import math
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
if sys.version_info[0] >= 3: if sys.version_info[0] >= 3:
......
import os import os
import json import json
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
from pdf_tools.para.raw_processor import RawBlockProcessor from magic_pdf.para.raw_processor import RawBlockProcessor
from pdf_tools.para.layout_match_processor import LayoutFilterProcessor from magic_pdf.para.layout_match_processor import LayoutFilterProcessor
from pdf_tools.para.stats import BlockStatisticsCalculator from magic_pdf.para.stats import BlockStatisticsCalculator
from pdf_tools.para.stats import DocStatisticsCalculator from magic_pdf.para.stats import DocStatisticsCalculator
from pdf_tools.para.title_processor import TitleProcessor from magic_pdf.para.title_processor import TitleProcessor
from pdf_tools.para.block_termination_processor import BlockTerminationProcessor from magic_pdf.para.block_termination_processor import BlockTerminationProcessor
from pdf_tools.para.block_continuation_processor import BlockContinuationProcessor from magic_pdf.para.block_continuation_processor import BlockContinuationProcessor
from pdf_tools.para.draw import DrawAnnos from magic_pdf.para.draw import DrawAnnos
from pdf_tools.para.exceptions import ( from magic_pdf.para.exceptions import (
DenseSingleLineBlockException, DenseSingleLineBlockException,
TitleDetectionException, TitleDetectionException,
TitleLevelException, TitleLevelException,
......
from collections import Counter from collections import Counter
import numpy as np import numpy as np
from pdf_tools.para.commons import * from magic_pdf.para.commons import *
if sys.version_info[0] >= 3: if sys.version_info[0] >= 3:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment