Unverified commit 2c1f06b3, authored by Xiaomeng Zhao, committed by GitHub
Browse files

Merge pull request #1459 from myhloli/dev

Dev
parents aa535316 a80ff051
...@@ -24,11 +24,11 @@ def get_model_config(): ...@@ -24,11 +24,11 @@ def get_model_config():
config_path = os.path.join(model_config_dir, 'model_configs.yaml') config_path = os.path.join(model_config_dir, 'model_configs.yaml')
with open(config_path, 'r', encoding='utf-8') as f: with open(config_path, 'r', encoding='utf-8') as f:
configs = yaml.load(f, Loader=yaml.FullLoader) configs = yaml.load(f, Loader=yaml.FullLoader)
return local_models_dir, device, configs return root_dir, local_models_dir, device, configs
def get_text_images(simple_images): def get_text_images(simple_images):
local_models_dir, device, configs = get_model_config() _, local_models_dir, device, configs = get_model_config()
atom_model_manager = AtomModelSingleton() atom_model_manager = AtomModelSingleton()
temp_layout_model = atom_model_manager.get_atom_model( temp_layout_model = atom_model_manager.get_atom_model(
atom_model_name=AtomicModel.Layout, atom_model_name=AtomicModel.Layout,
...@@ -69,15 +69,11 @@ def model_init(model_name: str): ...@@ -69,15 +69,11 @@ def model_init(model_name: str):
atom_model_manager = AtomModelSingleton() atom_model_manager = AtomModelSingleton()
if model_name == MODEL_NAME.YOLO_V11_LangDetect: if model_name == MODEL_NAME.YOLO_V11_LangDetect:
local_models_dir, device, configs = get_model_config() root_dir, _, device, _ = get_model_config()
model = atom_model_manager.get_atom_model( model = atom_model_manager.get_atom_model(
atom_model_name=AtomicModel.LangDetect, atom_model_name=AtomicModel.LangDetect,
langdetect_model_name=MODEL_NAME.YOLO_V11_LangDetect, langdetect_model_name=MODEL_NAME.YOLO_V11_LangDetect,
langdetect_model_weight=str( langdetect_model_weight=str(os.path.join(root_dir, 'resources', 'yolov11-langdetect', 'yolo_v11_ft.pt')),
os.path.join(
local_models_dir, configs['weights'][MODEL_NAME.YOLO_V11_LangDetect]
)
),
device=device, device=device,
) )
else: else:
......
...@@ -768,6 +768,11 @@ def parse_page_core( ...@@ -768,6 +768,11 @@ def parse_page_core(
"""重排block""" """重排block"""
sorted_blocks = sorted(fix_blocks, key=lambda b: b['index']) sorted_blocks = sorted(fix_blocks, key=lambda b: b['index'])
"""block内重排(img和table的block内多个caption或footnote的排序)"""
for block in sorted_blocks:
if block['type'] in [BlockType.Image, BlockType.Table]:
block['blocks'] = sorted(block['blocks'], key=lambda b: b['index'])
"""获取QA需要外置的list""" """获取QA需要外置的list"""
images, tables, interline_equations = get_qa_need_list_v2(sorted_blocks) images, tables, interline_equations = get_qa_need_list_v2(sorted_blocks)
......
...@@ -5,5 +5,4 @@ weights: ...@@ -5,5 +5,4 @@ weights:
unimernet_small: MFR/unimernet_small unimernet_small: MFR/unimernet_small
struct_eqtable: TabRec/StructEqTable struct_eqtable: TabRec/StructEqTable
tablemaster: TabRec/TableMaster tablemaster: TabRec/TableMaster
rapid_table: TabRec/RapidTable rapid_table: TabRec/RapidTable
yolo_v11n_langdetect: LangDetect/YOLO/yolo_v11_ft.pt \ No newline at end of file
\ No newline at end of file
No preview for this file type
...@@ -51,7 +51,7 @@ if __name__ == '__main__': ...@@ -51,7 +51,7 @@ if __name__ == '__main__':
"doclayout_yolo==0.0.2", # doclayout_yolo "doclayout_yolo==0.0.2", # doclayout_yolo
"rapidocr-paddle", # rapidocr-paddle "rapidocr-paddle", # rapidocr-paddle
"rapidocr_onnxruntime", "rapidocr_onnxruntime",
"rapid_table", # rapid_table "rapid_table==0.3.0", # rapid_table
"PyYAML", # yaml "PyYAML", # yaml
"openai", # openai SDK "openai", # openai SDK
"detectron2" "detectron2"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment