Commit 7210f7a6 authored by myhloli's avatar myhloli

perf(model): enable bfloat16 for layoutreader on supported devices

- Add bf_16_support check for CUDA and MPS devices
- Use bfloat16 precision for layoutreader model on supported devices
- Improve performance on devices with bf_16 support
parent cf4ea78d
@@ -333,8 +333,14 @@ def txt_spans_extract_v2(pdf_page, spans, all_bboxes, all_discarded_blocks, lang
 def model_init(model_name: str):
     from transformers import LayoutLMv3ForTokenClassification
-    device = torch.device(get_device())
+    device_name = get_device()
+    bf_16_support = False
+    if device_name.startswith("cuda"):
+        bf_16_support = torch.cuda.is_bf16_supported()
+    elif device_name.startswith("mps"):
+        bf_16_support = True
+    device = torch.device(device_name)
     if model_name == 'layoutreader':
         # Check whether the modelscope cache directory exists
         layoutreader_model_dir = get_local_layoutreader_model_dir()
@@ -349,7 +355,10 @@ def model_init(model_name: str):
         model = LayoutLMv3ForTokenClassification.from_pretrained(
             'hantian/layoutreader'
         )
-        model.to(device).eval()
+        if bf_16_support:
+            model.to(device).eval().bfloat16()
+        else:
+            model.to(device).eval()
     else:
         logger.error('model name not allow')
         exit(1)
...
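
For reference, the bfloat16 capability check introduced here can be sketched in isolation. This is a minimal, hypothetical example mirroring the logic of the diff; the function name load_layoutreader_bf16_aware is not part of the repository, and it assumes only torch and transformers are installed, while get_device() and the modelscope cache handling from model_init are omitted:

import torch
from transformers import LayoutLMv3ForTokenClassification

def load_layoutreader_bf16_aware(device_name: str):
    # bfloat16 is enabled only when the target device can handle it:
    # CUDA devices report support via torch.cuda.is_bf16_supported(),
    # while Apple MPS is assumed to support bfloat16, as in the commit.
    bf_16_support = False
    if device_name.startswith("cuda"):
        bf_16_support = torch.cuda.is_bf16_supported()
    elif device_name.startswith("mps"):
        bf_16_support = True

    model = LayoutLMv3ForTokenClassification.from_pretrained('hantian/layoutreader')
    model = model.to(torch.device(device_name)).eval()
    if bf_16_support:
        # Cast the weights to bfloat16 for faster inference on hardware
        # with native bfloat16 support.
        model = model.bfloat16()
    return model

Keeping float32 as the fallback means devices without bfloat16 support (older CUDA GPUs, CPU-only setups) load the model exactly as before, so the change is an opt-in performance path.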