Merge pull request #1595 from myhloli/dev

perf(magic_pdf): optimize batch processing for GPU

Merge pull request #1595 from myhloli/dev
perf(magic_pdf): optimize batch processing for GPU
98c05682 · Xiaomeng Zhao · GitHub · 08a9558f · b6710b99 · 98c05682
Unverified commit 98c05682, authored Jan 21, 2025 by Xiaomeng Zhao; committed by GitHub on Jan 21, 2025
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 12 additions and 1 deletion

magic_pdf/model/doc_analyze_by_custom_model.py (+12 -1)

No files found.
--- a/magic_pdf/model/doc_analyze_by_custom_model.py
+++ b/magic_pdf/model/doc_analyze_by_custom_model.py
@@ -177,7 +177,18 @@ def doc_analyze(
    if torch.cuda.is_available() and device != 'cpu' or npu_support:
        gpu_memory = int(os.getenv("VIRTUAL_VRAM_SIZE", round(get_vram(device))))
        if gpu_memory is not None and gpu_memory >= 8:
-            batch_ratio = int(gpu_memory-6)
+
+            if 8 <= gpu_memory < 10:
+                batch_ratio = 2
+            elif 10 <= gpu_memory <= 12:
+                batch_ratio = 4
+            elif 12 < gpu_memory <= 16:
+                batch_ratio = 8
+            elif 16 < gpu_memory <= 24:
+                batch_ratio = 16
+            else:
+                batch_ratio = 32
+
            if batch_ratio >= 1:
                logger.info(f'gpu_memory: {gpu_memory} GB, batch_ratio: {batch_ratio}')
                batch_model = BatchAnalyze(model=custom_model, batch_ratio=batch_ratio)