Commit b1ac7afd authored by myhloli's avatar myhloli
Browse files

perf(model): optimize batch ratio for different GPU memory sizes

- Update batch ratio calculation logic to better utilize available GPU memory
- Improve logging for all GPU memory sizes
parent 29e7a948
...@@ -178,21 +178,20 @@ def doc_analyze( ...@@ -178,21 +178,20 @@ def doc_analyze(
gpu_memory = int(os.getenv("VIRTUAL_VRAM_SIZE", round(get_vram(device)))) gpu_memory = int(os.getenv("VIRTUAL_VRAM_SIZE", round(get_vram(device))))
if gpu_memory is not None and gpu_memory >= 8: if gpu_memory is not None and gpu_memory >= 8:
if 8 <= gpu_memory < 10: if gpu_memory >= 40:
batch_ratio = 2 batch_ratio = 32
    elif 10 <= gpu_memory <= 12: elif gpu_memory >= 20:
batch_ratio = 4
elif 12 < gpu_memory <= 20:
batch_ratio = 8
elif 20 < gpu_memory <= 32:
batch_ratio = 16 batch_ratio = 16
elif gpu_memory >= 16:
batch_ratio = 8
elif gpu_memory >= 10:
batch_ratio = 4
else: else:
batch_ratio = 32 batch_ratio = 2
if batch_ratio >= 1: logger.info(f'gpu_memory: {gpu_memory} GB, batch_ratio: {batch_ratio}')
logger.info(f'gpu_memory: {gpu_memory} GB, batch_ratio: {batch_ratio}') batch_model = BatchAnalyze(model=custom_model, batch_ratio=batch_ratio)
batch_model = BatchAnalyze(model=custom_model, batch_ratio=batch_ratio) batch_analyze = True
batch_analyze = True
model_json = [] model_json = []
doc_analyze_start = time.time() doc_analyze_start = time.time()
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment