"test/torchscript_consistency_impl.py" did not exist on "5f5df1d649de8504c68ec532195ab1ba3fb54680"
Commit 0b05dff7 authored by myhloli's avatar myhloli
Browse files

perf(inference): adjust batch ratio for high GPU memory

- Increase batch ratio to 8 when GPU memory is >= 16 GB (previously 4 for any GPU with >= 10 GB)
- Improve inference performance on systems with higher GPU memory
parent f20ab37d
......@@ -170,7 +170,9 @@ def doc_analyze(
     gpu_memory = int(os.getenv("VIRTUAL_VRAM_SIZE", round(get_vram(device))))
     if gpu_memory is not None and gpu_memory >= 8:
-        if gpu_memory >= 10:
+        if gpu_memory >= 16:
+            batch_ratio = 8
+        elif gpu_memory >= 10:
             batch_ratio = 4
         else:
             batch_ratio = 2
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment