"examples/git@developer.sourcefind.cn:OpenDAS/ollama.git" did not exist on "42b797ed9c9138c35e118f39041e9699ea6e6843"
Unverified Commit b420094b authored by Xiaomeng Zhao's avatar Xiaomeng Zhao Committed by GitHub
Browse files

Merge branch 'opendatalab:dev' into dev

parents e7649e43 9e6256c5
# Documentation:
# https://docs.sglang.ai/backend/server_arguments.html#common-launch-commands
services: services:
mineru-sglang: mineru-sglang:
image: mineru-sglang:latest image: mineru-sglang:latest
...@@ -11,6 +13,10 @@ services: ...@@ -11,6 +13,10 @@ services:
command: command:
--host 0.0.0.0 --host 0.0.0.0
--port 30000 --port 30000
# --enable-torch-compile # Optionally enable torch.compile to speed up inference by approximately 15%
# --dp 2 # If you have two or more GPUs with at least 24GB of VRAM each, you can use sglang's data-parallel (DP) multi-GPU mode to increase throughput
# --tp 2 # If you have two GPUs with 12GB or 16GB VRAM, you can use the Tensor Parallel (TP) mode
# --mem-fraction-static 0.7 # If you have two GPUs with 11GB of VRAM each, you also need to reduce the KV cache size in addition to enabling Tensor Parallel (TP) mode
ulimits: ulimits:
memlock: -1 memlock: -1
stack: 67108864 stack: 67108864
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment