"examples/runtime/multimodal/llava_onevision_server.py" did not exist on "c9064e6fd9a5356ee579e9d452bfad725f8e6f2c"
Dockerfile 342 Bytes
Newer Older
Ying Sheng's avatar
Ying Sheng committed
1
2
3
4
5
6
# Installs sglang, triton-nightly and flashinfer on top of the
# vllm/vllm-openai base image.
#
# BASE_TAG selects which tag of vllm/vllm-openai to build on. The default
# ("latest") matches what the previously untagged FROM resolved to; override
# it for reproducible builds:
#   docker build --build-arg BASE_TAG=<tag> .
# NOTE(review): the flashinfer wheel index used below targets CUDA 12.1 /
# torch 2.3, so a pinned base tag presumably has to ship a matching torch
# build -- confirm before pinning.
ARG BASE_TAG=latest
FROM vllm/vllm-openai:${BASE_TAG}

# --no-cache-dir keeps pip's download cache out of the image layers.
RUN pip install --no-cache-dir --upgrade pip
RUN pip install --no-cache-dir "sglang[all]"

# Swap any installed triton / triton-nightly for the build published on the
# Triton-Nightly package index. --no-deps makes pip install only the
# triton-nightly package itself, leaving already-installed packages untouched.
RUN pip uninstall -y triton triton-nightly \
    && pip install --no-cache-dir --no-deps \
        --index-url https://aiinfra.pkgs.visualstudio.com/PublicPackages/_packaging/Triton-Nightly/pypi/simple/ \
        triton-nightly

# flashinfer is installed from the project's own wheel index (cu121 / torch2.3).
RUN pip install --no-cache-dir flashinfer -i https://flashinfer.ai/whl/cu121/torch2.3/