{# # SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved. # SPDX-License-Identifier: Apache-2.0 #} # === BEGIN templates/dynamo_runtime.Dockerfile === ####################################### ########## Runtime image ############## ####################################### FROM dynamo_base AS runtime ARG ARCH_ALT ARG PYTHON_VERSION # Create dynamo user with group 0 for OpenShift compatibility RUN userdel -r ubuntu > /dev/null 2>&1 || true \ && useradd -m -s /bin/bash -g 0 dynamo \ && [ `id -u dynamo` -eq 1000 ] \ && mkdir -p /home/dynamo/.cache /opt/dynamo \ # Non-recursive chown - only the directories themselves, not contents && chown dynamo:0 /home/dynamo /home/dynamo/.cache /opt/dynamo /workspace \ # No chmod needed: umask 002 handles new files, COPY --chmod handles copied content # Set umask globally for all subsequent RUN commands (must be done as root before USER dynamo) # NOTE: Setting ENV UMASK=002 does NOT work - umask is a shell builtin, not an environment variable && mkdir -p /etc/profile.d && echo 'umask 002' > /etc/profile.d/00-umask.sh # NIXL environment variables ENV NIXL_PREFIX=/opt/nvidia/nvda_nixl \ NIXL_LIB_DIR=/opt/nvidia/nvda_nixl/lib/${ARCH_ALT}-linux-gnu \ NIXL_PLUGIN_DIR=/opt/nvidia/nvda_nixl/lib/${ARCH_ALT}-linux-gnu/plugins \ CARGO_TARGET_DIR=/opt/dynamo/target ENV LD_LIBRARY_PATH=\ ${NIXL_LIB_DIR}:\ ${NIXL_PLUGIN_DIR}:\ /usr/local/ucx/lib:\ /usr/local/ucx/lib/ucx:\ ${LD_LIBRARY_PATH} # Copy ucx and nixl libs COPY --chown=dynamo: --from=wheel_builder /usr/local/ucx/ /usr/local/ucx/ COPY --chown=dynamo: --from=wheel_builder ${NIXL_PREFIX}/ ${NIXL_PREFIX}/ COPY --chown=dynamo: --from=wheel_builder /opt/nvidia/nvda_nixl/lib64/. ${NIXL_LIB_DIR}/ COPY --chown=dynamo: --from=wheel_builder /opt/dynamo/dist/nixl/ /opt/dynamo/wheelhouse/nixl/ COPY --chown=dynamo: --from=wheel_builder /workspace/nixl/build/src/bindings/python/nixl-meta/nixl-*.whl /opt/dynamo/wheelhouse/nixl/ # Always copy FFmpeg so libs are available for Rust checks in CI RUN --mount=type=bind,from=wheel_builder,source=/usr/local/,target=/tmp/usr/local/ \ mkdir -p /usr/local/lib/pkgconfig && \ cp -rnL /tmp/usr/local/include/libav* /tmp/usr/local/include/libsw* /usr/local/include/ && \ cp -nL /tmp/usr/local/lib/libav*.so /tmp/usr/local/lib/libsw*.so /usr/local/lib/ && \ cp -nL /tmp/usr/local/lib/pkgconfig/libav*.pc /tmp/usr/local/lib/pkgconfig/libsw*.pc /usr/local/lib/pkgconfig/ && \ cp -r /tmp/usr/local/src/ffmpeg /usr/local/src/ {% if target not in ("dev", "local-dev") %} # Copy built artifacts (not needed for dev/local-dev; users build from source) COPY --chown=dynamo: --from=wheel_builder $CARGO_TARGET_DIR $CARGO_TARGET_DIR {% endif %} COPY --chown=dynamo: --from=wheel_builder /opt/dynamo/dist/*.whl /opt/dynamo/wheelhouse/ # Install Python for framework=none runtime (cuda-dl-base doesn't include Python) # This is needed to create venv and install dynamo packages ARG PYTHON_VERSION # Cache apt downloads; sharing=locked avoids apt/dpkg races with concurrent builds. # Clear partial downloads first to avoid stale rename failures from prior interrupted builds. RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \ rm -rf /var/cache/apt/archives/partial/* && \ apt-get update && \ DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \ python${PYTHON_VERSION}-dev \ python${PYTHON_VERSION}-venv \ build-essential \ cmake \ protobuf-compiler \ pkg-config \ clang \ libclang-dev \ patchelf \ git \ git-lfs && \ rm -rf /var/lib/apt/lists/* && \ ln -sf /usr/bin/python${PYTHON_VERSION} /usr/bin/python3 # Switch to dynamo user and create virtual environment USER dynamo ENV HOME=/home/dynamo # Create and activate virtual environment # Use login shell to pick up umask 002 from /etc/profile.d/00-umask.sh for group-writable files SHELL ["/bin/bash", "-l", "-o", "pipefail", "-c"] # Cache uv downloads; uv handles its own locking for the cache. RUN --mount=type=cache,target=/home/dynamo/.cache/uv,uid=1000,gid=0,mode=0775 \ export UV_CACHE_DIR=/home/dynamo/.cache/uv && \ uv venv /opt/dynamo/venv --python ${PYTHON_VERSION} ENV VIRTUAL_ENV=/opt/dynamo/venv \ PATH="/opt/dynamo/venv/bin:${PATH}" {% if target not in ("dev", "local-dev") %} # Install dynamo wheels (runtime packages only, no test dependencies) # uv handles its own locking for the cache, no need to add sharing=locked ARG ENABLE_KVBM RUN --mount=type=cache,target=/home/dynamo/.cache/uv,uid=1000,gid=0,mode=0775 \ export UV_CACHE_DIR=/home/dynamo/.cache/uv && \ uv pip install \ /opt/dynamo/wheelhouse/ai_dynamo_runtime*.whl \ /opt/dynamo/wheelhouse/ai_dynamo*any.whl \ /opt/dynamo/wheelhouse/nixl/nixl*.whl && \ if [ "$ENABLE_KVBM" = "true" ]; then \ KVBM_WHEEL=$(ls /opt/dynamo/wheelhouse/kvbm*.whl 2>/dev/null | head -1); \ if [ -z "$KVBM_WHEEL" ]; then \ echo "ERROR: ENABLE_KVBM is true but no KVBM wheel found in wheelhouse" >&2; \ exit 1; \ fi; \ uv pip install "$KVBM_WHEEL"; \ fi {% else %} # Dev/local-dev: skip dynamo wheel install (users build from source via cargo build + maturin develop). # Install NIXL wheel only (pre-built C++ binary, not buildable from source). RUN --mount=type=cache,target=/home/dynamo/.cache/uv,uid=1000,gid=0,mode=0775 \ export UV_CACHE_DIR=/home/dynamo/.cache/uv && \ uv pip install /opt/dynamo/wheelhouse/nixl/nixl*.whl {% endif %} # Install gpu_memory_service wheel if enabled (all targets) ARG ENABLE_GPU_MEMORY_SERVICE RUN --mount=type=cache,target=/home/dynamo/.cache/uv,uid=1000,gid=0,mode=0775 \ if [ "${ENABLE_GPU_MEMORY_SERVICE}" = "true" ]; then \ export UV_CACHE_DIR=/home/dynamo/.cache/uv && \ GMS_WHEEL=$(ls /opt/dynamo/wheelhouse/gpu_memory_service*.whl 2>/dev/null | head -1); \ if [ -n "$GMS_WHEEL" ]; then uv pip install "$GMS_WHEEL"; fi; \ fi # Initialize Git LFS (required for git+https dependencies with LFS artifacts) RUN git lfs install # Install runtime dependencies (common + planner + frontend). # Frontend deps (tritonclient + grpcio/protobuf pins) are installed here so the resolver # sees all constraints in one pass, avoiding grpcio downgrades in the test layer. # Test and dev dependencies are NOT installed here — they go in the test and dev images. RUN --mount=type=bind,source=./container/deps/requirements.common.txt,target=/tmp/requirements.common.txt \ --mount=type=bind,source=./container/deps/requirements.planner.txt,target=/tmp/requirements.planner.txt \ --mount=type=bind,source=./container/deps/requirements.frontend.txt,target=/tmp/requirements.frontend.txt \ --mount=type=cache,target=/home/dynamo/.cache/uv,uid=1000,gid=0,mode=0775 \ export UV_CACHE_DIR=/home/dynamo/.cache/uv UV_GIT_LFS=1 UV_HTTP_TIMEOUT=300 UV_HTTP_RETRIES=5 && \ uv pip install \ --index-strategy unsafe-best-match \ --extra-index-url https://download.pytorch.org/whl/cu130 \ --requirement /tmp/requirements.common.txt \ --requirement /tmp/requirements.planner.txt \ --requirement /tmp/requirements.frontend.txt # TODO: skip /workspace COPY for dev/local-dev (bind-mounted from host, gets shadowed) # Copy workspace source code ARG WORKSPACE_DIR=/workspace WORKDIR ${WORKSPACE_DIR} COPY --chmod=775 --chown=dynamo:0 ./ ${WORKSPACE_DIR}/ RUN chmod g+w ${WORKSPACE_DIR} ARG DYNAMO_COMMIT_SHA ENV DYNAMO_COMMIT_SHA=$DYNAMO_COMMIT_SHA ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"] CMD []