Unverified commit 01c99a99, authored by Mick and committed by GitHub
Browse files

chore: update Dockerfile (#8872)


Co-authored-by: zhyncs <me@zhyncs.com>
parent b114a810
...@@ -14,7 +14,7 @@ ENV PATH="${PATH}:/usr/local/nvidia/bin" \ ...@@ -14,7 +14,7 @@ ENV PATH="${PATH}:/usr/local/nvidia/bin" \
RUN apt update && apt install wget -y && apt install software-properties-common -y \ RUN apt update && apt install wget -y && apt install software-properties-common -y \
&& add-apt-repository ppa:deadsnakes/ppa -y \ && add-apt-repository ppa:deadsnakes/ppa -y \
&& apt install python3.12-full -y \ && apt install python3.12-full python3.12-dev python3.10-venv -y \
&& update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1 \ && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1 \
&& update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 2 \ && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 2 \
&& update-alternatives --set python3 /usr/bin/python3.12 \ && update-alternatives --set python3 /usr/bin/python3.12 \
...@@ -28,7 +28,6 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \ ...@@ -28,7 +28,6 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \
tzdata \ tzdata \
software-properties-common netcat-openbsd kmod unzip openssh-server \ software-properties-common netcat-openbsd kmod unzip openssh-server \
curl wget lsof zsh ccache tmux htop git-lfs tree \ curl wget lsof zsh ccache tmux htop git-lfs tree \
python3 python3-pip python3-dev libpython3-dev python3-venv \
build-essential cmake \ build-essential cmake \
libopenmpi-dev libnuma1 libnuma-dev \ libopenmpi-dev libnuma1 libnuma-dev \
libibverbs-dev libibverbs1 libibumad3 \ libibverbs-dev libibverbs1 libibumad3 \
...@@ -44,7 +43,7 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \ ...@@ -44,7 +43,7 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \
patchelf \ patchelf \
nvidia-dkms-550 \ nvidia-dkms-550 \
devscripts debhelper fakeroot dkms check libsubunit0 libsubunit-dev \ devscripts debhelper fakeroot dkms check libsubunit0 libsubunit-dev \
&& ln -sf /usr/bin/python3 /usr/bin/python \ && ln -sf /usr/bin/python3.12 /usr/bin/python \
&& rm -rf /var/lib/apt/lists/* \ && rm -rf /var/lib/apt/lists/* \
&& apt-get clean && apt-get clean
...@@ -67,12 +66,16 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li ...@@ -67,12 +66,16 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li
&& case "$CUDA_VERSION" in \ && case "$CUDA_VERSION" in \
12.6.1) CUINDEX=126 ;; \ 12.6.1) CUINDEX=126 ;; \
12.8.1) CUINDEX=128 ;; \ 12.8.1) CUINDEX=128 ;; \
12.9.1) CUINDEX=129 ;; \
*) echo "Unsupported CUDA version: $CUDA_VERSION" && exit 1 ;; \ *) echo "Unsupported CUDA version: $CUDA_VERSION" && exit 1 ;; \
esac \ esac \
&& python3 -m pip install --no-cache-dir -e "python[${BUILD_TYPE}]" --extra-index-url https://download.pytorch.org/whl/cu${CUINDEX} \ && python3 -m pip install --no-cache-dir -e "python[${BUILD_TYPE}]" --extra-index-url https://download.pytorch.org/whl/test/cu${CUINDEX} \
&& python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \ && python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \
&& if [ "$CUDA_VERSION" = "12.8.1" ]; then \ && if [ "$CUDA_VERSION" = "12.8.1" ]; then \
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.2.9/sgl_kernel-0.2.9+cu128-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.2/sgl_kernel-0.3.2+cu128-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
fi \
&& if [ "$CUDA_VERSION" = "12.9.1" ]; then \
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.2/sgl_kernel-0.3.2-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
fi fi
# Build and install NVSHMEM + DeepEP # Build and install NVSHMEM + DeepEP
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment