hotfix: update nccl

a8950294 · OlivierDehaene · e7e3aa6c · a8950294 · a8950294
Unverified Commit a8950294 authored Jul 23, 2024 by OlivierDehaene
Show whitespace changes
Inline Side-by-side

Showing with 5 additions and 1 deletion

Dockerfile +4 -1

server/Makefile +1 -0

No files found.
--- a/Dockerfile
+++ b/Dockerfile
@@ -252,7 +252,12 @@ COPY server/Makefile server/Makefile
 RUN cd server && \
    make gen-server && \
    pip install -r requirements_cuda.txt && \
-    pip install ".[bnb, accelerate, quantize, peft, outlines]" --no-cache-dir
+    pip install ".[bnb, accelerate, quantize, peft, outlines]" --no-cache-dir && \
+    pip install nvidia-nccl-cu12==2.22.3 --no-cache-dir
+
+# Preload the NCCL build pinned above so the dynamic loader maps it before any other libnccl.
+# NOTE(review): the path hard-codes conda's python3.10 site-packages - confirm it matches the base image.
+ENV LD_PRELOAD=/opt/conda/lib/python3.10/site-packages/nvidia/nccl/lib/libnccl.so.2

 # Deps before the binaries
 # The binaries change on every build given we burn the SHA into them

--- a/server/Makefile
+++ b/server/Makefile
@@ -30,6 +30,7 @@ install: install-cuda

 install-cuda: install-server install-flash-attention-v2-cuda install-vllm-cuda install-flash-attention install-fbgemm
 	pip install -e ".[bnb]"
+	pip install nvidia-nccl-cu12==2.22.3

 install-rocm: install-server install-flash-attention-v2-rocm  install-vllm-rocm