Unverified Commit 58da4ee0 authored by Ryan Rock, committed by GitHub
Browse files

[AMD][CI] Update DeepEP branch (#38396)


Signed-off-by: Ryan Rock <ryan.rock@amd.com>
parent 1ae11e2b
...@@ -2613,6 +2613,7 @@ steps: ...@@ -2613,6 +2613,7 @@ steps:
- vllm/platforms/rocm.py - vllm/platforms/rocm.py
commands: commands:
- export TORCH_NCCL_BLOCKING_WAIT=1 - export TORCH_NCCL_BLOCKING_WAIT=1
- VLLM_LOGGING_LEVEL=DEBUG python3 examples/offline_inference/data_parallel.py --model=Qwen/Qwen1.5-MoE-A2.7B -tp=1 -dp=2 --max-model-len=2048 --all2all-backend=deepep_high_throughput
- pytest -v -s tests/v1/distributed/test_dbo.py - pytest -v -s tests/v1/distributed/test_dbo.py
...@@ -3601,7 +3602,6 @@ steps: ...@@ -3601,7 +3602,6 @@ steps:
commands: commands:
- export TORCH_NCCL_BLOCKING_WAIT=1 - export TORCH_NCCL_BLOCKING_WAIT=1
- pytest -v -s tests/distributed/test_context_parallel.py - pytest -v -s tests/distributed/test_context_parallel.py
- VLLM_LOGGING_LEVEL=DEBUG python3 examples/offline_inference/data_parallel.py --model=Qwen/Qwen1.5-MoE-A2.7B -tp=1 -dp=2 --max-model-len=2048 --all2all-backend=deepep_high_throughput
- pytest -v -s tests/v1/distributed/test_dbo.py - pytest -v -s tests/v1/distributed/test_dbo.py
......
...@@ -192,9 +192,10 @@ RUN cd /opt/rixl && mkdir -p /app/install && \ ...@@ -192,9 +192,10 @@ RUN cd /opt/rixl && mkdir -p /app/install && \
FROM base AS build_deep FROM base AS build_deep
ARG ROCSHMEM_BRANCH="ba0bf0f3" ARG ROCSHMEM_BRANCH="ba0bf0f3"
ARG ROCSHMEM_REPO="https://github.com/ROCm/rocm-systems.git" ARG ROCSHMEM_REPO="https://github.com/ROCm/rocm-systems.git"
ARG DEEPEP_BRANCH="e84464ec" ARG DEEPEP_BRANCH="5d90af8b"
ARG DEEPEP_REPO="https://github.com/ROCm/DeepEP.git" ARG DEEPEP_REPO="https://github.com/ROCm/DeepEP.git"
ARG DEEPEP_NIC="cx7" ARG DEEPEP_NIC="cx7"
ARG DEEPEP_ROCM_ARCH="gfx942;gfx950"
ENV ROCSHMEM_DIR=/opt/rocshmem ENV ROCSHMEM_DIR=/opt/rocshmem
RUN git clone ${ROCSHMEM_REPO} \ RUN git clone ${ROCSHMEM_REPO} \
...@@ -202,13 +203,11 @@ RUN git clone ${ROCSHMEM_REPO} \ ...@@ -202,13 +203,11 @@ RUN git clone ${ROCSHMEM_REPO} \
&& git checkout ${ROCSHMEM_BRANCH} \ && git checkout ${ROCSHMEM_BRANCH} \
&& mkdir -p projects/rocshmem/build \ && mkdir -p projects/rocshmem/build \
&& cd projects/rocshmem/build \ && cd projects/rocshmem/build \
&& cmake .. \ && bash ../scripts/build_configs/all_backends \
-DCMAKE_INSTALL_PREFIX="${ROCSHMEM_DIR}" \ -DCMAKE_INSTALL_PREFIX="${ROCSHMEM_DIR}" \
-DROCM_PATH=/opt/rocm \ -DROCM_PATH=/opt/rocm \
-DCMAKE_POSITION_INDEPENDENT_CODE=ON \ -DGPU_TARGETS="${DEEPEP_ROCM_ARCH}" \
-DUSE_EXTERNAL_MPI=OFF \ -DUSE_EXTERNAL_MPI=OFF
&& make -j \
&& make install
# Build DeepEP wheel. # Build DeepEP wheel.
# DeepEP looks for rocshmem at ROCSHMEM_DIR. # DeepEP looks for rocshmem at ROCSHMEM_DIR.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment