Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
tsoc
superbenchmark
Commits
b015ceeb
Unverified
Commit
b015ceeb
authored
Apr 23, 2026
by
one
Committed by
GitHub
Apr 23, 2026
Browse files
Dockerfiles: Use different dockerfiles for pytorch/vllm base images (#16)
parent
4fa10f4d
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
233 additions
and
20 deletions
+233
-20
dockerfile/dtk26.04-pytorch2.7.1.dockerfile
dockerfile/dtk26.04-pytorch2.7.1.dockerfile
+189
-0
dockerfile/dtk26.04-vllm0.11.0.dockerfile
dockerfile/dtk26.04-vllm0.11.0.dockerfile
+22
-10
dockerfile/dtk26.04_docker18.dockerfile
dockerfile/dtk26.04_docker18.dockerfile
+22
-10
No files found.
dockerfile/dtk26.04-pytorch2.7.1.dockerfile
0 → 100644
View file @
b015ceeb
# Default base image; override it with the BASE_IMAGE build argument.
ARG BASE_IMAGE="harbor.sourcefind.cn:5443/dcu/admin/base/pytorch:2.7.1-ubuntu22.04-dtk26.04-py3.11"
FROM ${BASE_IMAGE}
# Included in the base image:
# - Ubuntu: 22.04
# - Python: 3.11
# - DTK: 26.04
# - AMD SMI: 24.5.3+02cbffb.dirty
# - Torch: 2.7.1+das.opt1.dtk2604
# - Torchvision: 0.22.0+das.opt1.dtk2604.torch271
# - vLLM: 0.11.0+das.opt1.dtk2604.torch271
# - ONNX Runtime: 1.19.2+das.opt1.dtk2604.torch271
# - DeepSpeed: 0.18.2+das.opt1.dtk2604.torch271
# - Apex: 1.7.0+das.opt1.dtk2604.torch271
# - FlashAttention: 2.6.1+das.opt1.dtk2604.torch271
# - Transformer Engine: 2.10.0+das.opt1.dtk2604.torch271
# - Triton: 3.1.0+das.opt1.dtk2604.torch271
# - Megatron Core: 0.15.4+das.opt1.dtk2604.torch271
# - DCU Megatron: 0.15.0+das.opt1.dtk2604.torch271
# - Byte Flux: 1.0.4+das.opt1.dtk2604.torch271
# Added or changed by this Dockerfile:
# - Docker client: 20.10.8
# - UCX: 1.20.0, built with DTK/ROCm support
# - Open MPI: 5.0.9, built with UCX and DTK/ROCm support
# - Intel MLC: v3.12
# - rocblas-bench and hipblaslt-bench command symlinks
# - RCCL topology mapping override for DTK
# - SSH and ulimit configuration
LABEL maintainer="SuperBench"

# Keep apt/debconf from prompting during package installation.
ENV DEBIAN_FRONTEND=noninteractive

# Install the OS packages needed by the later build steps (autotools, compiler
# toolchain, development headers) plus SSH, networking and hardware
# inspection utilities.
# The package index is refreshed and removed again inside this same layer:
# deleting /var/lib/apt/lists in a later layer would not shrink the image.
RUN apt-get update && \
    apt-get -q install -y --no-install-recommends \
    autoconf \
    automake \
    bc \
    build-essential \
    curl \
    dmidecode \
    git \
    iproute2 \
    jq \
    libaio-dev \
    libboost-program-options-dev \
    libcap2 \
    libcurl4-openssl-dev \
    libnuma-dev \
    libpci-dev \
    libssl-dev \
    libtinfo5 \
    libtool \
    lshw \
    net-tools \
    numactl \
    openssh-client \
    openssh-server \
    pciutils \
    python3.11-venv \
    rsync \
    sudo \
    util-linux \
    vim \
    wget \
    && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/* /tmp/*
# Install Docker
# Download the static Docker release archive for x86_64 and unpack its
# contents directly into /usr/local/bin, dropping the archive's top-level
# directory; the archive is deleted in the same layer.
ENV DOCKER_VERSION=20.10.8
RUN cd /tmp && \
    wget -q -O docker.tgz \
        "https://download.docker.com/linux/static/stable/x86_64/docker-${DOCKER_VERSION}.tgz" && \
    tar -x -f docker.tgz --strip-components=1 -C /usr/local/bin/ && \
    rm docker.tgz
# Update system config
# - create root's SSH directory, an empty authorized_keys file and the sshd
#   runtime directory
# - rewrite sshd_config: PermitRootLogin yes, PermitUserEnvironment yes, Port 22
# - append soft/hard open-file limits of 1048576 for all users ("*") and root
#
# printf is used for the limits.conf entries instead of echo "...\n...":
# whether echo expands "\n" depends on the shell (dash does, bash does not
# without -e), so echo could write a literal backslash-n into the file.
RUN mkdir -p /root/.ssh && \
    touch /root/.ssh/authorized_keys && \
    mkdir -p /var/run/sshd && \
    sed -i "s/[# ]*PermitRootLogin prohibit-password/PermitRootLogin yes/" /etc/ssh/sshd_config && \
    sed -i "s/[# ]*PermitUserEnvironment no/PermitUserEnvironment yes/" /etc/ssh/sshd_config && \
    sed -i "s/[# ]*Port.*/Port 22/" /etc/ssh/sshd_config && \
    printf '%s\n' \
        '* soft nofile 1048576' \
        '* hard nofile 1048576' \
        'root soft nofile 1048576' \
        'root hard nofile 1048576' \
        >> /etc/security/limits.conf
# Location of the DTK installation; passed to the UCX and Open MPI builds
# through --with-rocm.
ENV ROCM_PATH=/opt/dtk

# Install UCX
# Build UCX from the upstream release tarball and install it into ${UCX_HOME}.
# Any previous ${UCX_HOME} is removed right before `make install`, and the
# sources are deleted in the same layer.
# The bind mount exposes the root of "hyhal" at /opt/hyhal for this step only.
# NOTE(review): "hyhal" is not defined in this file - presumably a named build
# context supplied on the build command line; confirm.
ARG UCX_VERSION=1.20.0
ARG UCX_HOME=/opt/ucx
RUN --mount=type=bind,from=hyhal,source=/,target=/opt/hyhal \
    cd /tmp && \
    wget "https://github.com/openucx/ucx/releases/download/v${UCX_VERSION}/ucx-${UCX_VERSION}.tar.gz" && \
    tar -xzf "ucx-${UCX_VERSION}.tar.gz" && \
    cd "ucx-${UCX_VERSION}" && \
    ./contrib/configure-release \
        --prefix=${UCX_HOME} \
        --enable-optimizations \
        --enable-tuning \
        --enable-cma \
        --enable-mt \
        --with-mlx5 \
        --with-rc \
        --with-ud \
        --with-dc \
        --with-dm \
        --with-ib_hw_tm \
        --with-verbs=/usr/include \
        --with-rdmacm=/usr \
        --with-rocm=${ROCM_PATH} \
        --without-knem \
        --without-cuda \
        --without-java && \
    make -j "$(nproc)" && \
    rm -rf ${UCX_HOME} && \
    make install && \
    rm -rf /tmp/ucx-${UCX_VERSION}*
# Install OpenMPI
# Build Open MPI from the upstream release tarball against the UCX in
# ${UCX_HOME} and the DTK in ${ROCM_PATH}, then install it into ${MPI_HOME}.
# ${OMPI_VERSION%.*} strips the patch component (5.0.9 -> 5.0) to form the
# release directory in the download URL.
# The bind mount exposes the root of "hyhal" at /opt/hyhal for this step only.
# NOTE(review): "hyhal" is not defined in this file - presumably a named build
# context supplied on the build command line; confirm.
ENV MPI_HOME=/opt/mpi
ARG OMPI_VERSION=5.0.9
RUN --mount=type=bind,from=hyhal,source=/,target=/opt/hyhal \
    cd /tmp && \
    wget "https://download.open-mpi.org/release/open-mpi/v${OMPI_VERSION%.*}/openmpi-${OMPI_VERSION}.tar.gz" && \
    tar -xzf "openmpi-${OMPI_VERSION}.tar.gz" && \
    cd "openmpi-${OMPI_VERSION}" && \
    ./configure \
        --prefix=${MPI_HOME} \
        --with-ucx=${UCX_HOME} \
        --with-rocm=${ROCM_PATH} \
        --enable-builtin-atomics \
        --enable-wrapper-rpath \
        --enable-mca-no-build=btl-uct \
        --enable-prte-prefix-by-default && \
    make -j "$(nproc)" && \
    rm -rf ${MPI_HOME} && \
    make install && \
    ldconfig && \
    cd / && \
    rm -rf /tmp/openmpi-${OMPI_VERSION}*
# Install Intel MLC
# Download the MLC v3.12 archive, extract only the Linux/mlc binary, copy it
# into /usr/local/bin and delete the archive and extracted directory in the
# same layer.
RUN cd /tmp && \
    wget -q -O mlc.tgz https://downloadmirror.intel.com/866182/mlc_v3.12.tgz && \
    tar -xzf mlc.tgz Linux/mlc && \
    cp ./Linux/mlc /usr/local/bin/ && \
    rm -rf ./Linux mlc.tgz
# Add rocblas-bench to path
# Link the rocblas-bench and hipblaslt-bench tools from their benchmark_tool
# directories into ${ROCM_PATH}/bin, then mark both executable (chmod on a
# symlink applies to the file it points to).
RUN ln -s \
        ${ROCM_PATH}/lib/rocblas/benchmark_tool/rocblas-bench \
        ${ROCM_PATH}/lib/hipblaslt/benchmark_tool/hipblaslt-bench \
        ${ROCM_PATH}/bin/ && \
    chmod +x \
        ${ROCM_PATH}/bin/rocblas-bench \
        ${ROCM_PATH}/bin/hipblaslt-bench
# Runtime environment for SuperBench.
# All values in a single ENV instruction are expanded against the environment
# as it was before the instruction, so the order of the keys does not matter.
ENV SB_HOME=/opt/superbench \
    SB_MICRO_PATH=/opt/superbench \
    ANSIBLE_DEPRECATION_WARNINGS=FALSE \
    ANSIBLE_COLLECTIONS_PATH=/usr/share/ansible/collections \
    PATH="${MPI_HOME}/bin:${UCX_HOME}/bin:/opt/superbench/bin:/usr/local/bin/${PATH:+:${PATH}}" \
    LD_LIBRARY_PATH="${MPI_HOME}/lib:${UCX_HOME}/lib:/usr/lib/x86_64-linux-gnu/:/usr/local/lib/${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"

WORKDIR ${SB_HOME}

# Copy the third-party sources first so they can be built before the rest of
# the build context is copied in.
COPY third_party third_party
# Replace the default RCCL topology mapping with the DTK 26.04 one.
COPY dockerfile/etc/dtk26.04-topo-mapping.xml ${ROCM_PATH}/rccl/lib/topo_mapping_default.xml
# Build the "dtk" target of the third_party Makefile with the DTK and MPI
# locations passed as make variables.
# Each `-o <name>` is make's --old-file option: the named target is treated as
# already up to date, so it is not rebuilt as part of "dtk".
# The bind mount exposes the root of "hyhal" at /opt/hyhal for this step only.
# NOTE(review): "hyhal" is not defined in this file - presumably a named build
# context supplied on the build command line; confirm.
RUN --mount=type=bind,from=hyhal,source=/,target=/opt/hyhal \
    make -C third_party \
        RCCL_HOME=${ROCM_PATH}/rccl \
        ROCM_PATH=${ROCM_PATH} \
        HIP_HOME=${ROCM_PATH}/hip \
        MPI_HOME=${MPI_HOME} \
        dtk \
        -o cpu_hpl \
        -o cpu_stream \
        -o megatron_lm \
        -o apex_rocm \
        -o megatron_deepspeed \
        -o rocm_megatron_lm
# Copy the rest of the build context into the working directory.
COPY . .

# Package index used by the pip installs in this file; override with the
# SB_PIP_INDEX_URL build argument.
ARG SB_PIP_INDEX_URL=https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple

ENV USE_HIP_DATATYPE=1 \
    USE_HIPBLAS_COMPUTETYPE=1 \
    VIRTUAL_ENV=/opt/superbench-venv

# Put the virtual environment's bin directory first on PATH.
# This must be a separate ENV instruction: variables set in an ENV are only
# visible to later instructions, so ${VIRTUAL_ENV} would be empty if PATH were
# set in the instruction above.
# Only the venv directory is prepended; the MPI, UCX, superbench and
# /usr/local/bin entries are already on PATH from the earlier ENV, and
# repeating them here would duplicate every entry.
ENV PATH="${VIRTUAL_ENV}/bin:${PATH}"
# Remove every line mentioning NCCL_ from the system-wide bashrc, then
# regenerate /etc/environment with the build-time values of PATH,
# LD_LIBRARY_PATH, SB_MICRO_PATH and VIRTUAL_ENV (the file is overwritten).
RUN sed -i '/NCCL_/d' /etc/bash.bashrc && \
    { \
        echo PATH="$PATH" && \
        echo LD_LIBRARY_PATH="$LD_LIBRARY_PATH" && \
        echo SB_MICRO_PATH="$SB_MICRO_PATH" && \
        echo VIRTUAL_ENV="$VIRTUAL_ENV"; \
    } > /etc/environment
# Create the virtual environment (with access to the system site-packages),
# install the build prerequisites and SuperBench itself with the "hgworker"
# extra, then run the project's cppbuild and postinstall make targets.
# ${VIRTUAL_ENV}/bin is first on PATH, so once the venv exists the following
# `python3` invocations resolve to the venv interpreter.
# --no-cache-dir keeps pip's download/wheel cache out of the image layer.
# ".[hgworker]" is quoted because the brackets are a shell glob pattern and
# could otherwise expand to a matching dot-file in the working directory.
# The bind mount exposes the root of "hyhal" at /opt/hyhal for this step only.
# NOTE(review): "hyhal" is not defined in this file - presumably a named build
# context supplied on the build command line; confirm.
RUN --mount=type=bind,from=hyhal,source=/,target=/opt/hyhal \
    python3 -m venv --system-site-packages ${VIRTUAL_ENV} && \
    python3 -m pip install --no-cache-dir -i ${SB_PIP_INDEX_URL} --upgrade \
        pip wheel setuptools==65.7 mpi4py && \
    python3 -m pip install --no-cache-dir -i ${SB_PIP_INDEX_URL} --no-build-isolation \
        ".[hgworker]" && \
    make cppbuild && \
    make postinstall
dockerfile/dtk26.04.dockerfile
→
dockerfile/dtk26.04
-vllm0.11.0
.dockerfile
View file @
b015ceeb
ARG
BASE_IMAGE=harbor.sourcefind.cn:5443/dcu/admin/base/vllm:0.11.0-ubuntu22.04-dtk26.04-py3.1
0
ARG
BASE_IMAGE=harbor.sourcefind.cn:5443/dcu/admin/base/vllm:0.11.0-ubuntu22.04-dtk26.04-py3.1
1
FROM
${BASE_IMAGE}
FROM
${BASE_IMAGE}
#
OS
:
#
Included in the base image
:
# - Ubuntu: 22.04
# - Ubuntu: 22.04
# - Docker Client: 20.10.8
# - Python: 3.11
# DTK:
# - DTK: 26.04
# - DTK: 26.04
# Lib:
# - AMD SMI: 24.5.3+02cbffb.dirty
# - ucx: 1.20.0
# - Torch: 2.5.1+das.opt1.dtk2604
# - openmpi: 5.0.9
# - Torchvision: 0.20.1+das.opt1.dtk2604.torch251
# Intel:
# - vLLM: 0.11.0+das.opt1.dtk2604.torch251
# - mlc: v3.12
# - ONNX Runtime: 1.19.2+das.opt1.dtk2604.torch251
# - DeepSpeed: 0.15.4+das.opt1.dtk2604.torch251
# - Apex: 1.5.0+das.opt1.dtk2604.torch251
# - FlashAttention: 2.6.1+das.opt1.dtk2604.torch251
# - Transformer Engine: 2.7.0+das.opt1.dtk2604.torch251
# - Triton: 3.1.0+das.opt1.dtk2604.torch251
# Added or changed by this Dockerfile:
# - Docker client: 20.10.8
# - UCX: 1.20.0, built with DTK/ROCm support
# - Open MPI: 5.0.9, built with UCX and DTK/ROCm support
# - Intel MLC: v3.12
# - rocblas-bench and hipblaslt-bench command symlinks
# - RCCL topology mapping override for DTK
# - SSH and ulimit configuration
LABEL
maintainer="SuperBench"
LABEL
maintainer="SuperBench"
...
@@ -42,7 +54,7 @@ RUN apt-get update && \
...
@@ -42,7 +54,7 @@ RUN apt-get update && \
openssh-client
\
openssh-client
\
openssh-server
\
openssh-server
\
pciutils
\
pciutils
\
python3.1
0
-venv
\
python3.1
1
-venv
\
rsync
\
rsync
\
sudo
\
sudo
\
util-linux
\
util-linux
\
...
...
dockerfile/dtk26.04_docker18.dockerfile
View file @
b015ceeb
ARG
BASE_IMAGE=harbor.sourcefind.cn:5443/dcu/admin/base/vllm:0.11.0-ubuntu22.04-dtk26.04-py3.1
0
ARG
BASE_IMAGE=harbor.sourcefind.cn:5443/dcu/admin/base/vllm:0.11.0-ubuntu22.04-dtk26.04-py3.1
1
FROM
${BASE_IMAGE}
FROM
${BASE_IMAGE}
#
OS
:
#
Included in the base image
:
# - Ubuntu: 22.04
# - Ubuntu: 22.04
# - Docker Client: 20.10.8
# - Python: 3.11
# DTK:
# - DTK: 26.04
# - DTK: 26.04
# Lib:
# - AMD SMI: 24.5.3+02cbffb.dirty
# - ucx: 1.20.0
# - Torch: 2.5.1+das.opt1.dtk2604
# - openmpi: 5.0.9
# - Torchvision: 0.20.1+das.opt1.dtk2604.torch251
# Intel:
# - vLLM: 0.11.0+das.opt1.dtk2604.torch251
# - mlc: v3.12
# - ONNX Runtime: 1.19.2+das.opt1.dtk2604.torch251
# - DeepSpeed: 0.15.4+das.opt1.dtk2604.torch251
# - Apex: 1.5.0+das.opt1.dtk2604.torch251
# - FlashAttention: 2.6.1+das.opt1.dtk2604.torch251
# - Transformer Engine: 2.7.0+das.opt1.dtk2604.torch251
# - Triton: 3.1.0+das.opt1.dtk2604.torch251
# Added or changed by this Dockerfile:
# - Docker client: 20.10.8
# - UCX: 1.20.0, built with DTK/ROCm support
# - Open MPI: 5.0.9, built with UCX and DTK/ROCm support
# - Intel MLC: v3.12
# - rocblas-bench and hipblaslt-bench command symlinks
# - RCCL topology mapping override for DTK
# - SSH and ulimit configuration
LABEL
maintainer="SuperBench"
LABEL
maintainer="SuperBench"
...
@@ -42,7 +54,7 @@ RUN apt-get update && \
...
@@ -42,7 +54,7 @@ RUN apt-get update && \
openssh-client
\
openssh-client
\
openssh-server
\
openssh-server
\
pciutils
\
pciutils
\
python3.1
0
-venv
\
python3.1
1
-venv
\
rsync
\
rsync
\
sudo
\
sudo
\
util-linux
\
util-linux
\
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment