Dockerfile 1.21 KB
Newer Older
1
2
# Base image: hpcaitech/cuda-conda at tag 11.3. Later steps in this file call
# conda, pip, git and apt-get, so the base is presumably expected to provide
# them (not verified here).
FROM hpcaitech/cuda-conda:11.3

3
4
5
6
7
# metainformation
# Image metadata using the OCI pre-defined annotation keys.
# Each pair is written as key="value" with no whitespace around "=": with
# spaces, Docker falls back to the legacy "LABEL key value" form and the stored
# value starts with a stray "=".
# - licenses is given as an SPDX identifier.
# - base.name names the image used in FROM; the "library/" namespace is only
#   for Docker official images, so it is not part of this reference.
LABEL org.opencontainers.image.source="https://github.com/hpcaitech/ColossalAI" \
      org.opencontainers.image.licenses="Apache-2.0" \
      org.opencontainers.image.base.name="docker.io/hpcaitech/cuda-conda:11.3"

8
# install torch
# Installs pinned PyTorch, torchvision and torchaudio builds together with
# cudatoolkit 11.3 from the "pytorch" conda channel.
# --yes: there is no terminal during `docker build` to answer conda's
# confirmation prompt, so the install must not depend on one.
# `conda clean` runs in the same layer so downloaded package archives and index
# caches are not stored in the image.
RUN conda install --yes -c pytorch \
        pytorch==1.12.1 \
        torchvision==0.13.1 \
        torchaudio==0.12.1 \
        cudatoolkit=11.3 && \
    conda clean --all --yes
10

11
12
13
# install ninja
# The package index is refreshed in the same layer as the install, so the
# install never runs against a missing or stale index. The index files are
# removed afterwards so they do not add to the layer size.
RUN apt-get update && \
    apt-get install -y --no-install-recommends ninja-build && \
    rm -rf /var/lib/apt/lists/*

14
15
16
# install apex
# Clones NVIDIA apex, checks out commit 91fcaa and installs it from source,
# passing the build flags --cpp_ext, --cuda_ext and --fast_layer_norm to the
# build (one --global-option per flag).
# `packaging` is installed first; presumably the apex build needs it — confirm.
# Every pip call uses --no-cache-dir so no pip download cache is written into
# the layer.
RUN git clone https://github.com/NVIDIA/apex && \
    cd apex && \
    git checkout 91fcaa && \
    pip install --no-cache-dir packaging && \
    pip install -v --disable-pip-version-check --no-cache-dir \
        --global-option="--cpp_ext" \
        --global-option="--cuda_ext" \
        --global-option="--fast_layer_norm" \
        ./
Frank Lee's avatar
Frank Lee committed
20
21

# install colossalai
# VERSION is the git ref handed to `git clone --branch`; override it at build
# time with `--build-arg VERSION=<ref>`.
# NOTE(review): the default "1" must exist as a branch or tag in the upstream
# repository for the clone to succeed — confirm.
# CUDA_EXT=1 is set only for the pip invocation that installs the checkout.
ARG VERSION=1
RUN git clone --branch ${VERSION} https://github.com/hpcaitech/ColossalAI.git && \
    cd ColossalAI && \
    CUDA_EXT=1 pip install --verbose --no-cache-dir .
26
27

# Install the titans package with pip, without keeping pip's download cache.
RUN pip install titans --no-cache-dir
29
30
31
32
33
34

# install tensornvme
# Installs cmake with conda, then clones TensorNVMe, installs its
# requirements.txt and installs the package itself from the checkout.
# cmake is presumably needed by the TensorNVMe build — confirm.
# --yes: there is no terminal during `docker build` to answer conda's
# confirmation prompt.
# Both pip calls use --no-cache-dir so no pip download cache is written into
# the layer.
RUN conda install --yes cmake && \
    git clone https://github.com/hpcaitech/TensorNVMe.git && \
    cd TensorNVMe && \
    pip install --no-cache-dir -r requirements.txt && \
    pip install -v --no-cache-dir .