# Dockerfile.neuron
# default base image
ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.1.2-neuronx-py310-sdk2.20.0-ubuntu20.04"

FROM $BASE_IMAGE

# An ARG declared before FROM is only in scope for the FROM line itself.
# Redeclare it (without a value) so this stage inherits the default above;
# otherwise the echo below prints an empty string.
ARG BASE_IMAGE
RUN echo "Base image is $BASE_IMAGE"

# Install some basic utilities
# - DEBIAN_FRONTEND is set inline so it applies to this step only and is not
#   baked into the runtime environment.
# - The apt package lists are removed in the same layer that created them so
#   they do not add to the image size.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y \
        ffmpeg \
        git \
        libgl1 \
        libsm6 \
        libxext6 \
        python3 \
        python3-pip && \
    rm -rf /var/lib/apt/lists/*

### Mount Point ###
# When launching the container, mount the code directory to /app
ARG APP_MOUNT=/app
# The JSON-array form of VOLUME requires a double-quoted string. An unquoted
# `[ ${APP_MOUNT} ]` is not valid JSON, so it is parsed as the
# whitespace-separated form and declares "[" and "]" as volumes as well.
VOLUME ["${APP_MOUNT}"]
WORKDIR ${APP_MOUNT}

# Python dependencies. --no-cache-dir is passed on every install so pip's
# download cache is not stored in the image layers.
RUN python3 -m pip install --no-cache-dir --upgrade pip
RUN python3 -m pip install --no-cache-dir fastapi ninja tokenizers pandas
RUN python3 -m pip install --no-cache-dir -U sentencepiece transformers==4.36.2
RUN python3 -m pip install --no-cache-dir -U transformers-neuronx \
        --extra-index-url=https://pip.repos.neuron.amazonaws.com
# The specifier is quoted so the shell can never glob-expand the trailing "*".
RUN python3 -m pip install --no-cache-dir -U --pre 'neuronx-cc==2.15.*' \
        --extra-index-url=https://pip.repos.neuron.amazonaws.com

# Copy the build context (the vLLM source tree) into the image.
COPY . /app/vllm

# Install the build tooling and the Neuron requirements from the copied tree.
# Version specifiers containing ">" must be quoted: unquoted, the shell treats
# `cmake>=3.26` as "cmake" with stdout redirected to a file named "=3.26",
# which drops the version constraint and hides pip's output.
RUN cd /app/vllm \
    && python3 -m pip install --no-cache-dir -U \
        'cmake>=3.26' ninja packaging 'setuptools-scm>=8' wheel jinja2 \
        -r requirements-neuron.txt

# Set the target device to "neuron"; ENV also persists into the running
# container. Uses key=value form, since the space-separated form is deprecated.
ENV VLLM_TARGET_DEVICE=neuron
# Editable install of the source tree copied to /app/vllm.
# The build context's .git directory is bind-mounted for this step only.
# A relative mount target is resolved against WORKDIR (/app), which would put
# it at /app/.git, so the target is given as an absolute path inside the
# source tree instead.
# NOTE(review): presumably .git is needed for setuptools-scm version
# detection - confirm.
RUN --mount=type=bind,source=.git,target=/app/vllm/.git \
    cd /app/vllm \
    && pip install --no-build-isolation -v -e .

# Default command: start a bash shell (exec form, so bash is run directly
# rather than through `/bin/sh -c`).
CMD ["/bin/bash"]