Dockerfile 3.01 KB
Newer Older
Timothy J. Baek's avatar
Timothy J. Baek committed
1
2
# syntax=docker/dockerfile:1

3
FROM node:alpine as build
4

Timothy J. Baek's avatar
Timothy J. Baek committed
5
6
WORKDIR /app

Timothy J. Baek's avatar
Timothy J. Baek committed
7
# wget embedding model weight from alpine (does not exist from slim-buster)
Xiaodong Ye's avatar
Xiaodong Ye committed
8
9
RUN wget "https://chroma-onnx-models.s3.amazonaws.com/all-MiniLM-L6-v2/onnx.tar.gz" -O - | \
    tar -xzf - -C /app
Timothy J. Baek's avatar
Timothy J. Baek committed
10

Xiaodong Ye's avatar
Xiaodong Ye committed
11
COPY package.json package-lock.json ./
12
RUN npm ci
13

14
15
COPY . .
RUN npm run build
Timothy J. Baek's avatar
Timothy J. Baek committed
16

Timothy J. Baek's avatar
Timothy J. Baek committed
17

Timothy J. Baek's avatar
Timothy J. Baek committed
18
FROM python:3.11-slim-bookworm as base
Timothy J. Baek's avatar
Timothy J. Baek committed
19
20

ENV ENV=prod
21
ENV PORT ""
Timothy J. Baek's avatar
Timothy J. Baek committed
22
23

ENV OLLAMA_API_BASE_URL "/ollama/api"
Timothy J. Baek's avatar
Timothy J. Baek committed
24
25
26
27

ENV OPENAI_API_BASE_URL ""
ENV OPENAI_API_KEY ""

28
ENV WEBUI_SECRET_KEY ""
Timothy J. Baek's avatar
Timothy J. Baek committed
29

30
31
32
ENV SCARF_NO_ANALYTICS true
ENV DO_NOT_TRACK true

33
######## Preloaded models ########
34
# whisper TTS Settings
35
ENV WHISPER_MODEL="base"
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
36
ENV WHISPER_MODEL_DIR="/app/backend/data/cache/whisper/models"
37

38
# RAG Embedding Model Settings
39
40
# any sentence transformer model; models to use can be found at https://huggingface.co/models?library=sentence-transformers
# Leaderboard: https://huggingface.co/spaces/mteb/leaderboard 
41
# for better persormance and multilangauge support use "intfloat/multilingual-e5-large" (~2.5GB) or "intfloat/multilingual-e5-base" (~1.5GB)
42
# IMPORTANT: If you change the default model (all-MiniLM-L6-v2) and vice versa, you aren't able to use RAG Chat with your previous documents loaded in the WebUI! You need to re-embed them.
43
ENV RAG_EMBEDDING_MODEL="all-MiniLM-L6-v2"
44
45
# device type for whisper tts and ebbeding models - "cpu" (default), "cuda" (nvidia gpu and CUDA required) or "mps" (apple silicon) - choosing this right can lead to better performance
ENV RAG_EMBEDDING_MODEL_DEVICE_TYPE="cpu"
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
46
47
48
ENV RAG_EMBEDDING_MODEL_DIR="/app/backend/data/cache/embedding/models"
ENV SENTENCE_TRANSFORMERS_HOME $RAG_EMBEDDING_MODEL_DIR

49
######## Preloaded models ########
50

Timothy J. Baek's avatar
Timothy J. Baek committed
51
52
WORKDIR /app/backend

53
# install python dependencies
Timothy J. Baek's avatar
Timothy J. Baek committed
54
COPY ./backend/requirements.txt ./requirements.txt
Timothy J. Baek's avatar
Timothy J. Baek committed
55

Ismael's avatar
Ismael committed
56
57
RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu --no-cache-dir
RUN pip3 install -r requirements.txt --no-cache-dir
58

TriantaTV's avatar
TriantaTV committed
59
# Install pandoc and netcat
Timothy J. Baek's avatar
Timothy J. Baek committed
60
61
# RUN python -c "import pypandoc; pypandoc.download_pandoc()"
RUN apt-get update \
TriantaTV's avatar
TriantaTV committed
62
    && apt-get install -y pandoc netcat-openbsd \
Timothy J. Baek's avatar
Timothy J. Baek committed
63
64
    && rm -rf /var/lib/apt/lists/*

65
# preload embedding model
66
RUN python -c "import os; from chromadb.utils import embedding_functions; sentence_transformer_ef = embedding_functions.SentenceTransformerEmbeddingFunction(model_name=os.environ['RAG_EMBEDDING_MODEL'], device=os.environ['RAG_EMBEDDING_MODEL_DEVICE_TYPE'])"
67
# preload tts model
68
RUN python -c "import os; from faster_whisper import WhisperModel; WhisperModel(os.environ['WHISPER_MODEL'], device='auto', compute_type='int8', download_root=os.environ['WHISPER_MODEL_DIR'])"
69

70
71
# copy embedding weight from build
RUN mkdir -p /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2
Xiaodong Ye's avatar
Xiaodong Ye committed
72
COPY --from=build /app/onnx /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2/onnx
73
74
75

# copy built frontend files
COPY --from=build /app/build /app/build
76
77
COPY --from=build /app/CHANGELOG.md /app/CHANGELOG.md
COPY --from=build /app/package.json /app/package.json
78
79

# copy backend files
Timothy J. Baek's avatar
Timothy J. Baek committed
80
81
COPY ./backend .

82
CMD [ "bash", "start.sh"]