Dockerfile 2.86 KB
Newer Older
Timothy J. Baek's avatar
Timothy J. Baek committed
1
2
# syntax=docker/dockerfile:1

3
FROM node:alpine as build
4

Timothy J. Baek's avatar
Timothy J. Baek committed
5
6
WORKDIR /app

Timothy J. Baek's avatar
Timothy J. Baek committed
7
# wget embedding model weight from alpine (does not exist from slim-buster)
Xiaodong Ye's avatar
Xiaodong Ye committed
8
9
RUN wget "https://chroma-onnx-models.s3.amazonaws.com/all-MiniLM-L6-v2/onnx.tar.gz" -O - | \
    tar -xzf - -C /app
Timothy J. Baek's avatar
Timothy J. Baek committed
10

Xiaodong Ye's avatar
Xiaodong Ye committed
11
COPY package.json package-lock.json ./
12
RUN npm ci
13

14
15
COPY . .
RUN npm run build
Timothy J. Baek's avatar
Timothy J. Baek committed
16

Timothy J. Baek's avatar
Timothy J. Baek committed
17

Timothy J. Baek's avatar
Timothy J. Baek committed
18
FROM python:3.11-slim-bookworm as base
Timothy J. Baek's avatar
Timothy J. Baek committed
19
20

ENV ENV=prod
21
ENV PORT ""
Timothy J. Baek's avatar
Timothy J. Baek committed
22
23

ENV OLLAMA_API_BASE_URL "/ollama/api"
Timothy J. Baek's avatar
Timothy J. Baek committed
24
25
26
27

ENV OPENAI_API_BASE_URL ""
ENV OPENAI_API_KEY ""

28
ENV WEBUI_SECRET_KEY ""
Timothy J. Baek's avatar
Timothy J. Baek committed
29

30
31
32
ENV SCARF_NO_ANALYTICS true
ENV DO_NOT_TRACK true

33
######## Preloaded models ########
34
# whisper TTS Settings
35
ENV WHISPER_MODEL="base"
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
36
ENV WHISPER_MODEL_DIR="/app/backend/data/cache/whisper/models"
37

38
# RAG Embedding Model Settings
39
40
# any sentence transformer model; models to use can be found at https://huggingface.co/models?library=sentence-transformers
# Leaderboard: https://huggingface.co/spaces/mteb/leaderboard 
41
# for better persormance and multilangauge support use "intfloat/multilingual-e5-large" (~2.5GB) or "intfloat/multilingual-e5-base" (~1.5GB)
42
# IMPORTANT: If you change the default model (all-MiniLM-L6-v2) and vice versa, you aren't able to use RAG Chat with your previous documents loaded in the WebUI! You need to re-embed them.
43
ENV RAG_EMBEDDING_MODEL="all-MiniLM-L6-v2"
44
45
46
47
ENV SENTENCE_TRANSFORMERS_HOME="/app/backend/data/cache/embedding/models"
# device type for whisper tts and ebbeding models - "cpu" (default), "cuda" (nvidia gpu and CUDA required) or "mps" (apple silicon) - choosing this right can lead to better performance
ENV RAG_EMBEDDING_MODEL_DEVICE_TYPE="cpu"
######## Preloaded models ########
48

Timothy J. Baek's avatar
Timothy J. Baek committed
49
50
WORKDIR /app/backend

51
# install python dependencies
Timothy J. Baek's avatar
Timothy J. Baek committed
52
COPY ./backend/requirements.txt ./requirements.txt
Timothy J. Baek's avatar
Timothy J. Baek committed
53

Ismael's avatar
Ismael committed
54
55
RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu --no-cache-dir
RUN pip3 install -r requirements.txt --no-cache-dir
56

TriantaTV's avatar
TriantaTV committed
57
# Install pandoc and netcat
Timothy J. Baek's avatar
Timothy J. Baek committed
58
59
# RUN python -c "import pypandoc; pypandoc.download_pandoc()"
RUN apt-get update \
TriantaTV's avatar
TriantaTV committed
60
    && apt-get install -y pandoc netcat-openbsd \
Timothy J. Baek's avatar
Timothy J. Baek committed
61
62
    && rm -rf /var/lib/apt/lists/*

63
# preload embedding model
64
RUN python -c "import os; from chromadb.utils import embedding_functions; sentence_transformer_ef = embedding_functions.SentenceTransformerEmbeddingFunction(model_name=os.environ['RAG_EMBEDDING_MODEL'], device=os.environ['RAG_EMBEDDING_MODEL_DEVICE_TYPE'])"
65
# preload tts model
66
RUN python -c "import os; from faster_whisper import WhisperModel; WhisperModel(os.environ['WHISPER_MODEL'], device='auto', compute_type='int8', download_root=os.environ['WHISPER_MODEL_DIR'])"
67

Timothy J. Baek's avatar
Timothy J. Baek committed
68

69
70
# copy embedding weight from build
RUN mkdir -p /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2
Xiaodong Ye's avatar
Xiaodong Ye committed
71
COPY --from=build /app/onnx /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2/onnx
72
73
74
75
76

# copy built frontend files
COPY --from=build /app/build /app/build

# copy backend files
Timothy J. Baek's avatar
Timothy J. Baek committed
77
78
COPY ./backend .

79
CMD [ "bash", "start.sh"]