Dockerfile 3.14 KB
Newer Older
Timothy J. Baek's avatar
Timothy J. Baek committed
1
2
# syntax=docker/dockerfile:1

3
FROM node:alpine as build
4

Timothy J. Baek's avatar
Timothy J. Baek committed
5
6
WORKDIR /app

Timothy J. Baek's avatar
Timothy J. Baek committed
7
# wget embedding model weight from alpine (does not exist from slim-buster)
Xiaodong Ye's avatar
Xiaodong Ye committed
8
9
RUN wget "https://chroma-onnx-models.s3.amazonaws.com/all-MiniLM-L6-v2/onnx.tar.gz" -O - | \
    tar -xzf - -C /app
Timothy J. Baek's avatar
Timothy J. Baek committed
10

Xiaodong Ye's avatar
Xiaodong Ye committed
11
COPY package.json package-lock.json ./
12
RUN npm ci
13

14
15
COPY . .
RUN npm run build
Timothy J. Baek's avatar
Timothy J. Baek committed
16

Timothy J. Baek's avatar
Timothy J. Baek committed
17

Timothy J. Baek's avatar
Timothy J. Baek committed
18
FROM python:3.11-slim-bookworm as base
Timothy J. Baek's avatar
Timothy J. Baek committed
19
20

ENV ENV=prod
21
ENV PORT ""
Timothy J. Baek's avatar
Timothy J. Baek committed
22

23
ENV OLLAMA_BASE_URL "/ollama"
Timothy J. Baek's avatar
Timothy J. Baek committed
24
25
26
27

ENV OPENAI_API_BASE_URL ""
ENV OPENAI_API_KEY ""

28
ENV WEBUI_SECRET_KEY ""
Timothy J. Baek's avatar
Timothy J. Baek committed
29

30
31
32
ENV SCARF_NO_ANALYTICS true
ENV DO_NOT_TRACK true

33
34
35
ENV MANIFEST_NAME "Open WebUI"
ENV MANIFEST_SHORT_NAME "Open WebUI"

36
######## Preloaded models ########
37
# whisper TTS Settings
38
ENV WHISPER_MODEL="base"
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
39
ENV WHISPER_MODEL_DIR="/app/backend/data/cache/whisper/models"
40

41
# RAG Embedding Model Settings
42
43
# any sentence transformer model; models to use can be found at https://huggingface.co/models?library=sentence-transformers
# Leaderboard: https://huggingface.co/spaces/mteb/leaderboard 
44
# for better persormance and multilangauge support use "intfloat/multilingual-e5-large" (~2.5GB) or "intfloat/multilingual-e5-base" (~1.5GB)
45
# IMPORTANT: If you change the default model (all-MiniLM-L6-v2) and vice versa, you aren't able to use RAG Chat with your previous documents loaded in the WebUI! You need to re-embed them.
46
ENV RAG_EMBEDDING_MODEL="all-MiniLM-L6-v2"
pandego's avatar
pandego committed
47
# device type for whisper tts and embbeding models - "cpu" (default), "cuda" (nvidia gpu and CUDA required) or "mps" (apple silicon) - choosing this right can lead to better performance
48
ENV RAG_EMBEDDING_MODEL_DEVICE_TYPE="cpu"
Timothy J. Baek's avatar
refac  
Timothy J. Baek committed
49
50
51
ENV RAG_EMBEDDING_MODEL_DIR="/app/backend/data/cache/embedding/models"
ENV SENTENCE_TRANSFORMERS_HOME $RAG_EMBEDDING_MODEL_DIR

52
######## Preloaded models ########
53

Timothy J. Baek's avatar
Timothy J. Baek committed
54
55
WORKDIR /app/backend

56
# install python dependencies
Timothy J. Baek's avatar
Timothy J. Baek committed
57
COPY ./backend/requirements.txt ./requirements.txt
Timothy J. Baek's avatar
Timothy J. Baek committed
58

Timothy J. Baek's avatar
Timothy J. Baek committed
59
60
RUN apt-get update && apt-get install ffmpeg libsm6 libxext6  -y

Ismael's avatar
Ismael committed
61
62
RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu --no-cache-dir
RUN pip3 install -r requirements.txt --no-cache-dir
63

TriantaTV's avatar
TriantaTV committed
64
# Install pandoc and netcat
Timothy J. Baek's avatar
Timothy J. Baek committed
65
66
# RUN python -c "import pypandoc; pypandoc.download_pandoc()"
RUN apt-get update \
TriantaTV's avatar
TriantaTV committed
67
    && apt-get install -y pandoc netcat-openbsd \
Timothy J. Baek's avatar
Timothy J. Baek committed
68
69
    && rm -rf /var/lib/apt/lists/*

70
# preload embedding model
71
RUN python -c "import os; from chromadb.utils import embedding_functions; sentence_transformer_ef = embedding_functions.SentenceTransformerEmbeddingFunction(model_name=os.environ['RAG_EMBEDDING_MODEL'], device=os.environ['RAG_EMBEDDING_MODEL_DEVICE_TYPE'])"
72
# preload tts model
73
RUN python -c "import os; from faster_whisper import WhisperModel; WhisperModel(os.environ['WHISPER_MODEL'], device='auto', compute_type='int8', download_root=os.environ['WHISPER_MODEL_DIR'])"
74

75
76
# copy embedding weight from build
RUN mkdir -p /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2
Xiaodong Ye's avatar
Xiaodong Ye committed
77
COPY --from=build /app/onnx /root/.cache/chroma/onnx_models/all-MiniLM-L6-v2/onnx
78
79
80

# copy built frontend files
COPY --from=build /app/build /app/build
81
82
COPY --from=build /app/CHANGELOG.md /app/CHANGELOG.md
COPY --from=build /app/package.json /app/package.json
83
84

# copy backend files
Timothy J. Baek's avatar
Timothy J. Baek committed
85
86
COPY ./backend .

pandego's avatar
pandego committed
87
CMD [ "bash", "start.sh"]