Merge pull request #897 from open-webui/main

dev

Merge pull request #897 from open-webui/main
dev
437d7ff6 · Timothy Jaeryang Baek · GitHub · 02f364bf · 81eceb48 · 437d7ff6
Unverified commit 437d7ff6, authored Feb 24, 2024 by Timothy Jaeryang Baek; committed by GitHub on Feb 24, 2024
20 changed files
--- a/kubernetes/helm/values-minikube.yaml
+++ b/kubernetes/helm/values-minikube.yaml
+ollama:
+  resources:
+    requests:
+      cpu: "2000m"
+      memory: "2Gi"
+    limits:
+      cpu: "4000m"
+      memory: "4Gi"
+      nvidia.com/gpu: "0"
+  service:
+    type: ClusterIP
+  gpu:
+    enabled: false
+webui:
+  resources:
+    requests:
+      cpu: "500m"
+      memory: "500Mi"
+    limits:
+      cpu: "1000m"
+      memory: "1Gi"
+  ingress:
+    enabled: true
+    host: open-webui.minikube.local
+  service:
+    type: NodePort
--- a/kubernetes/helm/values.yaml
+++ b/kubernetes/helm/values.yaml
-namespace: ollama-namespace
+nameOverride: ""
 ollama:
+  annotations: {}
+  podAnnotations: {}
  replicaCount: 1
-  image: ollama/ollama:latest
+  image:
-  servicePort: 11434
+    repository: ollama/ollama
-  resources:
+    tag: latest
-    limits:
+    pullPolicy: Always
-      cpu: "2000m"
+  resources: {}
-      memory: "2Gi"
+  persistence:
-      nvidia.com/gpu: "0"
+    enabled: true
-  volumeSize: 1Gi
+    size: 30Gi
+    existingClaim: ""
+    accessModes:
+    - ReadWriteOnce
+    storageClass: ""
+    selector: {}
+    annotations: {}
  nodeSelector: {}
-  tolerations: []
+  # -- If using a special runtime container such as nvidia, set it here.
+  runtimeClassName: ""
+  tolerations:
+  - key: nvidia.com/gpu
+    operator: Exists
+    effect: NoSchedule
  service:
    type: ClusterIP
+    annotations: {}
+    port: 80
+    containerPort: 11434
  gpu:
+    # -- Enable additional ENV values to help Ollama discover GPU usage
    enabled: false
 webui:
+  annotations: {}
+  podAnnotations: {}
  replicaCount: 1
-  image: ghcr.io/ollama-webui/ollama-webui:main
+  image:
-  servicePort: 8080
+    repository: ghcr.io/open-webui/open-webui
-  resources:
+    tag: ""
-    limits:
+    pullPolicy: Always
-      cpu: "500m"
+  resources: {}
-      memory: "500Mi"
  ingress:
-    enabled: true
+    enabled: false
-    annotations:
+    class: ""
-    # Use appropriate annotations for your Ingress controller, e.g., for NGINX:
+    # -- Use appropriate annotations for your Ingress controller, e.g., for NGINX:
    # nginx.ingress.kubernetes.io/rewrite-target: /
-    host: ollama.minikube.local
+    annotations: {}
-  volumeSize: 1Gi
+    host: ""
+    tls: false
+    existingSecret: ""
+  persistence:
+    enabled: true
+    size: 2Gi
+    existingClaim: ""
+    # -- If using multiple replicas, you must update accessModes to ReadWriteMany
+    accessModes:
+    - ReadWriteOnce
+    storageClass: ""
+    selector: {}
+    annotations: {}
  nodeSelector: {}
  tolerations: []
  service:
-    type: NodePort
+    type: ClusterIP
\ No newline at end of file
+    annotations: {}
+    port: 80
+    containerPort: 8080
+    nodePort: ""
--- a/kubernetes/manifest/base/ollama-service.yaml
+++ b/kubernetes/manifest/base/ollama-service.yaml
@@ -2,7 +2,7 @@ apiVersion: v1
 kind: Service
 metadata:
  name: ollama-service
-  namespace: ollama-namespace
+  namespace: open-webui
 spec:
  selector:
    app: ollama

--- a/kubernetes/manifest/base/ollama-statefulset.yaml
+++ b/kubernetes/manifest/base/ollama-statefulset.yaml
@@ -2,7 +2,7 @@ apiVersion: apps/v1
 kind: StatefulSet
 metadata:
  name: ollama
-  namespace: ollama-namespace
+  namespace: open-webui
 spec:
  serviceName: "ollama"
  replicas: 1
@@ -20,9 +20,13 @@ spec:
        ports:
        - containerPort: 11434
        resources:
-          limits:
+          requests:
            cpu: "2000m"
            memory: "2Gi"
+          limits:
+            cpu: "4000m"
+            memory: "4Gi"
+            nvidia.com/gpu: "0"
        volumeMounts:
        - name: ollama-volume
          mountPath: /root/.ollama
@@ -34,4 +38,4 @@ spec:
      accessModes: [ "ReadWriteOnce" ]
      resources:
        requests:
-          storage: 1Gi
+          storage: 30Gi
\ No newline at end of file
--- a/kubernetes/manifest/base/ollama-namespace.yaml
+++ b/kubernetes/manifest/base/ollama-namespace.yaml
 apiVersion: v1
 kind: Namespace
 metadata:
-  name: ollama-namespace
+  name: open-webui
\ No newline at end of file
--- a/kubernetes/manifest/base/webui-deployment.yaml
+++ b/kubernetes/manifest/base/webui-deployment.yaml
 apiVersion: apps/v1
 kind: Deployment
 metadata:
-  name: ollama-webui-deployment
+  name: open-webui-deployment
-  namespace: ollama-namespace
+  namespace: open-webui
 spec:
  replicas: 1
  selector:
    matchLabels:
-      app: ollama-webui
+      app: open-webui
  template:
    metadata:
      labels:
-        app: ollama-webui
+        app: open-webui
    spec:
      containers:
-      - name: ollama-webui
+      - name: open-webui
-        image: ghcr.io/ollama-webui/ollama-webui:main
+        image: ghcr.io/open-webui/open-webui:main
        ports:
        - containerPort: 8080
        resources:
-          limits:
+          requests:
            cpu: "500m"
            memory: "500Mi"
+          limits:
+            cpu: "1000m"
+            memory: "1Gi"
        env:
        - name: OLLAMA_API_BASE_URL
-          value: "http://ollama-service.ollama-namespace.svc.cluster.local:11434/api"
+          value: "http://ollama-service.open-webui.svc.cluster.local:11434/api"
        tty: true
+        volumeMounts:
+        - name: webui-volume
+          mountPath: /app/backend/data
+      volumes:
+      - name: webui-volume
+        persistentVolumeClaim:
+          claimName: ollama-webui-pvc
\ No newline at end of file
--- a/kubernetes/manifest/base/webui-ingress.yaml
+++ b/kubernetes/manifest/base/webui-ingress.yaml
--- a/kubernetes/manifest/base/webui-pvc.yaml
+++ b/kubernetes/manifest/base/webui-pvc.yaml
--- a/kubernetes/manifest/base/webui-service.yaml
+++ b/kubernetes/manifest/base/webui-service.yaml
--- a/kubernetes/manifest/kustomization.yaml
+++ b/kubernetes/manifest/kustomization.yaml
 resources:
- base/ollama-namespace.yaml
+- base/open-webui.yaml
 - base/ollama-service.yaml
 - base/ollama-statefulset.yaml
 - base/webui-deployment.yaml
 - base/webui-service.yaml
 - base/webui-ingress.yaml
+- base/webui-pvc.yaml
 apiVersion: kustomize.config.k8s.io/v1beta1
 kind: Kustomization

--- a/kubernetes/manifest/patches/ollama-statefulset-gpu.yaml
+++ b/kubernetes/manifest/patches/ollama-statefulset-gpu.yaml
--- a/package-lock.json
+++ b/package-lock.json
--- a/package.json
+++ b/package.json
--- a/run-compose.sh
+++ b/run-compose.sh
--- a/run-ollama-docker.sh
+++ b/run-ollama-docker.sh
--- a/run.sh
+++ b/run.sh
--- a/src/app.css
+++ b/src/app.css
--- a/src/lib/apis/audio/index.ts
+++ b/src/lib/apis/audio/index.ts
--- a/src/lib/apis/auths/index.ts
+++ b/src/lib/apis/auths/index.ts
--- a/src/lib/apis/chats/index.ts
+++ b/src/lib/apis/chats/index.ts