# StatefulSet for the Ollama server.
# The `ollama-volume` claim declared under volumeClaimTemplates is mounted
# into the container at /root/.ollama.
apiVersion: apps/v1
kind: StatefulSet
metadata:
  name: {{ include "ollama.name" . }}
  labels:
    {{- include "ollama.labels" . | nindent 4 }}
spec:
  # Rendered from the same helper as metadata.name.
  serviceName: {{ include "ollama.name" . }}
  # Left unquoted on purpose: the API expects an integer here.
  replicas: {{ .Values.ollama.replicaCount }}
  selector:
    matchLabels:
      {{- include "ollama.selectorLabels" . | nindent 6 }}
  template:
    metadata:
      labels:
        {{- include "ollama.selectorLabels" . | nindent 8 }}
    spec:
      containers:
      - name: {{ include "ollama.name" . }}
        # Quoted so an image reference is always parsed as a string.
        image: {{ .Values.ollama.image | quote }}
        ports:
        # Left unquoted on purpose: containerPort must be an integer.
        - containerPort: {{ .Values.ollama.servicePort }}
        {{- if .Values.ollama.gpu.enabled }}
        # GPU-only environment: puts the NVIDIA/CUDA directories on PATH and
        # the library search path. The whole `env` key is omitted when GPU
        # support is disabled so no bare (null) `env:` is rendered.
        env:
        - name: PATH
          value: /usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
        - name: LD_LIBRARY_PATH
          value: /usr/local/nvidia/lib:/usr/local/nvidia/lib64
        - name: NVIDIA_DRIVER_CAPABILITIES
          value: compute,utility
        {{- end }}
        {{- with .Values.ollama.resources }}
        resources:
          {{- toYaml . | nindent 10 }}
        {{- end }}
        volumeMounts:
        - name: ollama-volume
          mountPath: /root/.ollama
        tty: true
      {{- with .Values.ollama.nodeSelector }}
      nodeSelector:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      {{- if .Values.ollama.gpu.enabled }}
      # Tolerate the nvidia.com/gpu NoSchedule taint. The `tolerations` key is
      # only rendered together with its single GPU entry.
      tolerations:
      - key: nvidia.com/gpu
        operator: Exists
        effect: NoSchedule
      {{- end }}
  volumeClaimTemplates:
  - metadata:
      name: ollama-volume
    spec:
      accessModes:
      - ReadWriteOnce
      resources:
        requests:
          # Quoted so the quantity (e.g. a value with a unit suffix) is
          # always parsed as a string.
          storage: {{ .Values.ollama.volumeSize | quote }}