# ollama-statefulset.yaml
# StatefulSet for the "ollama" container; storage is requested per replica
# through volumeClaimTemplates further down in this manifest.
apiVersion: apps/v1
kind: StatefulSet
metadata:
  # Resource name comes from the chart's "ollama.name" named template
  # (defined elsewhere in the chart).
  name: {{ include "ollama.name" . }}
spec:
  # Governing Service for the StatefulSet; uses the same "ollama.name" value
  # as the StatefulSet itself.
  serviceName: {{ include "ollama.name" . }}
  # Desired pod count, taken from values.
  replicas: {{ .Values.ollama.replicaCount }}
  # The selector must match the pod template labels below.
  selector:
    matchLabels:
      app: ollama
  template:
    metadata:
      labels:
        app: ollama
    spec:
      containers:
      - name: ollama
        # Quoted so an empty or unusual image value still renders as a string
        # instead of null or another YAML type.
        image: {{ .Values.ollama.image | quote }}
        ports:
        - containerPort: {{ .Values.ollama.servicePort }}
        {{- if .Values.ollama.gpu.enabled }}
        # GPU-only environment. The env key is emitted only when GPU support is
        # enabled, so a non-GPU render does not contain a bare, null "env:".
        env:
          # Put the NVIDIA driver and CUDA binary directories first on PATH.
          - name: PATH
            value: /usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
          # Library search path for the NVIDIA driver libraries.
          - name: LD_LIBRARY_PATH
            value: /usr/local/nvidia/lib:/usr/local/nvidia/lib64
          # NOTE(review): presumably consumed by the NVIDIA container runtime
          # to select which driver capabilities are exposed; confirm.
          - name: NVIDIA_DRIVER_CAPABILITIES
            value: compute,utility
        {{- end }}
        {{- with .Values.ollama.resources }}
        # Container resources, copied verbatim from values when set.
        resources:
          {{- toYaml . | nindent 10 }}
        {{- end }}
        # Mount the per-pod claim named "ollama-volume" (declared under
        # volumeClaimTemplates) into the container.
        # NOTE(review): /root/.ollama is presumably Ollama's data directory; confirm.
        volumeMounts:
        - name: ollama-volume
          mountPath: /root/.ollama
        # Allocate a TTY for the container.
        tty: true
      {{- with .Values.ollama.nodeSelector }}
      # Optional node selector, copied verbatim from values when set.
      nodeSelector:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      {{- if .Values.ollama.gpu.enabled }}
      # Tolerate the nvidia.com/gpu NoSchedule taint when GPU support is on.
      # The whole key is guarded so a non-GPU render does not emit a bare,
      # null "tolerations:".
      tolerations:
        - key: nvidia.com/gpu
          operator: Exists
          effect: NoSchedule
      {{- end }}
  # One PersistentVolumeClaim per replica; the claim name matches the
  # "ollama-volume" volumeMount on the container.
  volumeClaimTemplates:
  - metadata:
      name: ollama-volume
    spec:
      accessModes:
        - ReadWriteOnce
      resources:
        requests:
          # Quoted so the quantity always renders as a string, even when the
          # value is a bare number.
          storage: {{ .Values.ollama.volumeSize | quote }}