{{- /*
StatefulSet that runs the Ollama container.

Values read by this template (all under .Values.ollama):
  replicaCount            number of pod replicas
  image.repository/.tag   container image reference
  image.pullPolicy        image pull policy
  service.containerPort   port exposed by the container under the name "http"
  gpu.enabled             when true, adds the NVIDIA-related environment variables
  resources               optional container resources block, copied verbatim
  nodeSelector            optional pod nodeSelector, copied verbatim
  tolerations             optional pod tolerations, copied verbatim
  persistence.size        requested size of the per-pod volume claim

Named templates used: ollama.name, ollama.labels, ollama.selectorLabels
(defined outside this file).
*/ -}}
apiVersion: apps/v1
kind: StatefulSet
metadata:
  name: {{ include "ollama.name" . }}
  labels:
    {{- include "ollama.labels" . | nindent 4 }}
spec:
  # Governing Service for the StatefulSet; a Service with this name is
  # expected to be defined elsewhere in the chart.
  serviceName: {{ include "ollama.name" . }}
  replicas: {{ .Values.ollama.replicaCount }}
  selector:
    matchLabels:
      {{- include "ollama.selectorLabels" . | nindent 6 }}
  template:
    metadata:
      labels:
        {{- include "ollama.labels" . | nindent 8 }}
    spec:
      containers:
      - name: {{ include "ollama.name" . }}
        # Image fields are rendered only when .Values.ollama.image is set.
        # The reference is quoted so it is always parsed as a string.
        {{- with .Values.ollama.image }}
        image: "{{ .repository }}:{{ .tag }}"
        imagePullPolicy: {{ .pullPolicy }}
        {{- end }}
        ports:
        - name: http
          containerPort: {{ .Values.ollama.service.containerPort }}
        # The env key is emitted only together with its entries, so the
        # manifest never contains a bare (null) "env:" when GPU is disabled.
        {{- if .Values.ollama.gpu.enabled }}
        env:
        # Put the NVIDIA/CUDA directories ahead of the standard search paths.
        - name: PATH
          value: /usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
        - name: LD_LIBRARY_PATH
          value: /usr/local/nvidia/lib:/usr/local/nvidia/lib64
        - name: NVIDIA_DRIVER_CAPABILITIES
          value: compute,utility
        {{- end }}
        {{- with .Values.ollama.resources }}
        resources:
          {{- toYaml . | nindent 10 }}
        {{- end }}
        volumeMounts:
        # Mounts the per-pod claim declared in volumeClaimTemplates below.
        - name: ollama-volume
          mountPath: /root/.ollama
        tty: true
      {{- with .Values.ollama.nodeSelector }}
      nodeSelector:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      {{- with .Values.ollama.tolerations }}
      tolerations:
        {{- toYaml . | nindent 8 }}
      {{- end }}
  # One PersistentVolumeClaim per replica; the name must match the
  # volumeMounts entry of the container above.
  volumeClaimTemplates:
  - metadata:
      name: ollama-volume
    spec:
      accessModes: [ "ReadWriteOnce" ]
      resources:
        requests:
          storage: {{ .Values.ollama.persistence.size | quote }}