model.go 6.24 KB
Newer Older
Michael Yang's avatar
Michael Yang committed
1
2
3
4
5
6
7
8
9
package server

import (
	"archive/zip"
	"bytes"
	"context"
	"errors"
	"fmt"
	"io"
10
	"log/slog"
Michael Yang's avatar
Michael Yang committed
11
12
13
	"net/http"
	"os"
	"path/filepath"
14
	"strings"
Michael Yang's avatar
Michael Yang committed
15
16
17
18

	"github.com/ollama/ollama/api"
	"github.com/ollama/ollama/convert"
	"github.com/ollama/ollama/llm"
Michael Yang's avatar
Michael Yang committed
19
	"github.com/ollama/ollama/template"
Michael Yang's avatar
Michael Yang committed
20
21
22
	"github.com/ollama/ollama/types/model"
)

Michael Yang's avatar
Michael Yang committed
23
var intermediateBlobs map[string]string = make(map[string]string)
24

25
type layerGGML struct {
Michael Yang's avatar
Michael Yang committed
26
27
28
29
	*Layer
	*llm.GGML
}

30
func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
31
	m, err := ParseNamedManifest(name)
Michael Yang's avatar
Michael Yang committed
32
33
	switch {
	case errors.Is(err, os.ErrNotExist):
Michael Yang's avatar
Michael Yang committed
34
		if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
Michael Yang's avatar
Michael Yang committed
35
36
37
			return nil, err
		}

38
		m, err = ParseNamedManifest(name)
Michael Yang's avatar
Michael Yang committed
39
40
41
		if err != nil {
			return nil, err
		}
Michael Yang's avatar
Michael Yang committed
42
43
44
45
	case err != nil:
		return nil, err
	}

46
47
	for _, layer := range m.Layers {
		layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, name.DisplayShortest())
Michael Yang's avatar
Michael Yang committed
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
		if err != nil {
			return nil, err
		}

		switch layer.MediaType {
		case "application/vnd.ollama.image.model",
			"application/vnd.ollama.image.projector",
			"application/vnd.ollama.image.adapter":
			blobpath, err := GetBlobsPath(layer.Digest)
			if err != nil {
				return nil, err
			}

			blob, err := os.Open(blobpath)
			if err != nil {
				return nil, err
			}
			defer blob.Close()

67
			ggml, _, err := llm.DecodeGGML(blob, 0)
Michael Yang's avatar
Michael Yang committed
68
69
70
			if err != nil {
				return nil, err
			}
Michael Yang's avatar
Michael Yang committed
71

72
			layers = append(layers, &layerGGML{layer, ggml})
Michael Yang's avatar
Michael Yang committed
73
		default:
74
			layers = append(layers, &layerGGML{layer, nil})
Michael Yang's avatar
Michael Yang committed
75
76
77
78
79
80
		}
	}

	return layers, nil
}

81
func extractFromZipFile(p string, file *os.File, fn func(api.ProgressResponse)) error {
Michael Yang's avatar
Michael Yang committed
82
83
	stat, err := file.Stat()
	if err != nil {
84
		return err
Michael Yang's avatar
Michael Yang committed
85
86
87
88
	}

	r, err := zip.NewReader(file, stat.Size())
	if err != nil {
89
		return err
Michael Yang's avatar
Michael Yang committed
90
91
92
93
	}

	fn(api.ProgressResponse{Status: "unpacking model metadata"})
	for _, f := range r.File {
94
95
96
97
98
99
100
101
102
103
		n := filepath.Join(p, f.Name)
		if !strings.HasPrefix(n, p) {
			slog.Warn("skipped extracting file outside of context", "name", f.Name)
			continue
		}

		if err := os.MkdirAll(filepath.Dir(n), 0o750); err != nil {
			return err
		}

Michael Yang's avatar
Michael Yang committed
104
		// TODO(mxyng): this should not write out all files to disk
105
		outfile, err := os.Create(n)
Michael Yang's avatar
Michael Yang committed
106
		if err != nil {
107
			return err
Michael Yang's avatar
Michael Yang committed
108
		}
Michael Yang's avatar
Michael Yang committed
109
		defer outfile.Close()
Michael Yang's avatar
Michael Yang committed
110
111
112

		infile, err := f.Open()
		if err != nil {
113
			return err
Michael Yang's avatar
Michael Yang committed
114
		}
Michael Yang's avatar
Michael Yang committed
115
		defer infile.Close()
Michael Yang's avatar
Michael Yang committed
116
117

		if _, err = io.Copy(outfile, infile); err != nil {
118
			return err
Michael Yang's avatar
Michael Yang committed
119
120
121
		}

		if err := outfile.Close(); err != nil {
122
			return err
Michael Yang's avatar
Michael Yang committed
123
124
125
		}

		if err := infile.Close(); err != nil {
126
			return err
Michael Yang's avatar
Michael Yang committed
127
128
129
		}
	}

130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
	return nil
}

func parseFromZipFile(_ context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
	tempDir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
	if err != nil {
		return nil, err
	}
	defer os.RemoveAll(tempDir)

	if err := extractFromZipFile(tempDir, file, fn); err != nil {
		return nil, err
	}

	mf, err := convert.GetModelFormat(tempDir)
Michael Yang's avatar
Michael Yang committed
145
146
147
148
	if err != nil {
		return nil, err
	}

149
	params, err := mf.GetParams(tempDir)
Michael Yang's avatar
Michael Yang committed
150
151
152
153
	if err != nil {
		return nil, err
	}

154
	mArch, err := mf.GetModelArch("", tempDir, params)
Michael Yang's avatar
Michael Yang committed
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
	if err != nil {
		return nil, err
	}

	fn(api.ProgressResponse{Status: "processing tensors"})
	if err := mArch.GetTensors(); err != nil {
		return nil, err
	}

	if err := mArch.LoadVocab(); err != nil {
		return nil, err
	}

	fn(api.ProgressResponse{Status: "converting model"})

	// TODO(mxyng): this should write directly into a layer
	// e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
172
	temp, err := os.CreateTemp(tempDir, "fp16")
Michael Yang's avatar
Michael Yang committed
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
	if err != nil {
		return nil, err
	}
	defer temp.Close()
	defer os.Remove(temp.Name())

	if err = mArch.WriteGGUF(temp); err != nil {
		return nil, err
	}

	if _, err := temp.Seek(0, io.SeekStart); err != nil {
		return nil, err
	}

	layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
	if err != nil {
Michael Yang's avatar
Michael Yang committed
189
		return nil, err
Michael Yang's avatar
Michael Yang committed
190
191
	}

192
	bin, err := layer.Open()
Michael Yang's avatar
Michael Yang committed
193
194
195
196
197
	if err != nil {
		return nil, err
	}
	defer bin.Close()

198
	ggml, _, err := llm.DecodeGGML(bin, 0)
Michael Yang's avatar
Michael Yang committed
199
200
201
202
	if err != nil {
		return nil, err
	}

203
	layers = append(layers, &layerGGML{layer, ggml})
204

Michael Yang's avatar
Michael Yang committed
205
	intermediateBlobs[digest] = layer.Digest
206
	return detectChatTemplate(layers)
Michael Yang's avatar
Michael Yang committed
207
208
}

209
func parseFromFile(ctx context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
Michael Yang's avatar
Michael Yang committed
210
211
212
213
214
215
216
217
218
219
	sr := io.NewSectionReader(file, 0, 512)
	contentType, err := detectContentType(sr)
	if err != nil {
		return nil, err
	}

	switch contentType {
	case "gguf", "ggla":
		// noop
	case "application/zip":
220
		return parseFromZipFile(ctx, file, digest, fn)
Michael Yang's avatar
Michael Yang committed
221
222
223
224
225
226
227
228
229
230
231
	default:
		return nil, fmt.Errorf("unsupported content type: %s", contentType)
	}

	stat, err := file.Stat()
	if err != nil {
		return nil, err
	}

	var offset int64
	for offset < stat.Size() {
232
		ggml, n, err := llm.DecodeGGML(file, 0)
Michael Yang's avatar
Michael Yang committed
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
		if errors.Is(err, io.EOF) {
			break
		} else if err != nil {
			return nil, err
		}

		mediatype := "application/vnd.ollama.image.model"
		if ggml.Name() == "ggla" {
			mediatype = "application/vnd.ollama.image.adapter"
		} else if ggml.KV().Architecture() == "clip" {
			mediatype = "application/vnd.ollama.image.projector"
		}

		layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
		if err != nil {
			return nil, err
		}

251
		layers = append(layers, &layerGGML{layer, ggml})
Michael Yang's avatar
Michael Yang committed
252
253
254
		offset = n
	}

255
256
257
258
259
260
	return detectChatTemplate(layers)
}

func detectChatTemplate(layers []*layerGGML) ([]*layerGGML, error) {
	for _, layer := range layers {
		if s := layer.GGML.KV().ChatTemplate(); s != "" {
Michael Yang's avatar
Michael Yang committed
261
			if t, err := template.Named(s); err != nil {
262
263
264
265
266
267
268
269
270
271
272
273
274
				slog.Debug("template detection", "error", err)
			} else {
				tmpl, err := NewLayer(t.Reader(), "application/vnd.ollama.image.template")
				if err != nil {
					return nil, err
				}

				tmpl.status = fmt.Sprintf("using autodetected template %s", t.Name)
				layers = append(layers, &layerGGML{tmpl, nil})
			}
		}
	}

Michael Yang's avatar
Michael Yang committed
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
	return layers, nil
}

func detectContentType(r io.Reader) (string, error) {
	var b bytes.Buffer
	if _, err := io.Copy(&b, r); err != nil {
		return "", err
	}

	if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
		return contentType, nil
	}

	if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
		return contentType, nil
	}

	return "unknown", nil
}