model.go 8.4 KB
Newer Older
Michael Yang's avatar
Michael Yang committed
1
2
3
4
5
6
package server

import (
	"archive/zip"
	"bytes"
	"context"
Michael Yang's avatar
tools  
Michael Yang committed
7
	"encoding/json"
Michael Yang's avatar
Michael Yang committed
8
9
10
	"errors"
	"fmt"
	"io"
11
	"log/slog"
Michael Yang's avatar
Michael Yang committed
12
13
14
	"net/http"
	"os"
	"path/filepath"
Michael Yang's avatar
tools  
Michael Yang committed
15
16
17
	"slices"
	"strings"
	"text/template/parse"
Michael Yang's avatar
Michael Yang committed
18

Michael Yang's avatar
tools  
Michael Yang committed
19
	"github.com/google/uuid"
Michael Yang's avatar
Michael Yang committed
20
21
22
	"github.com/ollama/ollama/api"
	"github.com/ollama/ollama/convert"
	"github.com/ollama/ollama/llm"
Michael Yang's avatar
Michael Yang committed
23
	"github.com/ollama/ollama/template"
Michael Yang's avatar
Michael Yang committed
24
25
26
	"github.com/ollama/ollama/types/model"
)

Michael Yang's avatar
Michael Yang committed
27
// intermediateBlobs maps the digest handed to parseFromZipFile to the digest
// of the model layer that was produced by converting that archive.
var intermediateBlobs = make(map[string]string)
28

29
type layerGGML struct {
Michael Yang's avatar
Michael Yang committed
30
31
32
33
	*Layer
	*llm.GGML
}

34
func parseFromModel(ctx context.Context, name model.Name, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
35
	m, err := ParseNamedManifest(name)
Michael Yang's avatar
Michael Yang committed
36
37
	switch {
	case errors.Is(err, os.ErrNotExist):
Michael Yang's avatar
Michael Yang committed
38
		if err := PullModel(ctx, name.String(), &registryOptions{}, fn); err != nil {
Michael Yang's avatar
Michael Yang committed
39
40
41
			return nil, err
		}

42
		m, err = ParseNamedManifest(name)
Michael Yang's avatar
Michael Yang committed
43
44
45
		if err != nil {
			return nil, err
		}
Michael Yang's avatar
Michael Yang committed
46
47
48
49
	case err != nil:
		return nil, err
	}

50
51
	for _, layer := range m.Layers {
		layer, err := NewLayerFromLayer(layer.Digest, layer.MediaType, name.DisplayShortest())
Michael Yang's avatar
Michael Yang committed
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
		if err != nil {
			return nil, err
		}

		switch layer.MediaType {
		case "application/vnd.ollama.image.model",
			"application/vnd.ollama.image.projector",
			"application/vnd.ollama.image.adapter":
			blobpath, err := GetBlobsPath(layer.Digest)
			if err != nil {
				return nil, err
			}

			blob, err := os.Open(blobpath)
			if err != nil {
				return nil, err
			}
			defer blob.Close()

71
			ggml, _, err := llm.DecodeGGML(blob, 0)
Michael Yang's avatar
Michael Yang committed
72
73
74
			if err != nil {
				return nil, err
			}
Michael Yang's avatar
Michael Yang committed
75

76
			layers = append(layers, &layerGGML{layer, ggml})
Michael Yang's avatar
Michael Yang committed
77
		default:
78
			layers = append(layers, &layerGGML{layer, nil})
Michael Yang's avatar
Michael Yang committed
79
80
81
82
83
84
		}
	}

	return layers, nil
}

85
func extractFromZipFile(p string, file *os.File, fn func(api.ProgressResponse)) error {
Michael Yang's avatar
Michael Yang committed
86
87
	stat, err := file.Stat()
	if err != nil {
88
		return err
Michael Yang's avatar
Michael Yang committed
89
90
91
92
	}

	r, err := zip.NewReader(file, stat.Size())
	if err != nil {
93
		return err
Michael Yang's avatar
Michael Yang committed
94
95
96
97
	}

	fn(api.ProgressResponse{Status: "unpacking model metadata"})
	for _, f := range r.File {
Michael Yang's avatar
Michael Yang committed
98
99
		if !filepath.IsLocal(f.Name) {
			return fmt.Errorf("%w: %s", zip.ErrInsecurePath, f.Name)
100
101
		}

Michael Yang's avatar
Michael Yang committed
102
		n := filepath.Join(p, f.Name)
103
104
105
106
		if err := os.MkdirAll(filepath.Dir(n), 0o750); err != nil {
			return err
		}

Michael Yang's avatar
Michael Yang committed
107
		// TODO(mxyng): this should not write out all files to disk
108
		outfile, err := os.Create(n)
Michael Yang's avatar
Michael Yang committed
109
		if err != nil {
110
			return err
Michael Yang's avatar
Michael Yang committed
111
		}
Michael Yang's avatar
Michael Yang committed
112
		defer outfile.Close()
Michael Yang's avatar
Michael Yang committed
113
114
115

		infile, err := f.Open()
		if err != nil {
116
			return err
Michael Yang's avatar
Michael Yang committed
117
		}
Michael Yang's avatar
Michael Yang committed
118
		defer infile.Close()
Michael Yang's avatar
Michael Yang committed
119
120

		if _, err = io.Copy(outfile, infile); err != nil {
121
			return err
Michael Yang's avatar
Michael Yang committed
122
123
124
		}

		if err := outfile.Close(); err != nil {
125
			return err
Michael Yang's avatar
Michael Yang committed
126
127
128
		}

		if err := infile.Close(); err != nil {
129
			return err
Michael Yang's avatar
Michael Yang committed
130
131
132
		}
	}

133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
	return nil
}

func parseFromZipFile(_ context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
	tempDir, err := os.MkdirTemp(filepath.Dir(file.Name()), "")
	if err != nil {
		return nil, err
	}
	defer os.RemoveAll(tempDir)

	if err := extractFromZipFile(tempDir, file, fn); err != nil {
		return nil, err
	}

	mf, err := convert.GetModelFormat(tempDir)
Michael Yang's avatar
Michael Yang committed
148
149
150
151
	if err != nil {
		return nil, err
	}

152
	params, err := mf.GetParams(tempDir)
Michael Yang's avatar
Michael Yang committed
153
154
155
156
	if err != nil {
		return nil, err
	}

157
	mArch, err := mf.GetModelArch("", tempDir, params)
Michael Yang's avatar
Michael Yang committed
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
	if err != nil {
		return nil, err
	}

	fn(api.ProgressResponse{Status: "processing tensors"})
	if err := mArch.GetTensors(); err != nil {
		return nil, err
	}

	if err := mArch.LoadVocab(); err != nil {
		return nil, err
	}

	fn(api.ProgressResponse{Status: "converting model"})

	// TODO(mxyng): this should write directly into a layer
	// e.g. NewLayer(arch.Reader(), "application/vnd.ollama.image.model")
175
	temp, err := os.CreateTemp(tempDir, "fp16")
Michael Yang's avatar
Michael Yang committed
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
	if err != nil {
		return nil, err
	}
	defer temp.Close()
	defer os.Remove(temp.Name())

	if err = mArch.WriteGGUF(temp); err != nil {
		return nil, err
	}

	if _, err := temp.Seek(0, io.SeekStart); err != nil {
		return nil, err
	}

	layer, err := NewLayer(temp, "application/vnd.ollama.image.model")
	if err != nil {
Michael Yang's avatar
Michael Yang committed
192
		return nil, err
Michael Yang's avatar
Michael Yang committed
193
194
	}

195
	bin, err := layer.Open()
Michael Yang's avatar
Michael Yang committed
196
197
198
199
200
	if err != nil {
		return nil, err
	}
	defer bin.Close()

201
	ggml, _, err := llm.DecodeGGML(bin, 0)
Michael Yang's avatar
Michael Yang committed
202
203
204
205
	if err != nil {
		return nil, err
	}

206
	layers = append(layers, &layerGGML{layer, ggml})
207

Michael Yang's avatar
Michael Yang committed
208
	intermediateBlobs[digest] = layer.Digest
209
	return detectChatTemplate(layers)
Michael Yang's avatar
Michael Yang committed
210
211
}

212
func parseFromFile(ctx context.Context, file *os.File, digest string, fn func(api.ProgressResponse)) (layers []*layerGGML, err error) {
Michael Yang's avatar
Michael Yang committed
213
214
215
216
217
218
219
220
221
222
	sr := io.NewSectionReader(file, 0, 512)
	contentType, err := detectContentType(sr)
	if err != nil {
		return nil, err
	}

	switch contentType {
	case "gguf", "ggla":
		// noop
	case "application/zip":
223
		return parseFromZipFile(ctx, file, digest, fn)
Michael Yang's avatar
Michael Yang committed
224
225
226
227
228
229
230
231
232
233
234
	default:
		return nil, fmt.Errorf("unsupported content type: %s", contentType)
	}

	stat, err := file.Stat()
	if err != nil {
		return nil, err
	}

	var offset int64
	for offset < stat.Size() {
235
		ggml, n, err := llm.DecodeGGML(file, 0)
Michael Yang's avatar
Michael Yang committed
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
		if errors.Is(err, io.EOF) {
			break
		} else if err != nil {
			return nil, err
		}

		mediatype := "application/vnd.ollama.image.model"
		if ggml.Name() == "ggla" {
			mediatype = "application/vnd.ollama.image.adapter"
		} else if ggml.KV().Architecture() == "clip" {
			mediatype = "application/vnd.ollama.image.projector"
		}

		layer, err := NewLayer(io.NewSectionReader(file, offset, n), mediatype)
		if err != nil {
			return nil, err
		}

254
		layers = append(layers, &layerGGML{layer, ggml})
Michael Yang's avatar
Michael Yang committed
255
256
257
		offset = n
	}

258
259
260
261
262
263
	return detectChatTemplate(layers)
}

func detectChatTemplate(layers []*layerGGML) ([]*layerGGML, error) {
	for _, layer := range layers {
		if s := layer.GGML.KV().ChatTemplate(); s != "" {
Michael Yang's avatar
Michael Yang committed
264
			if t, err := template.Named(s); err != nil {
265
266
267
268
269
270
271
272
273
274
275
276
277
				slog.Debug("template detection", "error", err)
			} else {
				tmpl, err := NewLayer(t.Reader(), "application/vnd.ollama.image.template")
				if err != nil {
					return nil, err
				}

				tmpl.status = fmt.Sprintf("using autodetected template %s", t.Name)
				layers = append(layers, &layerGGML{tmpl, nil})
			}
		}
	}

Michael Yang's avatar
Michael Yang committed
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
	return layers, nil
}

func detectContentType(r io.Reader) (string, error) {
	var b bytes.Buffer
	if _, err := io.Copy(&b, r); err != nil {
		return "", err
	}

	if contentType := llm.DetectGGMLType(b.Bytes()); contentType != "" {
		return contentType, nil
	}

	if contentType := http.DetectContentType(b.Bytes()); contentType != "application/octet-stream" {
		return contentType, nil
	}

	return "unknown", nil
}
Michael Yang's avatar
tools  
Michael Yang committed
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396

// parseToolCalls attempts to parse a JSON string into a slice of ToolCalls.
// mxyng: this only really works if the input contains tool calls in some JSON format
//
// The JSON keys that hold the function name and arguments are discovered by
// executing the part of the model's template that ranges over .ToolCalls with
// placeholder values. The second result is false when the template has no such
// part, when either key cannot be identified, or when s yields no tool call.
// Decoded objects whose name is not a string or whose arguments are not an
// object are skipped.
func (m *Model) parseToolCalls(s string) ([]api.ToolCall, bool) {
	// create a subtree from the node that ranges over .ToolCalls
	tmpl := m.Template.Subtree(func(n parse.Node) bool {
		if t, ok := n.(*parse.RangeNode); ok {
			return slices.Contains(template.Identifiers(t.Pipe), "ToolCalls")
		}

		return false
	})

	if tmpl == nil {
		return nil, false
	}

	// execute the subtree with placeholders to identify the keys
	var b bytes.Buffer
	if err := tmpl.Execute(&b, map[string][]map[string]any{
		"ToolCalls": {
			{
				"Function": map[string]any{
					"Name":      "@@name@@",
					"Arguments": "@@arguments@@",
				},
			},
		},
	}); err != nil {
		return nil, false
	}

	var kv map[string]string
	if err := json.Unmarshal(b.Bytes(), &kv); err != nil {
		return nil, false
	}

	// find the keys that correspond to the name and arguments fields
	var name, arguments string
	for k, v := range kv {
		switch v {
		case "@@name@@":
			name = k
		case "@@arguments@@":
			arguments = k
		}
	}

	// without both keys there is no way to tell a tool call from any other
	// JSON object in the input
	if name == "" || arguments == "" {
		return nil, false
	}

	var sm []map[string]any
	decoder := json.NewDecoder(strings.NewReader(s))
	for {
		// incrementally decode the JSON into a list of JSON objects
		// skipping over any invalid tokens
		if err := decoder.Decode(&sm); err != nil {
			if errors.Is(err, io.EOF) {
				break
			}

			if errors.As(err, new(*json.SyntaxError)) {
				r := decoder.Buffered()
				if _, err := r.Read(make([]byte, decoder.InputOffset()+1)); err != nil {
					break
				}

				decoder = json.NewDecoder(r)
				continue
			}

			return nil, false
		}

		// break as soon as a valid object is decoded
		break
	}

	var toolCalls []api.ToolCall
	for _, obj := range sm {
		// s is model output, so the field types cannot be trusted; use
		// checked assertions rather than panicking on unexpected JSON
		fnName, ok := obj[name].(string)
		if !ok {
			continue
		}

		fnArgs, ok := obj[arguments].(map[string]any)
		if !ok {
			continue
		}

		call := api.ToolCall{
			ID:   uuid.New().String(),
			Type: "function",
		}
		call.Function.Name = fnName
		call.Function.Arguments = fnArgs

		toolCalls = append(toolCalls, call)
	}

	if len(toolCalls) > 0 {
		return toolCalls, true
	}

	return nil, false
}