client.go 10.1 KB
Newer Older
1
2
3
4
5
6
// Package api implements the client-side API for code wishing to interact
// with the ollama service. The methods of the [Client] type correspond to
// the ollama REST API as described in https://github.com/ollama/ollama/blob/main/docs/api.md
//
// The ollama command-line client itself uses this package to interact with
// the backend service.
Jeffrey Morgan's avatar
Jeffrey Morgan committed
7
8
9
package api

import (
Jeffrey Morgan's avatar
Jeffrey Morgan committed
10
	"bufio"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
11
12
13
	"bytes"
	"context"
	"encoding/json"
14
	"fmt"
Patrick Devine's avatar
Patrick Devine committed
15
	"io"
Michael Yang's avatar
Michael Yang committed
16
	"net"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
17
	"net/http"
Michael Yang's avatar
Michael Yang committed
18
	"net/url"
19
	"os"
Michael Yang's avatar
Michael Yang committed
20
	"runtime"
21
	"strconv"
22
	"strings"
Michael Yang's avatar
Michael Yang committed
23

24
25
	"github.com/ollama/ollama/format"
	"github.com/ollama/ollama/version"
26
27
)

28
29
// Client encapsulates client state for interacting with the ollama
// service. Use [ClientFromEnvironment] to create new Clients.
Patrick Devine's avatar
Patrick Devine committed
30
type Client struct {
Michael Yang's avatar
Michael Yang committed
31
	base *url.URL
Michael Yang's avatar
Michael Yang committed
32
	http *http.Client
Michael Yang's avatar
Michael Yang committed
33
34
}

Patrick Devine's avatar
Patrick Devine committed
35
func checkError(resp *http.Response, body []byte) error {
Michael Yang's avatar
Michael Yang committed
36
	if resp.StatusCode < http.StatusBadRequest {
Patrick Devine's avatar
Patrick Devine committed
37
		return nil
Michael Yang's avatar
Michael Yang committed
38
39
	}

Patrick Devine's avatar
Patrick Devine committed
40
	apiError := StatusError{StatusCode: resp.StatusCode}
Michael Yang's avatar
Michael Yang committed
41

Patrick Devine's avatar
Patrick Devine committed
42
43
44
	err := json.Unmarshal(body, &apiError)
	if err != nil {
		// Use the full body as the message if we fail to decode a response.
45
		apiError.ErrorMessage = string(body)
Patrick Devine's avatar
Patrick Devine committed
46
47
48
	}

	return apiError
Michael Yang's avatar
Michael Yang committed
49
50
}

51
52
53
54
55
56
57
58
59
// ClientFromEnvironment creates a new [Client] using configuration from the
// environment variable OLLAMA_HOST, which points to the network host and
// port on which the ollama service is listenting. The format of this variable
// is:
//
//	<scheme>://<host>:<port>
//
// If the variable is not specified, a default ollama host and port will be
// used.
Michael Yang's avatar
Michael Yang committed
60
func ClientFromEnvironment() (*Client, error) {
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
	ollamaHost, err := GetOllamaHost()
	if err != nil {
		return nil, err
	}

	return &Client{
		base: &url.URL{
			Scheme: ollamaHost.Scheme,
			Host:   net.JoinHostPort(ollamaHost.Host, ollamaHost.Port),
		},
		http: http.DefaultClient,
	}, nil
}

type OllamaHost struct {
	Scheme string
	Host   string
	Port   string
}

func GetOllamaHost() (OllamaHost, error) {
Michael Yang's avatar
Michael Yang committed
82
83
	defaultPort := "11434"

84
85
86
87
	hostVar := os.Getenv("OLLAMA_HOST")
	hostVar = strings.TrimSpace(strings.Trim(strings.TrimSpace(hostVar), "\"'"))

	scheme, hostport, ok := strings.Cut(hostVar, "://")
Michael Yang's avatar
Michael Yang committed
88
89
	switch {
	case !ok:
90
		scheme, hostport = "http", hostVar
Michael Yang's avatar
Michael Yang committed
91
92
93
94
	case scheme == "http":
		defaultPort = "80"
	case scheme == "https":
		defaultPort = "443"
Michael Yang's avatar
Michael Yang committed
95
96
	}

Michael Yang's avatar
Michael Yang committed
97
98
99
	// trim trailing slashes
	hostport = strings.TrimRight(hostport, "/")

Michael Yang's avatar
Michael Yang committed
100
101
	host, port, err := net.SplitHostPort(hostport)
	if err != nil {
Michael Yang's avatar
Michael Yang committed
102
		host, port = "127.0.0.1", defaultPort
Michael Yang's avatar
Michael Yang committed
103
		if ip := net.ParseIP(strings.Trim(hostport, "[]")); ip != nil {
Michael Yang's avatar
Michael Yang committed
104
			host = ip.String()
Michael Yang's avatar
Michael Yang committed
105
106
		} else if hostport != "" {
			host = hostport
Michael Yang's avatar
Michael Yang committed
107
108
109
		}
	}

110
111
112
113
114
115
116
117
	if portNum, err := strconv.ParseInt(port, 10, 32); err != nil || portNum > 65535 || portNum < 0 {
		return OllamaHost{}, ErrInvalidHostPort
	}

	return OllamaHost{
		Scheme: scheme,
		Host:   host,
		Port:   port,
Michael Yang's avatar
Michael Yang committed
118
	}, nil
Patrick Devine's avatar
Patrick Devine committed
119
120
}

Daniel Hiltgen's avatar
Daniel Hiltgen committed
121
122
123
124
125
126
127
func NewClient(base *url.URL, http *http.Client) *Client {
	return &Client{
		base: base,
		http: http,
	}
}

Patrick Devine's avatar
Patrick Devine committed
128
129
130
131
func (c *Client) do(ctx context.Context, method, path string, reqData, respData any) error {
	var reqBody io.Reader
	var data []byte
	var err error
Michael Yang's avatar
Michael Yang committed
132
133
134
135
136
137
138
139

	switch reqData := reqData.(type) {
	case io.Reader:
		// reqData is already an io.Reader
		reqBody = reqData
	case nil:
		// noop
	default:
Patrick Devine's avatar
Patrick Devine committed
140
141
142
143
		data, err = json.Marshal(reqData)
		if err != nil {
			return err
		}
Michael Yang's avatar
Michael Yang committed
144

Patrick Devine's avatar
Patrick Devine committed
145
146
147
		reqBody = bytes.NewReader(data)
	}

Michael Yang's avatar
Michael Yang committed
148
	requestURL := c.base.JoinPath(path)
Michael Yang's avatar
Michael Yang committed
149
	request, err := http.NewRequestWithContext(ctx, method, requestURL.String(), reqBody)
Patrick Devine's avatar
Patrick Devine committed
150
151
152
153
	if err != nil {
		return err
	}

Michael Yang's avatar
Michael Yang committed
154
155
156
	request.Header.Set("Content-Type", "application/json")
	request.Header.Set("Accept", "application/json")
	request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
Patrick Devine's avatar
Patrick Devine committed
157

Michael Yang's avatar
Michael Yang committed
158
	respObj, err := c.http.Do(request)
Patrick Devine's avatar
Patrick Devine committed
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
	if err != nil {
		return err
	}
	defer respObj.Body.Close()

	respBody, err := io.ReadAll(respObj.Body)
	if err != nil {
		return err
	}

	if err := checkError(respObj, respBody); err != nil {
		return err
	}

	if len(respBody) > 0 && respData != nil {
		if err := json.Unmarshal(respBody, respData); err != nil {
			return err
		}
	}
	return nil
Jeffrey Morgan's avatar
Jeffrey Morgan committed
179
180
}

Michael Yang's avatar
Michael Yang committed
181
const maxBufferSize = 512 * format.KiloByte
182

Michael Yang's avatar
Michael Yang committed
183
func (c *Client) stream(ctx context.Context, method, path string, data any, fn func([]byte) error) error {
184
185
186
187
188
189
	var buf *bytes.Buffer
	if data != nil {
		bts, err := json.Marshal(data)
		if err != nil {
			return err
		}
Michael Yang's avatar
Michael Yang committed
190

191
		buf = bytes.NewBuffer(bts)
Jeffrey Morgan's avatar
Jeffrey Morgan committed
192
193
	}

Michael Yang's avatar
Michael Yang committed
194
	requestURL := c.base.JoinPath(path)
Michael Yang's avatar
Michael Yang committed
195
	request, err := http.NewRequestWithContext(ctx, method, requestURL.String(), buf)
Jeffrey Morgan's avatar
Jeffrey Morgan committed
196
197
198
199
	if err != nil {
		return err
	}

Michael Yang's avatar
Michael Yang committed
200
	request.Header.Set("Content-Type", "application/json")
201
	request.Header.Set("Accept", "application/x-ndjson")
Michael Yang's avatar
Michael Yang committed
202
	request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
Jeffrey Morgan's avatar
Jeffrey Morgan committed
203

Michael Yang's avatar
Michael Yang committed
204
	response, err := c.http.Do(request)
Jeffrey Morgan's avatar
Jeffrey Morgan committed
205
206
207
	if err != nil {
		return err
	}
Michael Yang's avatar
Michael Yang committed
208
	defer response.Body.Close()
Jeffrey Morgan's avatar
Jeffrey Morgan committed
209

210
	scanner := bufio.NewScanner(response.Body)
211
212
213
	// increase the buffer size to avoid running out of space
	scanBuf := make([]byte, 0, maxBufferSize)
	scanner.Buffer(scanBuf, maxBufferSize)
214
215
	for scanner.Scan() {
		var errorResponse struct {
Michael Yang's avatar
Michael Yang committed
216
			Error string `json:"error,omitempty"`
217
218
219
220
221
222
223
		}

		bts := scanner.Bytes()
		if err := json.Unmarshal(bts, &errorResponse); err != nil {
			return fmt.Errorf("unmarshal: %w", err)
		}

Michael Yang's avatar
Michael Yang committed
224
		if errorResponse.Error != "" {
225
			return fmt.Errorf(errorResponse.Error)
Michael Yang's avatar
Michael Yang committed
226
227
		}

Michael Yang's avatar
Michael Yang committed
228
		if response.StatusCode >= http.StatusBadRequest {
Michael Yang's avatar
Michael Yang committed
229
			return StatusError{
230
231
232
				StatusCode:   response.StatusCode,
				Status:       response.Status,
				ErrorMessage: errorResponse.Error,
Michael Yang's avatar
Michael Yang committed
233
			}
234
235
		}

Michael Yang's avatar
Michael Yang committed
236
		if err := fn(bts); err != nil {
237
			return err
Jeffrey Morgan's avatar
Jeffrey Morgan committed
238
239
240
		}
	}

Michael Yang's avatar
Michael Yang committed
241
242
	return nil
}
Jeffrey Morgan's avatar
Jeffrey Morgan committed
243

244
245
246
// GenerateResponseFunc is a function that [Client.Generate] invokes every time
// a response is received from the service. If this function returns an error,
// [Client.Generate] will stop generating and return this error.
Michael Yang's avatar
Michael Yang committed
247
type GenerateResponseFunc func(GenerateResponse) error
Jeffrey Morgan's avatar
Jeffrey Morgan committed
248

249
250
251
// Generate generates a response for a given prompt. The req parameter should
// be populated with prompt details. fn is called for each response (there may
// be multiple responses, e.g. in case streaming is enabled).
Michael Yang's avatar
Michael Yang committed
252
func (c *Client) Generate(ctx context.Context, req *GenerateRequest, fn GenerateResponseFunc) error {
253
254
255
256
257
258
259
260
	return c.stream(ctx, http.MethodPost, "/api/generate", req, func(bts []byte) error {
		var resp GenerateResponse
		if err := json.Unmarshal(bts, &resp); err != nil {
			return err
		}

		return fn(resp)
	})
Jeffrey Morgan's avatar
Jeffrey Morgan committed
261
}
Bruce MacDonald's avatar
Bruce MacDonald committed
262

263
264
265
// ChatResponseFunc is a function that [Client.Chat] invokes every time
// a response is received from the service. If this function returns an error,
// [Client.Chat] will stop generating and return this error.
Bruce MacDonald's avatar
Bruce MacDonald committed
266
267
type ChatResponseFunc func(ChatResponse) error

268
269
270
271
// Chat generates the next message in a chat. [ChatRequest] may contain a
// sequence of messages which can be used to maintain chat history with a model.
// fn is called for each response (there may be multiple responses, e.g. if case
// streaming is enabled).
Bruce MacDonald's avatar
Bruce MacDonald committed
272
273
274
275
276
277
278
279
280
281
282
func (c *Client) Chat(ctx context.Context, req *ChatRequest, fn ChatResponseFunc) error {
	return c.stream(ctx, http.MethodPost, "/api/chat", req, func(bts []byte) error {
		var resp ChatResponse
		if err := json.Unmarshal(bts, &resp); err != nil {
			return err
		}

		return fn(resp)
	})
}

283
284
285
// PullProgressFunc is a function that [Client.Pull] invokes every time there
// is progress with a "pull" request sent to the service. If this function
// returns an error, [Client.Pull] will stop the process and return this error.
286
type PullProgressFunc func(ProgressResponse) error
Michael Yang's avatar
Michael Yang committed
287

288
289
290
// Pull downloads a model from the ollama library. fn is called each time
// progress is made on the request and can be used to display a progress bar,
// etc.
Michael Yang's avatar
Michael Yang committed
291
func (c *Client) Pull(ctx context.Context, req *PullRequest, fn PullProgressFunc) error {
292
	return c.stream(ctx, http.MethodPost, "/api/pull", req, func(bts []byte) error {
293
		var resp ProgressResponse
294
295
296
297
298
299
		if err := json.Unmarshal(bts, &resp); err != nil {
			return err
		}

		return fn(resp)
	})
Bruce MacDonald's avatar
Bruce MacDonald committed
300
}
301

302
type PushProgressFunc func(ProgressResponse) error
303
304
305

func (c *Client) Push(ctx context.Context, req *PushRequest, fn PushProgressFunc) error {
	return c.stream(ctx, http.MethodPost, "/api/push", req, func(bts []byte) error {
306
		var resp ProgressResponse
307
308
309
310
311
312
313
314
		if err := json.Unmarshal(bts, &resp); err != nil {
			return err
		}

		return fn(resp)
	})
}

315
type CreateProgressFunc func(ProgressResponse) error
316
317
318

func (c *Client) Create(ctx context.Context, req *CreateRequest, fn CreateProgressFunc) error {
	return c.stream(ctx, http.MethodPost, "/api/create", req, func(bts []byte) error {
319
		var resp ProgressResponse
320
321
322
323
324
325
326
		if err := json.Unmarshal(bts, &resp); err != nil {
			return err
		}

		return fn(resp)
	})
}
Patrick Devine's avatar
Patrick Devine committed
327
328
329
330
331
332
333
334

func (c *Client) List(ctx context.Context) (*ListResponse, error) {
	var lr ListResponse
	if err := c.do(ctx, http.MethodGet, "/api/tags", nil, &lr); err != nil {
		return nil, err
	}
	return &lr, nil
}
335

Patrick Devine's avatar
Patrick Devine committed
336
337
338
339
340
341
342
func (c *Client) Copy(ctx context.Context, req *CopyRequest) error {
	if err := c.do(ctx, http.MethodPost, "/api/copy", req, nil); err != nil {
		return err
	}
	return nil
}

343
344
345
346
347
func (c *Client) Delete(ctx context.Context, req *DeleteRequest) error {
	if err := c.do(ctx, http.MethodDelete, "/api/delete", req, nil); err != nil {
		return err
	}
	return nil
348
}
349

Patrick Devine's avatar
Patrick Devine committed
350
351
352
353
354
355
356
357
func (c *Client) Show(ctx context.Context, req *ShowRequest) (*ShowResponse, error) {
	var resp ShowResponse
	if err := c.do(ctx, http.MethodPost, "/api/show", req, &resp); err != nil {
		return nil, err
	}
	return &resp, nil
}

358
func (c *Client) Heartbeat(ctx context.Context) error {
Bruce MacDonald's avatar
Bruce MacDonald committed
359
	if err := c.do(ctx, http.MethodHead, "/", nil, nil); err != nil {
360
361
362
363
		return err
	}
	return nil
}
Brian Murray's avatar
Brian Murray committed
364
365
366
367
368
369
370
func (c *Client) Embeddings(ctx context.Context, req *EmbeddingRequest) (*EmbeddingResponse, error) {
	var resp EmbeddingResponse
	if err := c.do(ctx, http.MethodPost, "/api/embeddings", req, &resp); err != nil {
		return nil, err
	}
	return &resp, nil
}
Michael Yang's avatar
Michael Yang committed
371

Michael Yang's avatar
Michael Yang committed
372
func (c *Client) CreateBlob(ctx context.Context, digest string, r io.Reader) error {
373
	return c.do(ctx, http.MethodPost, fmt.Sprintf("/api/blobs/%s", digest), r, nil)
Michael Yang's avatar
Michael Yang committed
374
}
Michael Yang's avatar
Michael Yang committed
375
376
377
378
379
380
381
382
383
384
385
386

func (c *Client) Version(ctx context.Context) (string, error) {
	var version struct {
		Version string `json:"version"`
	}

	if err := c.do(ctx, http.MethodGet, "/api/version", nil, &version); err != nil {
		return "", err
	}

	return version.Version, nil
}