upload.go 9 KB
Newer Older
Michael Yang's avatar
Michael Yang committed
1
2
3
4
package server

import (
	"context"
5
	"crypto/md5"
Michael Yang's avatar
Michael Yang committed
6
7
	"errors"
	"fmt"
8
	"hash"
Michael Yang's avatar
Michael Yang committed
9
	"io"
10
	"log/slog"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
11
	"math"
Michael Yang's avatar
Michael Yang committed
12
13
14
	"net/http"
	"net/url"
	"os"
Michael Yang's avatar
Michael Yang committed
15
	"sync"
Michael Yang's avatar
Michael Yang committed
16
17
	"sync/atomic"
	"time"
Michael Yang's avatar
Michael Yang committed
18

19
20
	"github.com/ollama/ollama/api"
	"github.com/ollama/ollama/format"
21
	"golang.org/x/sync/errgroup"
Michael Yang's avatar
Michael Yang committed
22
23
)

Michael Yang's avatar
Michael Yang committed
24
25
26
27
28
29
30
31
32
33
34
35
36
37
// blobUploadManager holds the uploads that are currently registered, keyed by
// layer digest, with *blobUpload values.
var blobUploadManager sync.Map

type blobUpload struct {
	*Layer

	Total     int64
	Completed atomic.Int64

	Parts []blobUploadPart

	nextURL chan *url.URL

	context.CancelFunc

38
39
	file *os.File

Michael Yang's avatar
Michael Yang committed
40
41
42
43
44
	done       bool
	err        error
	references atomic.Int32
}

45
const (
Michael Yang's avatar
Michael Yang committed
46
	numUploadParts          = 64
Michael Yang's avatar
Michael Yang committed
47
48
	minUploadPartSize int64 = 100 * format.MegaByte
	maxUploadPartSize int64 = 1000 * format.MegaByte
49
50
)

Michael Yang's avatar
Michael Yang committed
51
func (b *blobUpload) Prepare(ctx context.Context, requestURL *url.URL, opts *registryOptions) error {
Michael Yang's avatar
Michael Yang committed
52
53
54
55
56
57
	p, err := GetBlobsPath(b.Digest)
	if err != nil {
		return err
	}

	if b.From != "" {
Michael Yang's avatar
Michael Yang committed
58
		values := requestURL.Query()
Michael Yang's avatar
Michael Yang committed
59
		values.Add("mount", b.Digest)
60
		values.Add("from", ParseModelPath(b.From).GetNamespaceRepository())
Michael Yang's avatar
Michael Yang committed
61
62
63
		requestURL.RawQuery = values.Encode()
	}

Michael Yang's avatar
Michael Yang committed
64
	resp, err := makeRequestWithRetry(ctx, http.MethodPost, requestURL, nil, nil, opts)
Michael Yang's avatar
Michael Yang committed
65
	if err != nil {
Michael Yang's avatar
Michael Yang committed
66
		return err
Michael Yang's avatar
Michael Yang committed
67
68
69
	}
	defer resp.Body.Close()

70
	location := resp.Header.Get("Docker-Upload-Location")
Michael Yang's avatar
Michael Yang committed
71
	if location == "" {
72
73
74
		location = resp.Header.Get("Location")
	}

Michael Yang's avatar
Michael Yang committed
75
	fi, err := os.Stat(p)
76
	if err != nil {
Michael Yang's avatar
Michael Yang committed
77
		return err
Michael Yang's avatar
Michael Yang committed
78
79
	}

Michael Yang's avatar
Michael Yang committed
80
81
	b.Total = fi.Size()

Michael Yang's avatar
Michael Yang committed
82
83
84
85
86
87
88
89
	// http.StatusCreated indicates a blob has been mounted
	// ref: https://distribution.github.io/distribution/spec/api/#cross-repository-blob-mount
	if resp.StatusCode == http.StatusCreated {
		b.Completed.Store(b.Total)
		b.done = true
		return nil
	}

Michael Yang's avatar
Michael Yang committed
90
	size := b.Total / numUploadParts
Michael Yang's avatar
Michael Yang committed
91
92
93
94
95
96
97
98
99
100
101
102
103
	switch {
	case size < minUploadPartSize:
		size = minUploadPartSize
	case size > maxUploadPartSize:
		size = maxUploadPartSize
	}

	var offset int64
	for offset < fi.Size() {
		if offset+size > fi.Size() {
			size = fi.Size() - offset
		}

Michael Yang's avatar
Michael Yang committed
104
		// set part.N to the current number of parts
105
		b.Parts = append(b.Parts, blobUploadPart{N: len(b.Parts), Offset: offset, Size: size})
Michael Yang's avatar
Michael Yang committed
106
107
		offset += size
	}
Michael Yang's avatar
Michael Yang committed
108

109
	slog.Info(fmt.Sprintf("uploading %s in %d %s part(s)", b.Digest[7:19], len(b.Parts), format.HumanBytes(b.Parts[0].Size)))
Michael Yang's avatar
Michael Yang committed
110

Michael Yang's avatar
Michael Yang committed
111
	requestURL, err = url.Parse(location)
Michael Yang's avatar
Michael Yang committed
112
113
114
115
	if err != nil {
		return err
	}

Michael Yang's avatar
Michael Yang committed
116
117
118
119
120
	b.nextURL = make(chan *url.URL, 1)
	b.nextURL <- requestURL
	return nil
}

Michael Yang's avatar
Michael Yang committed
121
122
// Run uploads blob parts to the upstream. If the upstream supports redirection, parts will be uploaded
// in parallel as defined by Prepare. Otherwise, parts will be uploaded serially. Run sets b.err on error.
Michael Yang's avatar
Michael Yang committed
123
func (b *blobUpload) Run(ctx context.Context, opts *registryOptions) {
Michael Yang's avatar
Michael Yang committed
124
125
126
	defer blobUploadManager.Delete(b.Digest)
	ctx, b.CancelFunc = context.WithCancel(ctx)

127
128
129
130
131
132
133
134
135
136
137
138
139
	p, err := GetBlobsPath(b.Digest)
	if err != nil {
		b.err = err
		return
	}

	b.file, err = os.Open(p)
	if err != nil {
		b.err = err
		return
	}
	defer b.file.Close()

140
141
	g, inner := errgroup.WithContext(ctx)
	g.SetLimit(numUploadParts)
Michael Yang's avatar
Michael Yang committed
142
143
	for i := range b.Parts {
		part := &b.Parts[i]
Michael Yang's avatar
Michael Yang committed
144
145
146
		select {
		case <-inner.Done():
		case requestURL := <-b.nextURL:
147
			g.Go(func() error {
Michael Yang's avatar
Michael Yang committed
148
				var err error
Michael Yang's avatar
Michael Yang committed
149
				for try := 0; try < maxRetries; try++ {
150
					err = b.uploadPart(inner, http.MethodPatch, requestURL, part, opts)
Michael Yang's avatar
Michael Yang committed
151
152
153
154
155
156
					switch {
					case errors.Is(err, context.Canceled):
						return err
					case errors.Is(err, errMaxRetriesExceeded):
						return err
					case err != nil:
Jeffrey Morgan's avatar
Jeffrey Morgan committed
157
						sleep := time.Second * time.Duration(math.Pow(2, float64(try)))
158
						slog.Info(fmt.Sprintf("%s part %d attempt %d failed: %v, retrying in %s", b.Digest[7:19], part.N, try, err, sleep))
Michael Yang's avatar
Michael Yang committed
159
						time.Sleep(sleep)
Michael Yang's avatar
Michael Yang committed
160
161
162
163
						continue
					}

					return nil
Michael Yang's avatar
Michael Yang committed
164
165
				}

Michael Yang's avatar
Michael Yang committed
166
				return fmt.Errorf("%w: %w", errMaxRetriesExceeded, err)
Michael Yang's avatar
Michael Yang committed
167
168
			})
		}
Michael Yang's avatar
Michael Yang committed
169
	}
170

Michael Yang's avatar
Michael Yang committed
171
	if err := g.Wait(); err != nil {
Michael Yang's avatar
Michael Yang committed
172
173
		b.err = err
		return
Michael Yang's avatar
Michael Yang committed
174
175
	}

Michael Yang's avatar
Michael Yang committed
176
177
	requestURL := <-b.nextURL

178
	// calculate md5 checksum and add it to the commit request
179
	md5sum := md5.New()
180
	for _, part := range b.Parts {
181
		md5sum.Write(part.Sum(nil))
182
183
	}

Michael Yang's avatar
Michael Yang committed
184
	values := requestURL.Query()
Michael Yang's avatar
Michael Yang committed
185
	values.Add("digest", b.Digest)
186
	values.Add("etag", fmt.Sprintf("%x-%d", md5sum.Sum(nil), len(b.Parts)))
Michael Yang's avatar
Michael Yang committed
187
188
189
190
191
192
	requestURL.RawQuery = values.Encode()

	headers := make(http.Header)
	headers.Set("Content-Type", "application/octet-stream")
	headers.Set("Content-Length", "0")

Michael Yang's avatar
Michael Yang committed
193
	for try := 0; try < maxRetries; try++ {
Michael Yang's avatar
Michael Yang committed
194
195
196
197
198
		var resp *http.Response
		resp, err = makeRequestWithRetry(ctx, http.MethodPut, requestURL, headers, nil, opts)
		if errors.Is(err, context.Canceled) {
			break
		} else if err != nil {
Jeffrey Morgan's avatar
Jeffrey Morgan committed
199
			sleep := time.Second * time.Duration(math.Pow(2, float64(try)))
200
			slog.Info(fmt.Sprintf("%s complete upload attempt %d failed: %v, retrying in %s", b.Digest[7:19], try, err, sleep))
Michael Yang's avatar
Michael Yang committed
201
202
203
204
			time.Sleep(sleep)
			continue
		}
		defer resp.Body.Close()
Michael Yang's avatar
Michael Yang committed
205
		break
Michael Yang's avatar
Michael Yang committed
206
	}
Michael Yang's avatar
Michael Yang committed
207
208
209

	b.err = err
	b.done = true
Michael Yang's avatar
Michael Yang committed
210
}
Michael Yang's avatar
Michael Yang committed
211

Michael Yang's avatar
Michael Yang committed
212
func (b *blobUpload) uploadPart(ctx context.Context, method string, requestURL *url.URL, part *blobUploadPart, opts *registryOptions) error {
Michael Yang's avatar
Michael Yang committed
213
214
	headers := make(http.Header)
	headers.Set("Content-Type", "application/octet-stream")
Michael Yang's avatar
Michael Yang committed
215
	headers.Set("Content-Length", fmt.Sprintf("%d", part.Size))
216
217

	if method == http.MethodPatch {
218
		headers.Set("X-Redirect-Uploads", "1")
Michael Yang's avatar
Michael Yang committed
219
		headers.Set("Content-Range", fmt.Sprintf("%d-%d", part.Offset, part.Offset+part.Size-1))
220
	}
Michael Yang's avatar
Michael Yang committed
221

222
	sr := io.NewSectionReader(b.file, part.Offset, part.Size)
223
224
225
226

	md5sum := md5.New()
	w := &progressWriter{blobUpload: b}

Michael Yang's avatar
Michael Yang committed
227
	resp, err := makeRequest(ctx, method, requestURL, headers, io.TeeReader(sr, io.MultiWriter(w, md5sum)), opts)
Michael Yang's avatar
Michael Yang committed
228
	if err != nil {
229
		w.Rollback()
Michael Yang's avatar
Michael Yang committed
230
231
232
		return err
	}
	defer resp.Body.Close()
Michael Yang's avatar
Michael Yang committed
233

Michael Yang's avatar
Michael Yang committed
234
235
236
237
238
239
240
	location := resp.Header.Get("Docker-Upload-Location")
	if location == "" {
		location = resp.Header.Get("Location")
	}

	nextURL, err := url.Parse(location)
	if err != nil {
241
		w.Rollback()
Michael Yang's avatar
Michael Yang committed
242
243
244
245
246
		return err
	}

	switch {
	case resp.StatusCode == http.StatusTemporaryRedirect:
247
		w.Rollback()
Michael Yang's avatar
Michael Yang committed
248
249
250
251
252
253
		b.nextURL <- nextURL

		redirectURL, err := resp.Location()
		if err != nil {
			return err
		}
254

Jeffrey Morgan's avatar
Jeffrey Morgan committed
255
		// retry uploading to the redirect URL
Michael Yang's avatar
Michael Yang committed
256
		for try := 0; try < maxRetries; try++ {
257
			err = b.uploadPart(ctx, http.MethodPut, redirectURL, part, nil)
Michael Yang's avatar
Michael Yang committed
258
259
260
261
262
263
			switch {
			case errors.Is(err, context.Canceled):
				return err
			case errors.Is(err, errMaxRetriesExceeded):
				return err
			case err != nil:
Jeffrey Morgan's avatar
Jeffrey Morgan committed
264
				sleep := time.Second * time.Duration(math.Pow(2, float64(try)))
265
				slog.Info(fmt.Sprintf("%s part %d attempt %d failed: %v, retrying in %s", b.Digest[7:19], part.N, try, err, sleep))
Jeffrey Morgan's avatar
Jeffrey Morgan committed
266
				time.Sleep(sleep)
267
268
269
				continue
			}

Michael Yang's avatar
Michael Yang committed
270
271
272
			return nil
		}

Michael Yang's avatar
Michael Yang committed
273
		return fmt.Errorf("%w: %w", errMaxRetriesExceeded, err)
Michael Yang's avatar
Michael Yang committed
274

Michael Yang's avatar
Michael Yang committed
275
	case resp.StatusCode == http.StatusUnauthorized:
276
		w.Rollback()
Michael Yang's avatar
Michael Yang committed
277
278
		challenge := parseRegistryChallenge(resp.Header.Get("www-authenticate"))
		token, err := getAuthorizationToken(ctx, challenge)
Michael Yang's avatar
Michael Yang committed
279
280
281
		if err != nil {
			return err
		}
Michael Yang's avatar
Michael Yang committed
282

Michael Yang's avatar
Michael Yang committed
283
284
285
		opts.Token = token
		fallthrough
	case resp.StatusCode >= http.StatusBadRequest:
286
		w.Rollback()
Michael Yang's avatar
Michael Yang committed
287
288
289
		body, err := io.ReadAll(resp.Body)
		if err != nil {
			return err
Michael Yang's avatar
Michael Yang committed
290
291
		}

292
		return fmt.Errorf("http status %s: %s", resp.Status, body)
Michael Yang's avatar
Michael Yang committed
293
294
	}

Michael Yang's avatar
Michael Yang committed
295
296
297
298
	if method == http.MethodPatch {
		b.nextURL <- nextURL
	}

Michael Yang's avatar
Michael Yang committed
299
	part.Hash = md5sum
Michael Yang's avatar
Michael Yang committed
300
	return nil
Michael Yang's avatar
Michael Yang committed
301
302
}

Michael Yang's avatar
Michael Yang committed
303
304
func (b *blobUpload) acquire() {
	b.references.Add(1)
Michael Yang's avatar
Michael Yang committed
305
306
}

Michael Yang's avatar
Michael Yang committed
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
// release drops one reference and, when the count reaches zero, cancels the
// upload by calling b.CancelFunc.
// NOTE(review): b.CancelFunc is assigned in Run; presumably Run has always
// started by the time release is called — confirm.
func (b *blobUpload) release() {
	if b.references.Add(-1) == 0 {
		b.CancelFunc()
	}
}

func (b *blobUpload) Wait(ctx context.Context, fn func(api.ProgressResponse)) error {
	b.acquire()
	defer b.release()

	ticker := time.NewTicker(60 * time.Millisecond)
	for {
		select {
		case <-ticker.C:
		case <-ctx.Done():
			return ctx.Err()
		}

		fn(api.ProgressResponse{
Jeffrey Morgan's avatar
Jeffrey Morgan committed
326
			Status:    fmt.Sprintf("pushing %s", b.Digest[7:19]),
Michael Yang's avatar
Michael Yang committed
327
328
329
			Digest:    b.Digest,
			Total:     b.Total,
			Completed: b.Completed.Load(),
Michael Yang's avatar
Michael Yang committed
330
331
		})

Michael Yang's avatar
Michael Yang committed
332
333
334
		if b.done || b.err != nil {
			return b.err
		}
Michael Yang's avatar
Michael Yang committed
335
	}
Michael Yang's avatar
Michael Yang committed
336
}
Michael Yang's avatar
Michael Yang committed
337

Michael Yang's avatar
Michael Yang committed
338
339
// blobUploadPart describes one contiguous byte range of a blob.
type blobUploadPart struct {
	// N is the part number
	N int

	// Offset and Size locate the part within the blob, in bytes.
	Offset int64
	Size   int64

	// Hash is the MD5 state of the part's contents; uploadPart sets it once
	// the part has been sent.
	hash.Hash
}
345

346
347
type progressWriter struct {
	written int64
Michael Yang's avatar
Michael Yang committed
348
349
350
	*blobUpload
}

351
func (p *progressWriter) Write(b []byte) (n int, err error) {
Michael Yang's avatar
Michael Yang committed
352
353
354
	n = len(b)
	p.written += int64(n)
	p.Completed.Add(int64(n))
Michael Yang's avatar
Michael Yang committed
355
356
	return n, nil
}
Michael Yang's avatar
Michael Yang committed
357

358
359
func (p *progressWriter) Rollback() {
	p.Completed.Add(-p.written)
Michael Yang's avatar
Michael Yang committed
360
361
362
	p.written = 0
}

Michael Yang's avatar
Michael Yang committed
363
func uploadBlob(ctx context.Context, mp ModelPath, layer *Layer, opts *registryOptions, fn func(api.ProgressResponse)) error {
Michael Yang's avatar
Michael Yang committed
364
365
366
	requestURL := mp.BaseURL()
	requestURL = requestURL.JoinPath("v2", mp.GetNamespaceRepository(), "blobs", layer.Digest)

Michael Yang's avatar
Michael Yang committed
367
368
369
370
	resp, err := makeRequestWithRetry(ctx, http.MethodHead, requestURL, nil, nil, opts)
	switch {
	case errors.Is(err, os.ErrNotExist):
	case err != nil:
Michael Yang's avatar
Michael Yang committed
371
		return err
Michael Yang's avatar
Michael Yang committed
372
373
	default:
		defer resp.Body.Close()
Michael Yang's avatar
Michael Yang committed
374
		fn(api.ProgressResponse{
Jeffrey Morgan's avatar
Jeffrey Morgan committed
375
			Status:    fmt.Sprintf("pushing %s", layer.Digest[7:19]),
Michael Yang's avatar
Michael Yang committed
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
			Digest:    layer.Digest,
			Total:     layer.Size,
			Completed: layer.Size,
		})

		return nil
	}

	data, ok := blobUploadManager.LoadOrStore(layer.Digest, &blobUpload{Layer: layer})
	upload := data.(*blobUpload)
	if !ok {
		requestURL := mp.BaseURL()
		requestURL = requestURL.JoinPath("v2", mp.GetNamespaceRepository(), "blobs/uploads/")
		if err := upload.Prepare(ctx, requestURL, opts); err != nil {
			blobUploadManager.Delete(layer.Digest)
			return err
		}

Michael Yang's avatar
Michael Yang committed
394
		// nolint: contextcheck
Michael Yang's avatar
Michael Yang committed
395
396
397
398
399
		go upload.Run(context.Background(), opts)
	}

	return upload.Wait(ctx, fn)
}