routes.go 4.8 KB
Newer Older
Jeffrey Morgan's avatar
Jeffrey Morgan committed
1
2
3
package server

import (
Michael Yang's avatar
Michael Yang committed
4
	"encoding/json"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
5
6
7
8
	"io"
	"log"
	"net"
	"net/http"
9
	"os"
Michael Yang's avatar
Michael Yang committed
10
	"path/filepath"
Michael Yang's avatar
Michael Yang committed
11
	"strings"
12
	"time"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
13

Michael Yang's avatar
Michael Yang committed
14
	"dario.cat/mergo"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
15
16
	"github.com/gin-gonic/gin"

Jeffrey Morgan's avatar
Jeffrey Morgan committed
17
	"github.com/jmorganca/ollama/api"
Michael Yang's avatar
Michael Yang committed
18
	"github.com/jmorganca/ollama/llama"
Jeffrey Morgan's avatar
Jeffrey Morgan committed
19
20
)

21
22
23
24
25
26
// cacheDir returns the ".ollama" directory located directly under the current
// user's home directory. It panics if the home directory cannot be determined.
func cacheDir() string {
	homeDir, err := os.UserHomeDir()
	if err == nil {
		return filepath.Join(homeDir, ".ollama")
	}

	panic(err)
}

Bruce MacDonald's avatar
Bruce MacDonald committed
30
func generate(c *gin.Context) {
31
32
	start := time.Now()

Michael Yang's avatar
Michael Yang committed
33
	var req api.GenerateRequest
Bruce MacDonald's avatar
Bruce MacDonald committed
34
	if err := c.ShouldBindJSON(&req); err != nil {
35
		c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
Bruce MacDonald's avatar
Bruce MacDonald committed
36
37
		return
	}
38

39
40
41
42
	model, err := GetModel(req.Model)
	if err != nil {
		c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
		return
Bruce MacDonald's avatar
Bruce MacDonald committed
43
	}
Michael Yang's avatar
Michael Yang committed
44

Michael Yang's avatar
Michael Yang committed
45
46
47
48
49
50
51
52
53
54
55
	opts := api.DefaultOptions()
	if err := mergo.Merge(&opts, model.Options, mergo.WithOverride); err != nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
		return
	}

	if err := mergo.Merge(&opts, req.Options, mergo.WithOverride); err != nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
		return
	}

56
	prompt, err := model.Prompt(req)
57
58
59
	if err != nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
		return
Michael Yang's avatar
Michael Yang committed
60
61
	}

Michael Yang's avatar
Michael Yang committed
62
	llm, err := llama.New(model.ModelPath, opts)
Michael Yang's avatar
Michael Yang committed
63
64
65
66
67
	if err != nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
		return
	}
	defer llm.Close()
Jeffrey Morgan's avatar
Jeffrey Morgan committed
68

Michael Yang's avatar
Michael Yang committed
69
70
71
	ch := make(chan any)
	go func() {
		defer close(ch)
72
		llm.Predict(req.Context, prompt, func(r api.GenerateResponse) {
Michael Yang's avatar
Michael Yang committed
73
74
75
76
77
78
79
80
81
			r.Model = req.Model
			r.CreatedAt = time.Now().UTC()
			if r.Done {
				r.TotalDuration = time.Since(start)
			}

			ch <- r
		})
	}()
Michael Yang's avatar
Michael Yang committed
82

Michael Yang's avatar
Michael Yang committed
83
	streamResponse(c, ch)
Michael Yang's avatar
Michael Yang committed
84
}
Michael Yang's avatar
Michael Yang committed
85

Michael Yang's avatar
Michael Yang committed
86
87
88
89
90
91
92
// pull binds an api.PullRequest from the request body and streams the
// progress reported by PullModel back to the client, one JSON value per line.
//
// A request body that cannot be bound is answered with 400 and
// {"error": "<message>"}. A failure reported by PullModel is delivered as a
// final {"error": "<message>"} line in the stream.
func pull(c *gin.Context) {
	var req api.PullRequest
	if err := c.ShouldBindJSON(&req); err != nil {
		c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
		return
	}

	ch := make(chan any)
	go func() {
		defer close(ch)

		fn := func(r api.ProgressResponse) {
			ch <- r
		}

		if err := PullModel(req.Name, req.Username, req.Password, fn); err != nil {
			// Hand the error to the streaming goroutine instead of calling
			// c.JSON here: the handler goroutine owns the response writer and
			// may be writing or flushing an earlier progress line at this very
			// moment, and once progress has been streamed the status line has
			// already been sent, so a late status code cannot take effect.
			ch <- gin.H{"error": err.Error()}
			return
		}
	}()

	streamResponse(c, ch)
}

func push(c *gin.Context) {
	var req api.PushRequest
	if err := c.ShouldBindJSON(&req); err != nil {
		c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
Michael Yang's avatar
Michael Yang committed
113
114
		return
	}
Michael Yang's avatar
Michael Yang committed
115

116
117
118
	ch := make(chan any)
	go func() {
		defer close(ch)
119
120
		fn := func(r api.ProgressResponse) {
			ch <- r
121
		}
122

123
124
125
126
127
128
129
130
131
132
133
134
135
		if err := PushModel(req.Name, req.Username, req.Password, fn); err != nil {
			c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
			return
		}
	}()

	streamResponse(c, ch)
}

func create(c *gin.Context) {
	var req api.CreateRequest
	if err := c.ShouldBindJSON(&req); err != nil {
		c.JSON(http.StatusBadRequest, gin.H{"message": err.Error()})
Michael Yang's avatar
Michael Yang committed
136
		return
137
138
	}

Michael Yang's avatar
Michael Yang committed
139
	ch := make(chan any)
Michael Yang's avatar
Michael Yang committed
140
141
	go func() {
		defer close(ch)
142
143
144
		fn := func(status string) {
			ch <- api.CreateProgress{
				Status: status,
Michael Yang's avatar
Michael Yang committed
145
			}
146
147
		}

148
		if err := CreateModel(req.Name, req.Path, fn); err != nil {
149
150
151
			c.JSON(http.StatusBadRequest, gin.H{"message": err.Error()})
			return
		}
Michael Yang's avatar
Michael Yang committed
152
	}()
Michael Yang's avatar
Michael Yang committed
153

Michael Yang's avatar
Michael Yang committed
154
	streamResponse(c, ch)
Bruce MacDonald's avatar
Bruce MacDonald committed
155
156
}

Patrick Devine's avatar
Patrick Devine committed
157
158
159
160
161
162
163
164
165
166
167
168
169
170
func list(c *gin.Context) {
	var models []api.ListResponseModel
	fp, err := GetManifestPath()
	if err != nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
		return
	}
	err = filepath.Walk(fp, func(path string, info os.FileInfo, err error) error {
		if err != nil {
			return err
		}
		if !info.IsDir() {
			fi, err := os.Stat(path)
			if err != nil {
171
172
				log.Printf("skipping file: %s", fp)
				return nil
Patrick Devine's avatar
Patrick Devine committed
173
174
175
176
177
178
179
180
181
182
			}
			path := path[len(fp)+1:]
			slashIndex := strings.LastIndex(path, "/")
			if slashIndex == -1 {
				return nil
			}
			tag := path[:slashIndex] + ":" + path[slashIndex+1:]
			mp := ParseModelPath(tag)
			manifest, err := GetManifest(mp)
			if err != nil {
183
184
				log.Printf("skipping file: %s", fp)
				return nil
Patrick Devine's avatar
Patrick Devine committed
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
			}
			model := api.ListResponseModel{
				Name:       mp.GetShortTagname(),
				Size:       manifest.GetTotalSize(),
				ModifiedAt: fi.ModTime(),
			}
			models = append(models, model)
		}
		return nil
	})
	if err != nil {
		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
		return
	}

	c.JSON(http.StatusOK, api.ListResponse{models})
}

Bruce MacDonald's avatar
Bruce MacDonald committed
203
204
205
func Serve(ln net.Listener) error {
	r := gin.Default()

206
207
208
209
	r.GET("/", func(c *gin.Context) {
		c.String(http.StatusOK, "Ollama is running")
	})

Michael Yang's avatar
Michael Yang committed
210
	r.POST("/api/pull", pull)
Bruce MacDonald's avatar
Bruce MacDonald committed
211
	r.POST("/api/generate", generate)
212
213
	r.POST("/api/create", create)
	r.POST("/api/push", push)
Patrick Devine's avatar
Patrick Devine committed
214
	r.GET("/api/tags", list)
Jeffrey Morgan's avatar
Jeffrey Morgan committed
215
216
217
218
219
220
221
222

	log.Printf("Listening on %s", ln.Addr())
	s := &http.Server{
		Handler: r,
	}

	return s.Serve(ln)
}
Michael Yang's avatar
Michael Yang committed
223

Michael Yang's avatar
Michael Yang committed
224
func streamResponse(c *gin.Context, ch chan any) {
Michael Yang's avatar
Michael Yang committed
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
	c.Stream(func(w io.Writer) bool {
		val, ok := <-ch
		if !ok {
			return false
		}

		bts, err := json.Marshal(val)
		if err != nil {
			return false
		}

		bts = append(bts, '\n')
		if _, err := w.Write(bts); err != nil {
			return false
		}

		return true
	})
}