"tests/pipelines/pag/test_pag_hunyuan_dit.py" did not exist on "e1d508ae921035a0ec72d06754b41879421b0308"
openai.go 19.2 KB
Newer Older
1
// openai package provides core transformation logic for partial compatibility with the OpenAI REST API
2
3
4
package openai

import (
5
	"bytes"
6
	"encoding/base64"
7
	"encoding/binary"
8
	"encoding/json"
Michael Yang's avatar
lint  
Michael Yang committed
9
	"errors"
10
	"fmt"
royjhan's avatar
royjhan committed
11
	"log/slog"
12
	"net/http"
13
	"slices"
14
	"strings"
15
16
	"time"

17
	"github.com/ollama/ollama/api"
18
	"github.com/ollama/ollama/types/model"
19
20
)

21
22
var finishReasonToolCalls = "tool_calls"

23
type Error struct {
24
25
26
27
	Message string  `json:"message"`
	Type    string  `json:"type"`
	Param   any     `json:"param"`
	Code    *string `json:"code"`
28
29
30
31
32
33
34
}

type ErrorResponse struct {
	Error Error `json:"error"`
}

type Message struct {
35
36
37
38
39
40
	Role       string     `json:"role"`
	Content    any        `json:"content"`
	Reasoning  string     `json:"reasoning,omitempty"`
	ToolCalls  []ToolCall `json:"tool_calls,omitempty"`
	Name       string     `json:"name,omitempty"`
	ToolCallID string     `json:"tool_call_id,omitempty"`
41
42
43
44
45
46
47
48
49
50
51
52
53
54
}

type Choice struct {
	Index        int     `json:"index"`
	Message      Message `json:"message"`
	FinishReason *string `json:"finish_reason"`
}

type ChunkChoice struct {
	Index        int     `json:"index"`
	Delta        Message `json:"delta"`
	FinishReason *string `json:"finish_reason"`
}

55
56
57
58
59
60
type CompleteChunkChoice struct {
	Text         string  `json:"text"`
	Index        int     `json:"index"`
	FinishReason *string `json:"finish_reason"`
}

61
62
63
64
65
66
67
type Usage struct {
	PromptTokens     int `json:"prompt_tokens"`
	CompletionTokens int `json:"completion_tokens"`
	TotalTokens      int `json:"total_tokens"`
}

type ResponseFormat struct {
68
69
70
71
72
	Type       string      `json:"type"`
	JsonSchema *JsonSchema `json:"json_schema,omitempty"`
}

type JsonSchema struct {
73
	Schema json.RawMessage `json:"schema"`
74
75
}

76
type EmbedRequest struct {
77
78
79
80
	Input          any    `json:"input"`
	Model          string `json:"model"`
	Dimensions     int    `json:"dimensions,omitempty"`
	EncodingFormat string `json:"encoding_format,omitempty"` // "float" or "base64"
81
82
}

83
84
85
86
type StreamOptions struct {
	IncludeUsage bool `json:"include_usage"`
}

Michael Yang's avatar
Michael Yang committed
87
type Reasoning struct {
88
	Effort string `json:"effort,omitempty"`
Michael Yang's avatar
Michael Yang committed
89
90
}

91
92
93
94
type ChatCompletionRequest struct {
	Model            string          `json:"model"`
	Messages         []Message       `json:"messages"`
	Stream           bool            `json:"stream"`
95
	StreamOptions    *StreamOptions  `json:"stream_options"`
96
97
98
99
100
	MaxTokens        *int            `json:"max_tokens"`
	Seed             *int            `json:"seed"`
	Stop             any             `json:"stop"`
	Temperature      *float64        `json:"temperature"`
	FrequencyPenalty *float64        `json:"frequency_penalty"`
101
	PresencePenalty  *float64        `json:"presence_penalty"`
102
103
	TopP             *float64        `json:"top_p"`
	ResponseFormat   *ResponseFormat `json:"response_format"`
royjhan's avatar
royjhan committed
104
	Tools            []api.Tool      `json:"tools"`
Michael Yang's avatar
Michael Yang committed
105
	Reasoning        *Reasoning      `json:"reasoning,omitempty"`
106
	ReasoningEffort  *string         `json:"reasoning_effort,omitempty"`
Devon Rifkin's avatar
Devon Rifkin committed
107
	DebugRenderOnly  bool            `json:"_debug_render_only"`
108
109
110
}

type ChatCompletion struct {
Devon Rifkin's avatar
Devon Rifkin committed
111
112
113
114
115
116
117
118
	Id                string         `json:"id"`
	Object            string         `json:"object"`
	Created           int64          `json:"created"`
	Model             string         `json:"model"`
	SystemFingerprint string         `json:"system_fingerprint"`
	Choices           []Choice       `json:"choices"`
	Usage             Usage          `json:"usage,omitempty"`
	DebugInfo         *api.DebugInfo `json:"_debug_info,omitempty"`
119
120
121
122
123
124
125
126
127
}

type ChatCompletionChunk struct {
	Id                string        `json:"id"`
	Object            string        `json:"object"`
	Created           int64         `json:"created"`
	Model             string        `json:"model"`
	SystemFingerprint string        `json:"system_fingerprint"`
	Choices           []ChunkChoice `json:"choices"`
128
	Usage             *Usage        `json:"usage,omitempty"`
129
130
}

131
132
// TODO (https://github.com/ollama/ollama/issues/5259): support []string, []int and [][]int
type CompletionRequest struct {
133
134
135
136
137
138
139
140
141
142
143
144
	Model            string         `json:"model"`
	Prompt           string         `json:"prompt"`
	FrequencyPenalty float32        `json:"frequency_penalty"`
	MaxTokens        *int           `json:"max_tokens"`
	PresencePenalty  float32        `json:"presence_penalty"`
	Seed             *int           `json:"seed"`
	Stop             any            `json:"stop"`
	Stream           bool           `json:"stream"`
	StreamOptions    *StreamOptions `json:"stream_options"`
	Temperature      *float32       `json:"temperature"`
	TopP             float32        `json:"top_p"`
	Suffix           string         `json:"suffix"`
Devon Rifkin's avatar
Devon Rifkin committed
145
	DebugRenderOnly  bool           `json:"_debug_render_only"`
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
}

type Completion struct {
	Id                string                `json:"id"`
	Object            string                `json:"object"`
	Created           int64                 `json:"created"`
	Model             string                `json:"model"`
	SystemFingerprint string                `json:"system_fingerprint"`
	Choices           []CompleteChunkChoice `json:"choices"`
	Usage             Usage                 `json:"usage,omitempty"`
}

type CompletionChunk struct {
	Id                string                `json:"id"`
	Object            string                `json:"object"`
	Created           int64                 `json:"created"`
	Choices           []CompleteChunkChoice `json:"choices"`
	Model             string                `json:"model"`
	SystemFingerprint string                `json:"system_fingerprint"`
165
	Usage             *Usage                `json:"usage,omitempty"`
166
167
}

royjhan's avatar
royjhan committed
168
169
type ToolCall struct {
	ID       string `json:"id"`
170
	Index    int    `json:"index"`
royjhan's avatar
royjhan committed
171
172
173
174
175
176
177
	Type     string `json:"type"`
	Function struct {
		Name      string `json:"name"`
		Arguments string `json:"arguments"`
	} `json:"function"`
}

178
179
180
181
182
183
184
type Model struct {
	Id      string `json:"id"`
	Object  string `json:"object"`
	Created int64  `json:"created"`
	OwnedBy string `json:"owned_by"`
}

185
type Embedding struct {
186
187
188
	Object    string `json:"object"`
	Embedding any    `json:"embedding"` // Can be []float32 (float format) or string (base64 format)
	Index     int    `json:"index"`
189
190
}

191
192
193
194
195
type ListCompletion struct {
	Object string  `json:"object"`
	Data   []Model `json:"data"`
}

196
type EmbeddingList struct {
197
198
199
200
201
202
203
204
205
	Object string         `json:"object"`
	Data   []Embedding    `json:"data"`
	Model  string         `json:"model"`
	Usage  EmbeddingUsage `json:"usage,omitempty"`
}

type EmbeddingUsage struct {
	PromptTokens int `json:"prompt_tokens"`
	TotalTokens  int `json:"total_tokens"`
206
207
}

208
209
210
211
212
213
214
215
216
217
218
219
220
221
func NewError(code int, message string) ErrorResponse {
	var etype string
	switch code {
	case http.StatusBadRequest:
		etype = "invalid_request_error"
	case http.StatusNotFound:
		etype = "not_found_error"
	default:
		etype = "api_error"
	}

	return ErrorResponse{Error{Type: etype, Message: message}}
}

222
223
// ToUsage converts an api.ChatResponse to Usage
func ToUsage(r api.ChatResponse) Usage {
224
	return Usage{
225
226
227
		PromptTokens:     r.Metrics.PromptEvalCount,
		CompletionTokens: r.Metrics.EvalCount,
		TotalTokens:      r.Metrics.PromptEvalCount + r.Metrics.EvalCount,
228
229
230
	}
}

231
232
// ToToolCalls converts api.ToolCall to OpenAI ToolCall format
func ToToolCalls(tc []api.ToolCall) []ToolCall {
233
234
	toolCalls := make([]ToolCall, len(tc))
	for i, tc := range tc {
Grace's avatar
Grace committed
235
		toolCalls[i].ID = tc.ID
royjhan's avatar
royjhan committed
236
237
		toolCalls[i].Type = "function"
		toolCalls[i].Function.Name = tc.Function.Name
238
		toolCalls[i].Index = tc.Function.Index
royjhan's avatar
royjhan committed
239
240
241
242
243
244
245
246
247

		args, err := json.Marshal(tc.Function.Arguments)
		if err != nil {
			slog.Error("could not marshall function arguments to json", "error", err)
			continue
		}

		toolCalls[i].Function.Arguments = string(args)
	}
248
249
	return toolCalls
}
royjhan's avatar
royjhan committed
250

251
252
// ToChatCompletion converts an api.ChatResponse to ChatCompletion
func ToChatCompletion(id string, r api.ChatResponse) ChatCompletion {
253
	toolCalls := ToToolCalls(r.Message.ToolCalls)
254
255
256
257
258
259
260
	return ChatCompletion{
		Id:                id,
		Object:            "chat.completion",
		Created:           r.CreatedAt.Unix(),
		Model:             r.Model,
		SystemFingerprint: "fp_ollama",
		Choices: []Choice{{
261
			Index:   0,
Michael Yang's avatar
Michael Yang committed
262
			Message: Message{Role: r.Message.Role, Content: r.Message.Content, ToolCalls: toolCalls, Reasoning: r.Message.Thinking},
263
			FinishReason: func(reason string) *string {
264
265
266
				if len(toolCalls) > 0 {
					reason = "tool_calls"
				}
267
268
269
270
271
				if len(reason) > 0 {
					return &reason
				}
				return nil
			}(r.DoneReason),
272
		}}, Usage: ToUsage(r),
Devon Rifkin's avatar
Devon Rifkin committed
273
		DebugInfo: r.DebugInfo,
274
275
276
	}
}

277
278
// ToChunk converts an api.ChatResponse to ChatCompletionChunk
func ToChunk(id string, r api.ChatResponse, toolCallSent bool) ChatCompletionChunk {
279
	toolCalls := ToToolCalls(r.Message.ToolCalls)
280
281
282
283
284
285
	return ChatCompletionChunk{
		Id:                id,
		Object:            "chat.completion.chunk",
		Created:           time.Now().Unix(),
		Model:             r.Model,
		SystemFingerprint: "fp_ollama",
286
287
		Choices: []ChunkChoice{{
			Index: 0,
Michael Yang's avatar
Michael Yang committed
288
			Delta: Message{Role: "assistant", Content: r.Message.Content, ToolCalls: toolCalls, Reasoning: r.Message.Thinking},
289
290
			FinishReason: func(reason string) *string {
				if len(reason) > 0 {
Michael Yang's avatar
Michael Yang committed
291
					if toolCallSent || len(toolCalls) > 0 {
292
293
						return &finishReasonToolCalls
					}
294
295
296
297
298
					return &reason
				}
				return nil
			}(r.DoneReason),
		}},
299
300
301
	}
}

302
303
// ToUsageGenerate converts an api.GenerateResponse to Usage
func ToUsageGenerate(r api.GenerateResponse) Usage {
304
	return Usage{
305
306
307
		PromptTokens:     r.Metrics.PromptEvalCount,
		CompletionTokens: r.Metrics.EvalCount,
		TotalTokens:      r.Metrics.PromptEvalCount + r.Metrics.EvalCount,
308
309
310
	}
}

311
312
// ToCompletion converts an api.GenerateResponse to Completion
func ToCompletion(id string, r api.GenerateResponse) Completion {
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
	return Completion{
		Id:                id,
		Object:            "text_completion",
		Created:           r.CreatedAt.Unix(),
		Model:             r.Model,
		SystemFingerprint: "fp_ollama",
		Choices: []CompleteChunkChoice{{
			Text:  r.Response,
			Index: 0,
			FinishReason: func(reason string) *string {
				if len(reason) > 0 {
					return &reason
				}
				return nil
			}(r.DoneReason),
		}},
329
		Usage: ToUsageGenerate(r),
330
331
332
	}
}

333
334
// ToCompleteChunk converts an api.GenerateResponse to CompletionChunk
func ToCompleteChunk(id string, r api.GenerateResponse) CompletionChunk {
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
	return CompletionChunk{
		Id:                id,
		Object:            "text_completion",
		Created:           time.Now().Unix(),
		Model:             r.Model,
		SystemFingerprint: "fp_ollama",
		Choices: []CompleteChunkChoice{{
			Text:  r.Response,
			Index: 0,
			FinishReason: func(reason string) *string {
				if len(reason) > 0 {
					return &reason
				}
				return nil
			}(r.DoneReason),
		}},
	}
}

354
355
// ToListCompletion converts an api.ListResponse to ListCompletion
func ToListCompletion(r api.ListResponse) ListCompletion {
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
	var data []Model
	for _, m := range r.Models {
		data = append(data, Model{
			Id:      m.Name,
			Object:  "model",
			Created: m.ModifiedAt.Unix(),
			OwnedBy: model.ParseName(m.Name).Namespace,
		})
	}

	return ListCompletion{
		Object: "list",
		Data:   data,
	}
}

372
// ToEmbeddingList converts an api.EmbedResponse to EmbeddingList
373
374
// encodingFormat can be "float", "base64", or empty (defaults to "float")
func ToEmbeddingList(model string, r api.EmbedResponse, encodingFormat string) EmbeddingList {
375
376
377
	if r.Embeddings != nil {
		var data []Embedding
		for i, e := range r.Embeddings {
378
379
380
381
382
383
384
			var embedding any
			if strings.EqualFold(encodingFormat, "base64") {
				embedding = floatsToBase64(e)
			} else {
				embedding = e
			}

385
386
			data = append(data, Embedding{
				Object:    "embedding",
387
				Embedding: embedding,
388
389
390
391
392
393
394
395
				Index:     i,
			})
		}

		return EmbeddingList{
			Object: "list",
			Data:   data,
			Model:  model,
396
397
398
399
			Usage: EmbeddingUsage{
				PromptTokens: r.PromptEvalCount,
				TotalTokens:  r.PromptEvalCount,
			},
400
401
402
403
404
405
		}
	}

	return EmbeddingList{}
}

406
407
408
409
410
411
412
// floatsToBase64 encodes a []float32 to a base64 string
func floatsToBase64(floats []float32) string {
	var buf bytes.Buffer
	binary.Write(&buf, binary.LittleEndian, floats)
	return base64.StdEncoding.EncodeToString(buf.Bytes())
}

413
414
// ToModel converts an api.ShowResponse to Model
func ToModel(r api.ShowResponse, m string) Model {
415
416
417
418
419
420
421
422
	return Model{
		Id:      m,
		Object:  "model",
		Created: r.ModifiedAt.Unix(),
		OwnedBy: model.ParseName(m).Namespace,
	}
}

423
424
// FromChatRequest converts a ChatCompletionRequest to api.ChatRequest
func FromChatRequest(r ChatCompletionRequest) (*api.ChatRequest, error) {
425
426
	var messages []api.Message
	for _, msg := range r.Messages {
427
428
429
430
431
432
433
		toolName := ""
		if strings.ToLower(msg.Role) == "tool" {
			toolName = msg.Name
			if toolName == "" && msg.ToolCallID != "" {
				toolName = nameFromToolCallID(r.Messages, msg.ToolCallID)
			}
		}
434
435
		switch content := msg.Content.(type) {
		case string:
436
			toolCalls, err := FromCompletionToolCall(msg.ToolCalls)
437
438
439
			if err != nil {
				return nil, err
			}
440
			messages = append(messages, api.Message{Role: msg.Role, Content: content, Thinking: msg.Reasoning, ToolCalls: toolCalls, ToolName: toolName, ToolCallID: msg.ToolCallID})
441
442
443
444
		case []any:
			for _, c := range content {
				data, ok := c.(map[string]any)
				if !ok {
Michael Yang's avatar
lint  
Michael Yang committed
445
					return nil, errors.New("invalid message format")
446
447
448
449
450
				}
				switch data["type"] {
				case "text":
					text, ok := data["text"].(string)
					if !ok {
Michael Yang's avatar
lint  
Michael Yang committed
451
						return nil, errors.New("invalid message format")
452
					}
453
					messages = append(messages, api.Message{Role: msg.Role, Content: text})
454
455
456
457
				case "image_url":
					var url string
					if urlMap, ok := data["image_url"].(map[string]any); ok {
						if url, ok = urlMap["url"].(string); !ok {
Michael Yang's avatar
lint  
Michael Yang committed
458
							return nil, errors.New("invalid message format")
459
460
461
						}
					} else {
						if url, ok = data["image_url"].(string); !ok {
Michael Yang's avatar
lint  
Michael Yang committed
462
							return nil, errors.New("invalid message format")
463
464
465
						}
					}

466
					types := []string{"jpeg", "jpg", "png", "webp"}
467
					valid := false
468
469
470
471
472
					// support blank mime type to match api/chat taking just unadorned base64
					if strings.HasPrefix(url, "data:;base64,") {
						url = strings.TrimPrefix(url, "data:;base64,")
						valid = true
					}
473
474
475
476
477
478
479
480
481
482
					for _, t := range types {
						prefix := "data:image/" + t + ";base64,"
						if strings.HasPrefix(url, prefix) {
							url = strings.TrimPrefix(url, prefix)
							valid = true
							break
						}
					}

					if !valid {
Michael Yang's avatar
lint  
Michael Yang committed
483
						return nil, errors.New("invalid image input")
484
485
486
487
					}

					img, err := base64.StdEncoding.DecodeString(url)
					if err != nil {
Michael Yang's avatar
lint  
Michael Yang committed
488
						return nil, errors.New("invalid message format")
489
					}
490
491

					messages = append(messages, api.Message{Role: msg.Role, Images: []api.ImageData{img}})
492
				default:
Michael Yang's avatar
lint  
Michael Yang committed
493
					return nil, errors.New("invalid message format")
494
495
				}
			}
496
497
498
			// since we might have added multiple messages above, if we have tools
			// calls we'll add them to the last message
			if len(messages) > 0 && len(msg.ToolCalls) > 0 {
499
				toolCalls, err := FromCompletionToolCall(msg.ToolCalls)
500
501
502
503
				if err != nil {
					return nil, err
				}
				messages[len(messages)-1].ToolCalls = toolCalls
504
505
				messages[len(messages)-1].ToolName = toolName
				messages[len(messages)-1].ToolCallID = msg.ToolCallID
506
				messages[len(messages)-1].Thinking = msg.Reasoning
507
			}
508
		default:
509
			// content is only optional if tool calls are present
royjhan's avatar
royjhan committed
510
511
512
513
			if msg.ToolCalls == nil {
				return nil, fmt.Errorf("invalid message content type: %T", content)
			}

514
515
516
			toolCalls, err := FromCompletionToolCall(msg.ToolCalls)
			if err != nil {
				return nil, err
royjhan's avatar
royjhan committed
517
			}
518
			messages = append(messages, api.Message{Role: msg.Role, Thinking: msg.Reasoning, ToolCalls: toolCalls, ToolCallID: msg.ToolCallID})
519
		}
520
521
	}

522
	options := make(map[string]any)
523
524
525
526

	switch stop := r.Stop.(type) {
	case string:
		options["stop"] = []string{stop}
527
	case []any:
528
529
530
531
532
533
534
535
536
537
538
539
540
541
		var stops []string
		for _, s := range stop {
			if str, ok := s.(string); ok {
				stops = append(stops, str)
			}
		}
		options["stop"] = stops
	}

	if r.MaxTokens != nil {
		options["num_predict"] = *r.MaxTokens
	}

	if r.Temperature != nil {
542
		options["temperature"] = *r.Temperature
543
544
545
546
547
548
549
550
551
	} else {
		options["temperature"] = 1.0
	}

	if r.Seed != nil {
		options["seed"] = *r.Seed
	}

	if r.FrequencyPenalty != nil {
552
		options["frequency_penalty"] = *r.FrequencyPenalty
553
554
555
	}

	if r.PresencePenalty != nil {
556
		options["presence_penalty"] = *r.PresencePenalty
557
558
559
560
561
562
563
564
	}

	if r.TopP != nil {
		options["top_p"] = *r.TopP
	} else {
		options["top_p"] = 1.0
	}

565
566
567
568
569
570
571
572
	var format json.RawMessage
	if r.ResponseFormat != nil {
		switch strings.ToLower(strings.TrimSpace(r.ResponseFormat.Type)) {
		// Support the old "json_object" type for OpenAI compatibility
		case "json_object":
			format = json.RawMessage(`"json"`)
		case "json_schema":
			if r.ResponseFormat.JsonSchema != nil {
573
				format = r.ResponseFormat.JsonSchema.Schema
574
575
			}
		}
576
577
	}

Michael Yang's avatar
Michael Yang committed
578
	var think *api.ThinkValue
579
580
	var effort string

Michael Yang's avatar
Michael Yang committed
581
	if r.Reasoning != nil {
582
583
584
585
586
587
588
589
		effort = r.Reasoning.Effort
	} else if r.ReasoningEffort != nil {
		effort = *r.ReasoningEffort
	}

	if effort != "" {
		if !slices.Contains([]string{"high", "medium", "low", "none"}, effort) {
			return nil, fmt.Errorf("invalid reasoning value: '%s' (must be \"high\", \"medium\", \"low\", or \"none\")", effort)
Michael Yang's avatar
Michael Yang committed
590
		}
591

592
		if effort == "none" {
593
594
			think = &api.ThinkValue{Value: false}
		} else {
595
			think = &api.ThinkValue{Value: effort}
596
		}
Michael Yang's avatar
Michael Yang committed
597
598
	}

599
	return &api.ChatRequest{
Devon Rifkin's avatar
Devon Rifkin committed
600
601
602
603
604
605
606
607
		Model:           r.Model,
		Messages:        messages,
		Format:          format,
		Options:         options,
		Stream:          &r.Stream,
		Tools:           r.Tools,
		Think:           think,
		DebugRenderOnly: r.DebugRenderOnly,
608
	}, nil
609
610
}

611
612
613
614
615
616
617
618
619
620
621
622
623
624
func nameFromToolCallID(messages []Message, toolCallID string) string {
	// iterate backwards to be more resilient to duplicate tool call IDs (this
	// follows "last one wins")
	for i := len(messages) - 1; i >= 0; i-- {
		msg := messages[i]
		for _, tc := range msg.ToolCalls {
			if tc.ID == toolCallID {
				return tc.Function.Name
			}
		}
	}
	return ""
}

625
626
// FromCompletionToolCall converts OpenAI ToolCall format to api.ToolCall
func FromCompletionToolCall(toolCalls []ToolCall) ([]api.ToolCall, error) {
627
628
	apiToolCalls := make([]api.ToolCall, len(toolCalls))
	for i, tc := range toolCalls {
629
		apiToolCalls[i].ID = tc.ID
630
631
632
633
634
635
636
637
638
639
		apiToolCalls[i].Function.Name = tc.Function.Name
		err := json.Unmarshal([]byte(tc.Function.Arguments), &apiToolCalls[i].Function.Arguments)
		if err != nil {
			return nil, errors.New("invalid tool call arguments")
		}
	}

	return apiToolCalls, nil
}

640
641
// FromCompleteRequest converts a CompletionRequest to api.GenerateRequest
func FromCompleteRequest(r CompletionRequest) (api.GenerateRequest, error) {
642
643
644
645
646
	options := make(map[string]any)

	switch stop := r.Stop.(type) {
	case string:
		options["stop"] = []string{stop}
647
648
649
650
651
652
653
654
	case []any:
		var stops []string
		for _, s := range stop {
			if str, ok := s.(string); ok {
				stops = append(stops, str)
			} else {
				return api.GenerateRequest{}, fmt.Errorf("invalid type for 'stop' field: %T", s)
			}
655
		}
656
		options["stop"] = stops
657
658
659
660
661
662
663
	}

	if r.MaxTokens != nil {
		options["num_predict"] = *r.MaxTokens
	}

	if r.Temperature != nil {
664
		options["temperature"] = *r.Temperature
665
666
667
668
669
670
671
672
	} else {
		options["temperature"] = 1.0
	}

	if r.Seed != nil {
		options["seed"] = *r.Seed
	}

673
	options["frequency_penalty"] = r.FrequencyPenalty
674

675
	options["presence_penalty"] = r.PresencePenalty
676
677
678
679
680
681
682
683

	if r.TopP != 0.0 {
		options["top_p"] = r.TopP
	} else {
		options["top_p"] = 1.0
	}

	return api.GenerateRequest{
Devon Rifkin's avatar
Devon Rifkin committed
684
685
686
687
688
689
		Model:           r.Model,
		Prompt:          r.Prompt,
		Options:         options,
		Stream:          &r.Stream,
		Suffix:          r.Suffix,
		DebugRenderOnly: r.DebugRenderOnly,
690
691
	}, nil
}