llm: remove ambiguous comment when putting upper limit on predictions to avoid...

llm: remove ambiguous comment when putting upper limit on predictions to avoid infinite generation (#5535)

llm: remove ambiguous comment when putting upper limit on predictions to avoid...
llm: remove ambiguous comment when putting upper limit on predictions to avoid infinite generation (#5535)
53da2c69 · Jeffrey Morgan · GitHub · d8def1ff · 53da2c69
Unverified commit 53da2c69, authored Jul 07, 2024 by Jeffrey Morgan; committed by GitHub on Jul 07, 2024
Show whitespace changes
Inline Side-by-side

Showing with 1 addition and 2 deletions

llm/server.go → llm/server.go (+1 -2)

No files found.
--- a/llm/server.go
+++ b/llm/server.go
@@ -699,10 +699,9 @@ func (s *llmServer) Completion(ctx context.Context, req CompletionRequest, fn fu
 	}
 	defer s.sem.Release(1)
-	// only allow maximum 10 "context shifts" to avoid infinite generation
+	// put an upper limit on num_predict to avoid the model running on forever
 	if req.Options.NumPredict < 0 || req.Options.NumPredict > 10*s.options.NumCtx {
 		req.Options.NumPredict = 10 * s.options.NumCtx
-		slog.Debug("setting token limit to 10x num_ctx", "num_ctx", s.options.NumCtx, "num_predict", req.Options.NumPredict)
 	}
 	request := map[string]any{