Commit 948114e3 authored by Mark Ward's avatar Mark Ward
Browse files

Fix sched to wait for the runner to terminate so that the subsequent VRAM check is more accurate

parent a3e60d90
...@@ -899,7 +899,10 @@ func (s *llmServer) Detokenize(ctx context.Context, tokens []int) (string, error ...@@ -899,7 +899,10 @@ func (s *llmServer) Detokenize(ctx context.Context, tokens []int) (string, error
func (s *llmServer) Close() error { func (s *llmServer) Close() error {
if s.cmd != nil { if s.cmd != nil {
slog.Debug("stopping llama server") slog.Debug("stopping llama server")
return s.cmd.Process.Kill() if err := s.cmd.Process.Kill(); err != nil {
return err
}
return s.cmd.Wait()
} }
return nil return nil
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment