Commit 948114e3 authored by Mark Ward
Browse files

Fix sched to wait for the runner to terminate so that the subsequent VRAM check is more accurate

parent a3e60d90
......@@ -899,7 +899,10 @@ func (s *llmServer) Detokenize(ctx context.Context, tokens []int) (string, error
func (s *llmServer) Close() error {
if s.cmd != nil {
slog.Debug("stopping llama server")
return s.cmd.Process.Kill()
if err := s.cmd.Process.Kill(); err != nil {
return err
}
return s.cmd.Wait()
}
return nil
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment