Unverified commit 021dcf08, authored by Michael Yang and committed by GitHub
Browse files

Merge pull request #9824 from ollama/mxyng/sched

conditionally enable parallel pipelines
parents bf24498b 4561fff3
...@@ -373,7 +373,7 @@ func New(r *os.File, params ml.BackendParams) (ml.Backend, error) { ...@@ -373,7 +373,7 @@ func New(r *os.File, params ml.BackendParams) (ml.Backend, error) {
(*C.ggml_backend_buffer_type_t)(unsafe.Pointer(&schedBufts[0])), (*C.ggml_backend_buffer_type_t)(unsafe.Pointer(&schedBufts[0])),
C.int(len(schedBackends)), C.int(len(schedBackends)),
C.size_t(maxGraphNodes), C.size_t(maxGraphNodes),
true, C._Bool(len(gpus) > 1 && slices.Contains(gpus, output.d)),
), ),
input: deviceBufferTypes[input.d], input: deviceBufferTypes[input.d],
output: deviceBufferTypes[output.d], output: deviceBufferTypes[output.d],
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment