Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
orangecat
ollama
Commits
d06bc0cb
"examples/vscode:/vscode.git/clone" did not exist on "5177e65ff04eb8295c98d443b4a42ca186ee2a74"
Unverified
Commit
d06bc0cb
authored
Oct 05, 2023
by
Bruce MacDonald
Committed by
GitHub
Oct 05, 2023
Browse files
enable q8, q5, 5_1, and f32 for linux gpu (#699)
parent
d104b7e9
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
17 additions
and
14 deletions
+17
-14
llm/llm.go
llm/llm.go
+17
-14
No files found.
llm/llm.go
View file @
d06bc0cb
...
@@ -5,6 +5,7 @@ import (
...
@@ -5,6 +5,7 @@ import (
"fmt"
"fmt"
"log"
"log"
"os"
"os"
"runtime"
"github.com/pbnjay/memory"
"github.com/pbnjay/memory"
...
@@ -37,20 +38,22 @@ func New(workDir, model string, adapters []string, opts api.Options) (LLM, error
...
@@ -37,20 +38,22 @@ func New(workDir, model string, adapters []string, opts api.Options) (LLM, error
return
nil
,
err
return
nil
,
err
}
}
switch
ggml
.
FileType
()
{
if
runtime
.
GOOS
==
"darwin"
{
case
"Q8_0"
:
switch
ggml
.
FileType
()
{
if
ggml
.
Name
()
!=
"gguf"
&&
opts
.
NumGPU
!=
0
{
case
"Q8_0"
:
// GGML Q8_0 does not support the Metal API and will
if
ggml
.
Name
()
!=
"gguf"
&&
opts
.
NumGPU
!=
0
{
// cause the runner to segmentation fault so disable GPU
// GGML Q8_0 does not support the Metal API and will
log
.
Printf
(
"WARNING: GPU disabled for F32, Q5_0, Q5_1, and Q8_0"
)
// cause the runner to segmentation fault so disable GPU
opts
.
NumGPU
=
0
log
.
Printf
(
"WARNING: GPU disabled for F32, Q5_0, Q5_1, and Q8_0"
)
}
opts
.
NumGPU
=
0
case
"F32"
,
"Q5_0"
,
"Q5_1"
:
}
if
opts
.
NumGPU
!=
0
{
case
"F32"
,
"Q5_0"
,
"Q5_1"
:
// F32, Q5_0, Q5_1, and Q8_0 do not support Metal API and will
if
opts
.
NumGPU
!=
0
{
// cause the runner to segmentation fault so disable GPU
// F32, Q5_0, Q5_1, and Q8_0 do not support Metal API and will
log
.
Printf
(
"WARNING: GPU disabled for F32, Q5_0, Q5_1, and Q8_0"
)
// cause the runner to segmentation fault so disable GPU
opts
.
NumGPU
=
0
log
.
Printf
(
"WARNING: GPU disabled for F32, Q5_0, Q5_1, and Q8_0"
)
opts
.
NumGPU
=
0
}
}
}
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment