Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
ollama
Commits
bd6e38fb
Commit
bd6e38fb
authored
Oct 12, 2023
by
Michael Yang
Browse files
refactor memory check
parent
92189a58
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
15 additions
and
26 deletions
+15
-26
llm/llm.go
llm/llm.go
+15
-26
No files found.
llm/llm.go
View file @
bd6e38fb
...
...
@@ -58,38 +58,27 @@ func New(workDir, model string, adapters []string, opts api.Options) (LLM, error
}
}
totalResidentMemory
:=
memory
.
TotalMemory
()
var
requiredMemory
int64
var
f16Multiplier
int64
=
2
totalResidentMemory
:=
int64
(
memory
.
TotalMemory
())
switch
ggml
.
ModelType
()
{
case
"3B"
,
"7B"
:
if
ggml
.
FileType
()
==
"F16"
&&
totalResidentMemory
<
16
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"F16 model requires at least 16 GB of memory"
)
}
else
if
totalResidentMemory
<
8
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"model requires at least 8 GB of memory"
)
}
requiredMemory
=
8
*
format
.
GigaByte
case
"13B"
:
if
ggml
.
FileType
()
==
"F16"
&&
totalResidentMemory
<
32
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"F16 model requires at least 32 GB of memory"
)
}
else
if
totalResidentMemory
<
16
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"model requires at least 16 GB of memory"
)
}
requiredMemory
=
16
*
format
.
GigaByte
case
"30B"
,
"34B"
,
"40B"
:
if
ggml
.
FileType
()
==
"F16"
&&
totalResidentMemory
<
64
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"F16 model requires at least 64 GB of memory"
)
}
else
if
totalResidentMemory
<
32
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"model requires at least 32 GB of memory"
)
}
requiredMemory
=
32
*
format
.
GigaByte
case
"65B"
,
"70B"
:
if
ggml
.
FileType
()
==
"F16"
&&
totalResidentMemory
<
128
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"F16 model requires at least 128 GB of memory"
)
}
else
if
totalResidentMemory
<
64
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"model requires at least 64 GB of memory"
)
}
requiredMemory
=
64
*
format
.
GigaByte
case
"180B"
:
if
ggml
.
FileType
()
==
"F16"
&&
totalResidentMemory
<
512
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"F16 model requires at least 512GB of memory"
)
}
else
if
totalResidentMemory
<
128
*
format
.
GigaByte
{
return
nil
,
fmt
.
Errorf
(
"model requires at least 128GB of memory"
)
}
requiredMemory
=
128
*
format
.
GigaByte
f16Multiplier
=
4
}
if
ggml
.
FileType
()
==
"F16"
&&
requiredMemory
*
f16Multiplier
>
totalResidentMemory
{
return
nil
,
fmt
.
Errorf
(
"F16 model requires at least %s of memory"
,
format
.
HumanBytes
(
requiredMemory
))
}
else
if
requiredMemory
>
totalResidentMemory
{
return
nil
,
fmt
.
Errorf
(
"model requires at least %s of memory"
,
format
.
HumanBytes
(
requiredMemory
))
}
switch
ggml
.
Name
()
{
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment