Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
cfb3bf25
Unverified
Commit
cfb3bf25
authored
Nov 27, 2024
by
yansh97
Committed by
GitHub
Nov 27, 2024
Browse files
[bugfix] fix the default value of llm_int8_threshold in BitsAndBytesConfig (#10657)
parent
1bf905dd
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
2 deletions
+2
-2
vllm/model_executor/layers/quantization/bitsandbytes.py
vllm/model_executor/layers/quantization/bitsandbytes.py
+2
-2
No files found.
vllm/model_executor/layers/quantization/bitsandbytes.py
View file @
cfb3bf25
...
@@ -26,7 +26,7 @@ class BitsAndBytesConfig(QuantizationConfig):
...
@@ -26,7 +26,7 @@ class BitsAndBytesConfig(QuantizationConfig):
llm_int8_enable_fp32_cpu_offload
:
bool
=
False
,
llm_int8_enable_fp32_cpu_offload
:
bool
=
False
,
llm_int8_has_fp16_weight
:
bool
=
False
,
llm_int8_has_fp16_weight
:
bool
=
False
,
llm_int8_skip_modules
:
Optional
[
List
[
str
]]
=
None
,
llm_int8_skip_modules
:
Optional
[
List
[
str
]]
=
None
,
llm_int8_threshold
:
float
=
0
.0
,
llm_int8_threshold
:
float
=
6
.0
,
)
->
None
:
)
->
None
:
self
.
load_in_8bit
=
load_in_8bit
self
.
load_in_8bit
=
load_in_8bit
...
@@ -103,7 +103,7 @@ class BitsAndBytesConfig(QuantizationConfig):
...
@@ -103,7 +103,7 @@ class BitsAndBytesConfig(QuantizationConfig):
[
"llm_int8_skip_modules"
],
[
"llm_int8_skip_modules"
],
default_value
=
[])
default_value
=
[])
llm_int8_threshold
=
get_safe_value
(
config
,
[
"llm_int8_threshold"
],
llm_int8_threshold
=
get_safe_value
(
config
,
[
"llm_int8_threshold"
],
default_value
=
0
.0
)
default_value
=
6
.0
)
return
cls
(
return
cls
(
load_in_8bit
=
load_in_8bit
,
load_in_8bit
=
load_in_8bit
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment