Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
dad961ef
Unverified
Commit
dad961ef
authored
Aug 19, 2024
by
Ali Panahi
Committed by
GitHub
Aug 19, 2024
Browse files
[Bugfix] fix lora_dtype value type in arg_utils.py - part 2 (#5428)
parent
3ac50b47
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
3 additions
and
1 deletion
+3
-1
vllm/engine/arg_utils.py
vllm/engine/arg_utils.py
+3
-1
No files found.
vllm/engine/arg_utils.py
View file @
dad961ef
...
@@ -5,6 +5,8 @@ from dataclasses import dataclass
...
@@ -5,6 +5,8 @@ from dataclasses import dataclass
from
typing
import
(
TYPE_CHECKING
,
Dict
,
List
,
Mapping
,
Optional
,
Tuple
,
Type
,
from
typing
import
(
TYPE_CHECKING
,
Dict
,
List
,
Mapping
,
Optional
,
Tuple
,
Type
,
Union
)
Union
)
import
torch
import
vllm.envs
as
envs
import
vllm.envs
as
envs
from
vllm.config
import
(
CacheConfig
,
DecodingConfig
,
DeviceConfig
,
from
vllm.config
import
(
CacheConfig
,
DecodingConfig
,
DeviceConfig
,
EngineConfig
,
LoadConfig
,
LoRAConfig
,
ModelConfig
,
EngineConfig
,
LoadConfig
,
LoRAConfig
,
ModelConfig
,
...
@@ -113,7 +115,7 @@ class EngineArgs:
...
@@ -113,7 +115,7 @@ class EngineArgs:
fully_sharded_loras
:
bool
=
False
fully_sharded_loras
:
bool
=
False
lora_extra_vocab_size
:
int
=
256
lora_extra_vocab_size
:
int
=
256
long_lora_scaling_factors
:
Optional
[
Tuple
[
float
]]
=
None
long_lora_scaling_factors
:
Optional
[
Tuple
[
float
]]
=
None
lora_dtype
:
str
=
'auto'
lora_dtype
:
Optional
[
Union
[
str
,
torch
.
dtype
]]
=
'auto'
max_cpu_loras
:
Optional
[
int
]
=
None
max_cpu_loras
:
Optional
[
int
]
=
None
device
:
str
=
'auto'
device
:
str
=
'auto'
num_scheduler_steps
:
int
=
1
num_scheduler_steps
:
int
=
1
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment