Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
0ce0539d
Unverified
Commit
0ce0539d
authored
Apr 07, 2024
by
Isotr0py
Committed by
GitHub
Apr 07, 2024
Browse files
[Bugfix] Fix Llava inference with Tensor Parallelism. (#3883)
parent
2f192835
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
0 deletions
+2
-0
vllm/executor/ray_gpu_executor.py
vllm/executor/ray_gpu_executor.py
+2
-0
No files found.
vllm/executor/ray_gpu_executor.py
View file @
0ce0539d
...
...
@@ -154,6 +154,7 @@ class RayGPUExecutor(ExecutorBase):
scheduler_config
=
copy
.
deepcopy
(
self
.
scheduler_config
)
device_config
=
copy
.
deepcopy
(
self
.
device_config
)
lora_config
=
copy
.
deepcopy
(
self
.
lora_config
)
vision_language_config
=
copy
.
deepcopy
(
self
.
vision_language_config
)
kv_cache_dtype
=
self
.
cache_config
.
cache_dtype
# Initialize the actual workers with the Worker class.
...
...
@@ -172,6 +173,7 @@ class RayGPUExecutor(ExecutorBase):
rank
,
distributed_init_method
,
lora_config
=
lora_config
,
vision_language_config
=
vision_language_config
,
kv_cache_dtype
=
kv_cache_dtype
,
))
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment