Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
479d69fa
Unverified
Commit
479d69fa
authored
Apr 24, 2024
by
Nick Hill
Committed by
GitHub
Apr 25, 2024
Browse files
[Core] Move ray_utils.py from `engine` to `executor` package (#4347)
parent
96e90fde
Changes
7
Hide whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
11 additions
and
9 deletions
+11
-9
vllm/__init__.py
vllm/__init__.py
+1
-1
vllm/engine/async_llm_engine.py
vllm/engine/async_llm_engine.py
+1
-1
vllm/engine/llm_engine.py
vllm/engine/llm_engine.py
+1
-1
vllm/executor/ray_gpu_executor.py
vllm/executor/ray_gpu_executor.py
+6
-4
vllm/executor/ray_utils.py
vllm/executor/ray_utils.py
+0
-0
vllm/transformers_utils/tokenizer_group/__init__.py
vllm/transformers_utils/tokenizer_group/__init__.py
+1
-1
vllm/transformers_utils/tokenizer_group/ray_tokenizer_group.py
...transformers_utils/tokenizer_group/ray_tokenizer_group.py
+1
-1
No files found.
vllm/__init__.py
View file @
479d69fa
...
@@ -3,8 +3,8 @@
...
@@ -3,8 +3,8 @@
from
vllm.engine.arg_utils
import
AsyncEngineArgs
,
EngineArgs
from
vllm.engine.arg_utils
import
AsyncEngineArgs
,
EngineArgs
from
vllm.engine.async_llm_engine
import
AsyncLLMEngine
from
vllm.engine.async_llm_engine
import
AsyncLLMEngine
from
vllm.engine.llm_engine
import
LLMEngine
from
vllm.engine.llm_engine
import
LLMEngine
from
vllm.engine.ray_utils
import
initialize_ray_cluster
from
vllm.entrypoints.llm
import
LLM
from
vllm.entrypoints.llm
import
LLM
from
vllm.executor.ray_utils
import
initialize_ray_cluster
from
vllm.model_executor.models
import
ModelRegistry
from
vllm.model_executor.models
import
ModelRegistry
from
vllm.outputs
import
CompletionOutput
,
RequestOutput
from
vllm.outputs
import
CompletionOutput
,
RequestOutput
from
vllm.sampling_params
import
SamplingParams
from
vllm.sampling_params
import
SamplingParams
...
...
vllm/engine/async_llm_engine.py
View file @
479d69fa
...
@@ -10,7 +10,7 @@ from transformers import PreTrainedTokenizer
...
@@ -10,7 +10,7 @@ from transformers import PreTrainedTokenizer
from
vllm.config
import
ModelConfig
from
vllm.config
import
ModelConfig
from
vllm.engine.arg_utils
import
AsyncEngineArgs
from
vllm.engine.arg_utils
import
AsyncEngineArgs
from
vllm.engine.llm_engine
import
LLMEngine
from
vllm.engine.llm_engine
import
LLMEngine
from
vllm.e
ngine
.ray_utils
import
initialize_ray_cluster
,
ray
from
vllm.e
xecutor
.ray_utils
import
initialize_ray_cluster
,
ray
from
vllm.logger
import
init_logger
from
vllm.logger
import
init_logger
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.outputs
import
RequestOutput
from
vllm.outputs
import
RequestOutput
...
...
vllm/engine/llm_engine.py
View file @
479d69fa
...
@@ -15,8 +15,8 @@ from vllm.engine.output_processor.interfaces import (
...
@@ -15,8 +15,8 @@ from vllm.engine.output_processor.interfaces import (
SequenceGroupOutputProcessor
)
SequenceGroupOutputProcessor
)
from
vllm.engine.output_processor.stop_checker
import
StopChecker
from
vllm.engine.output_processor.stop_checker
import
StopChecker
from
vllm.engine.output_processor.util
import
create_output_by_sequence_group
from
vllm.engine.output_processor.util
import
create_output_by_sequence_group
from
vllm.engine.ray_utils
import
initialize_ray_cluster
from
vllm.executor.executor_base
import
ExecutorBase
from
vllm.executor.executor_base
import
ExecutorBase
from
vllm.executor.ray_utils
import
initialize_ray_cluster
from
vllm.logger
import
init_logger
from
vllm.logger
import
init_logger
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.outputs
import
RequestOutput
from
vllm.outputs
import
RequestOutput
...
...
vllm/executor/ray_gpu_executor.py
View file @
479d69fa
...
@@ -5,8 +5,8 @@ from collections import defaultdict
...
@@ -5,8 +5,8 @@ from collections import defaultdict
from
itertools
import
islice
,
repeat
from
itertools
import
islice
,
repeat
from
typing
import
TYPE_CHECKING
,
Any
,
Dict
,
List
,
Optional
,
Set
,
Tuple
from
typing
import
TYPE_CHECKING
,
Any
,
Dict
,
List
,
Optional
,
Set
,
Tuple
from
vllm.engine.ray_utils
import
RayWorkerWrapper
,
ray
from
vllm.executor.executor_base
import
ExecutorAsyncBase
,
ExecutorBase
from
vllm.executor.executor_base
import
ExecutorAsyncBase
,
ExecutorBase
from
vllm.executor.ray_utils
import
RayWorkerWrapper
,
ray
from
vllm.logger
import
init_logger
from
vllm.logger
import
init_logger
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.sequence
import
SamplerOutput
,
SequenceGroupMetadata
from
vllm.sequence
import
SamplerOutput
,
SequenceGroupMetadata
...
@@ -74,7 +74,7 @@ class RayGPUExecutor(ExecutorBase):
...
@@ -74,7 +74,7 @@ class RayGPUExecutor(ExecutorBase):
# The driver dummy worker does not actually use any resources.
# The driver dummy worker does not actually use any resources.
# It holds the resource for the driver worker.
# It holds the resource for the driver worker.
self
.
driver_dummy_worker
:
RayWorkerWrapper
=
None
self
.
driver_dummy_worker
:
Optional
[
RayWorkerWrapper
]
=
None
# The remaining workers are the actual ray actors.
# The remaining workers are the actual ray actors.
self
.
workers
:
List
[
RayWorkerWrapper
]
=
[]
self
.
workers
:
List
[
RayWorkerWrapper
]
=
[]
...
@@ -318,6 +318,7 @@ class RayGPUExecutor(ExecutorBase):
...
@@ -318,6 +318,7 @@ class RayGPUExecutor(ExecutorBase):
driver_worker_output
=
self
.
driver_worker
.
execute_method
(
driver_worker_output
=
self
.
driver_worker
.
execute_method
(
method
,
*
driver_args
,
**
driver_kwargs
)
method
,
*
driver_args
,
**
driver_kwargs
)
else
:
else
:
assert
self
.
driver_dummy_worker
is
not
None
driver_worker_output
=
ray
.
get
(
driver_worker_output
=
ray
.
get
(
self
.
driver_dummy_worker
.
execute_method
.
remote
(
self
.
driver_dummy_worker
.
execute_method
.
remote
(
method
,
*
driver_args
,
**
driver_kwargs
))
method
,
*
driver_args
,
**
driver_kwargs
))
...
@@ -353,8 +354,9 @@ class RayGPUExecutor(ExecutorBase):
...
@@ -353,8 +354,9 @@ class RayGPUExecutor(ExecutorBase):
# a dummy value for now. It will be fixed soon.
# a dummy value for now. It will be fixed soon.
with
InputNode
()
as
input_data
:
with
InputNode
()
as
input_data
:
forward_dag
=
MultiOutputNode
([
forward_dag
=
MultiOutputNode
([
worker
.
execute_model_compiled_dag_remote
.
bind
(
input_data
)
worker
.
execute_model_compiled_dag_remote
.
for
worker
in
self
.
workers
bind
(
# type: ignore[attr-defined]
input_data
)
for
worker
in
self
.
workers
])
])
return
forward_dag
.
experimental_compile
()
return
forward_dag
.
experimental_compile
()
...
...
vllm/e
ngine
/ray_utils.py
→
vllm/e
xecutor
/ray_utils.py
View file @
479d69fa
File moved
vllm/transformers_utils/tokenizer_group/__init__.py
View file @
479d69fa
from
typing
import
Optional
from
typing
import
Optional
from
vllm.config
import
TokenizerPoolConfig
from
vllm.config
import
TokenizerPoolConfig
from
vllm.e
ngine
.ray_utils
import
ray
from
vllm.e
xecutor
.ray_utils
import
ray
from
vllm.transformers_utils.tokenizer_group.base_tokenizer_group
import
(
from
vllm.transformers_utils.tokenizer_group.base_tokenizer_group
import
(
BaseTokenizerGroup
)
BaseTokenizerGroup
)
from
vllm.transformers_utils.tokenizer_group.tokenizer_group
import
(
from
vllm.transformers_utils.tokenizer_group.tokenizer_group
import
(
...
...
vllm/transformers_utils/tokenizer_group/ray_tokenizer_group.py
View file @
479d69fa
...
@@ -6,7 +6,7 @@ from ray.util.scheduling_strategies import NodeAffinitySchedulingStrategy
...
@@ -6,7 +6,7 @@ from ray.util.scheduling_strategies import NodeAffinitySchedulingStrategy
from
transformers
import
PreTrainedTokenizer
from
transformers
import
PreTrainedTokenizer
from
vllm.config
import
TokenizerPoolConfig
from
vllm.config
import
TokenizerPoolConfig
from
vllm.e
ngine
.ray_utils
import
ray
from
vllm.e
xecutor
.ray_utils
import
ray
from
vllm.lora.request
import
LoRARequest
from
vllm.lora.request
import
LoRARequest
from
vllm.transformers_utils.tokenizer_group.base_tokenizer_group
import
(
from
vllm.transformers_utils.tokenizer_group.base_tokenizer_group
import
(
BaseTokenizerGroup
)
BaseTokenizerGroup
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment