Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
a8f12a63
Unverified
Commit
a8f12a63
authored
Mar 20, 2025
by
Richard Liu
Committed by
GitHub
Mar 20, 2025
Browse files
Fix env vars for running Ray distributed backend on GKE (#15166)
Signed-off-by:
Richard Liu
<
ricliu@google.com
>
parent
69ae2380
Changes
3
Show whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
8 additions
and
0 deletions
+8
-0
vllm/executor/ray_distributed_executor.py
vllm/executor/ray_distributed_executor.py
+2
-0
vllm/platforms/interface.py
vllm/platforms/interface.py
+2
-0
vllm/platforms/tpu.py
vllm/platforms/tpu.py
+4
-0
No files found.
vllm/executor/ray_distributed_executor.py
View file @
a8f12a63
...
@@ -340,6 +340,8 @@ class RayDistributedExecutor(DistributedExecutorBase):
...
@@ -340,6 +340,8 @@ class RayDistributedExecutor(DistributedExecutorBase):
and
v
not
in
self
.
non_carry_over_env_vars
and
v
not
in
self
.
non_carry_over_env_vars
]
]
env_vars_to_copy
.
extend
(
current_platform
.
additional_env_vars
)
# Copy existing env vars to each worker's args
# Copy existing env vars to each worker's args
for
args
in
all_args_to_update_environment_variables
:
for
args
in
all_args_to_update_environment_variables
:
# TODO: refactor platform-specific env vars
# TODO: refactor platform-specific env vars
...
...
vllm/platforms/interface.py
View file @
a8f12a63
...
@@ -112,6 +112,8 @@ class Platform:
...
@@ -112,6 +112,8 @@ class Platform:
supported_quantization
:
list
[
str
]
=
[]
supported_quantization
:
list
[
str
]
=
[]
additional_env_vars
:
list
[
str
]
=
[]
def
is_cuda
(
self
)
->
bool
:
def
is_cuda
(
self
)
->
bool
:
return
self
.
_enum
==
PlatformEnum
.
CUDA
return
self
.
_enum
==
PlatformEnum
.
CUDA
...
...
vllm/platforms/tpu.py
View file @
a8f12a63
...
@@ -29,6 +29,10 @@ class TpuPlatform(Platform):
...
@@ -29,6 +29,10 @@ class TpuPlatform(Platform):
"tpu_int8"
,
"compressed-tensors"
,
"compressed_tensors"
"tpu_int8"
,
"compressed-tensors"
,
"compressed_tensors"
]
]
additional_env_vars
:
list
[
str
]
=
[
"TPU_CHIPS_PER_HOST_BOUNDS"
,
"TPU_HOST_BOUNDS"
]
@
classmethod
@
classmethod
def
get_attn_backend_cls
(
cls
,
selected_backend
:
_Backend
,
head_size
:
int
,
def
get_attn_backend_cls
(
cls
,
selected_backend
:
_Backend
,
head_size
:
int
,
dtype
:
torch
.
dtype
,
kv_cache_dtype
:
Optional
[
str
],
dtype
:
torch
.
dtype
,
kv_cache_dtype
:
Optional
[
str
],
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment