Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
cf1d8464
Commit
cf1d8464
authored
May 09, 2025
by
lizhigong
Browse files
debug on v0.8.5
parent
29e922ac
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
0 additions
and
10 deletions
+0
-10
vllm/zero_overhead/llm_engine.py
vllm/zero_overhead/llm_engine.py
+0
-10
No files found.
vllm/zero_overhead/llm_engine.py
View file @
cf1d8464
...
@@ -52,7 +52,6 @@ class ZeroOverheadEngine(LLMEngine):
...
@@ -52,7 +52,6 @@ class ZeroOverheadEngine(LLMEngine):
log_stats
:
bool
,
log_stats
:
bool
,
usage_context
:
UsageContext
=
UsageContext
.
ENGINE_CONTEXT
,
usage_context
:
UsageContext
=
UsageContext
.
ENGINE_CONTEXT
,
stat_loggers
:
Optional
[
Dict
[
str
,
StatLoggerBase
]]
=
None
,
stat_loggers
:
Optional
[
Dict
[
str
,
StatLoggerBase
]]
=
None
,
input_registry
:
InputRegistry
=
INPUT_REGISTRY
,
mm_registry
:
MultiModalRegistry
=
MULTIMODAL_REGISTRY
,
mm_registry
:
MultiModalRegistry
=
MULTIMODAL_REGISTRY
,
use_cached_outputs
:
bool
=
False
,
use_cached_outputs
:
bool
=
False
,
)
->
None
:
)
->
None
:
...
@@ -113,10 +112,6 @@ class ZeroOverheadEngine(LLMEngine):
...
@@ -113,10 +112,6 @@ class ZeroOverheadEngine(LLMEngine):
self
.
tokenizer
,
self
.
tokenizer
,
mm_registry
)
mm_registry
)
self
.
input_registry
=
input_registry
self
.
input_processor
=
input_registry
.
create_input_processor
(
self
.
model_config
)
self
.
model_executor
=
executor_class
(
vllm_config
=
vllm_config
,
)
self
.
model_executor
=
executor_class
(
vllm_config
=
vllm_config
,
)
if
self
.
model_config
.
runner_type
!=
"pooling"
:
if
self
.
model_config
.
runner_type
!=
"pooling"
:
...
@@ -159,11 +154,6 @@ class ZeroOverheadEngine(LLMEngine):
...
@@ -159,11 +154,6 @@ class ZeroOverheadEngine(LLMEngine):
self
.
parallel_config
.
disable_custom_all_reduce
,
self
.
parallel_config
.
disable_custom_all_reduce
,
})
})
if
self
.
tokenizer
:
# Ping the tokenizer to ensure liveness if it runs in a
# different process.
self
.
tokenizer
.
ping
()
self
.
cached_scheduler_outputs
=
[
self
.
cached_scheduler_outputs
=
[
SchedulerOutputState
()
SchedulerOutputState
()
for
_
in
range
(
self
.
parallel_config
.
pipeline_parallel_size
)
for
_
in
range
(
self
.
parallel_config
.
pipeline_parallel_size
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment