Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
e19ddc39
Commit
e19ddc39
authored
Apr 11, 2025
by
zhuwenwen
Browse files
support v1 engine
parent
ac61f64c
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
7 additions
and
5 deletions
+7
-5
vllm/config.py
vllm/config.py
+3
-1
vllm/worker/worker_base.py
vllm/worker/worker_base.py
+4
-4
No files found.
vllm/config.py
View file @
e19ddc39
...
@@ -3610,7 +3610,9 @@ class VllmConfig:
...
@@ -3610,7 +3610,9 @@ class VllmConfig:
self
.
compilation_config
.
cudagraph_num_of_warmups
=
1
self
.
compilation_config
.
cudagraph_num_of_warmups
=
1
self
.
compilation_config
.
pass_config
.
enable_fusion
=
False
self
.
compilation_config
.
pass_config
.
enable_fusion
=
False
self
.
compilation_config
.
pass_config
.
enable_noop
=
False
self
.
compilation_config
.
pass_config
.
enable_noop
=
False
self
.
compilation_config
.
level
=
CompilationLevel
.
PIECEWISE
# TODO
# self.compilation_config.level = CompilationLevel.PIECEWISE
self
.
compilation_config
.
level
=
CompilationLevel
.
NO_COMPILATION
self
.
compilation_config
.
set_splitting_ops_for_v1
()
self
.
compilation_config
.
set_splitting_ops_for_v1
()
self
.
_set_cudagraph_sizes
()
self
.
_set_cudagraph_sizes
()
...
...
vllm/worker/worker_base.py
View file @
e19ddc39
...
@@ -129,10 +129,10 @@ class WorkerBase:
...
@@ -129,10 +129,10 @@ class WorkerBase:
def
list_loras
(
self
)
->
Set
[
int
]:
def
list_loras
(
self
)
->
Set
[
int
]:
raise
NotImplementedError
raise
NotImplementedError
@
property
#
@property
@
abstractmethod
#
@abstractmethod
def
cache_engines
(
self
)
->
Optional
[
List
[
CacheEngine
]]:
#
def cache_engines(self) -> Optional[List[CacheEngine]]:
raise
NotImplementedError
#
raise NotImplementedError
@
property
@
property
def
vocab_size
(
self
)
->
int
:
def
vocab_size
(
self
)
->
int
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment