Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
4d4c6fe3
Commit
4d4c6fe3
authored
Feb 26, 2025
by
zhuwenwen
Browse files
add cudagraph
parent
537e2d9c
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
1 addition
and
3 deletions
+1
-3
vllm/config.py
vllm/config.py
+1
-2
vllm/engine/arg_utils.py
vllm/engine/arg_utils.py
+0
-1
No files found.
vllm/config.py
View file @
4d4c6fe3
...
...
@@ -322,8 +322,7 @@ class ModelConfig:
# Set enforce_eager to False if the value is unset.
if
self
.
enforce_eager
is
None
:
# self.enforce_eager = False
self
.
enforce_eager
=
True
self
.
enforce_eager
=
False
sliding_window
=
getattr
(
self
.
hf_text_config
,
"sliding_window"
,
None
)
has_interleaved_attention
=
(
sliding_window
is
not
None
)
and
(
...
...
vllm/engine/arg_utils.py
View file @
4d4c6fe3
...
...
@@ -565,7 +565,6 @@ class EngineArgs:
'parsed into a dictionary.'
)
parser
.
add_argument
(
'--enforce-eager'
,
action
=
'store_true'
,
default
=
True
,
help
=
'Always use eager-mode PyTorch. If False, '
'will use eager mode and CUDA graph in hybrid '
'for maximal performance and flexibility.'
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment