Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
d06e8240
Unverified
Commit
d06e8240
authored
Jan 17, 2025
by
Chen Zhang
Committed by
GitHub
Jan 16, 2025
Browse files
[Bugfix] Set enforce_eager automatically for mllama (#12127)
Signed-off-by: Chen Zhang <zhangch99@outlook.com>
parent
62b06ba2
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing 3 changed files with 5 additions and 5 deletions
+5
-5
examples/offline_inference/vision_language.py
examples/offline_inference/vision_language.py
+0
-1
examples/offline_inference/vision_language_multi_image.py
examples/offline_inference/vision_language_multi_image.py
+0
-1
vllm/config.py
vllm/config.py
+5
-3
No files found.
examples/offline_inference/vision_language.py
View file @
d06e8240
...
...
@@ -325,7 +325,6 @@ def run_mllama(question: str, modality: str):
         model=model_name,
         max_model_len=4096,
         max_num_seqs=16,
-        enforce_eager=True,
         disable_mm_preprocessor_cache=args.disable_mm_preprocessor_cache,
     )
...
...
examples/offline_inference/vision_language_multi_image.py
View file @
d06e8240
...
...
@@ -186,7 +186,6 @@ def load_mllama(question, image_urls: List[str]) -> ModelRequestData:
         model=model_name,
         max_model_len=4096,
         max_num_seqs=16,
-        enforce_eager=True,
         limit_mm_per_prompt={"image": len(image_urls)},
     )
...
...
vllm/config.py
View file @
d06e8240
...
...
@@ -607,10 +607,12 @@ class ModelConfig:
         self.max_seq_len_to_capture = min(self.max_seq_len_to_capture,
                                           self.max_model_len)
-        if (self.hf_config.model_type == 'deepseek_v3'
+        MODEL_NOT_SUPPORT_CUDA_GRAPH = ['deepseek_v3', 'mllama']
+        if (self.hf_config.model_type in MODEL_NOT_SUPPORT_CUDA_GRAPH
                 and not self.enforce_eager):
-            logger.warning("CUDA graph is not supported for Deepseek V3 yet, "
-                           "fallback to the eager mode.")
+            logger.warning(
+                "CUDA graph is not supported for %s yet, fallback to the eager "
+                "mode.", self.hf_config.model_type)
             self.enforce_eager = True
     def _verify_bnb_config(self) -> None:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment