Unverified commit 18e7cbbb, authored by Cyrus Leung, committed by GitHub
Browse files

[Bugfix] Fix startup hang for Granite Speech (#33699)


Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
parent f0d52517
...@@ -54,17 +54,17 @@ class MultiModalBudget: ...@@ -54,17 +54,17 @@ class MultiModalBudget:
self.max_model_len = model_config.max_model_len self.max_model_len = model_config.max_model_len
self.max_num_reqs = scheduler_config.max_num_seqs self.max_num_reqs = scheduler_config.max_num_seqs
cache = mm_registry.processor_only_cache_from_config(vllm_config) with set_default_torch_num_threads(): # Avoid hang during startup
processor = mm_registry.create_processor(model_config, cache=cache) cache = mm_registry.processor_only_cache_from_config(vllm_config)
processor = mm_registry.create_processor(model_config, cache=cache)
self.cache = cache self.cache = cache
self.mm_limits = mm_limits = processor.info.allowed_mm_limits self.mm_limits = mm_limits = processor.info.allowed_mm_limits
active_modalities = { active_modalities = {
modality for modality, limit in mm_limits.items() if limit > 0 modality for modality, limit in mm_limits.items() if limit > 0
} }
with set_default_torch_num_threads(): # Avoid hang during startup
all_mm_max_toks_per_item = get_mm_max_toks_per_item( all_mm_max_toks_per_item = get_mm_max_toks_per_item(
model_config, model_config,
mm_registry, mm_registry,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment