Unverified commit dac914b0, authored by Chen Zhang, committed by GitHub
Browse files

[Bugfix] use blockmanagerv1 for encoder-decoder (#9084)


Co-authored-by: Roger Wang <ywang@roblox.com>
parent a95354a3
...@@ -903,6 +903,11 @@ class EngineArgs: ...@@ -903,6 +903,11 @@ class EngineArgs:
"--enable-prefix-caching is currently not " "--enable-prefix-caching is currently not "
"supported for multimodal models and has been disabled.") "supported for multimodal models and has been disabled.")
self.enable_prefix_caching = False self.enable_prefix_caching = False
if model_config.is_encoder_decoder_model:
logger.warning(
"Block Manager v2 does not support encoder-decoder models"
" currently. Using Block Manager v1 as fallback.")
self.use_v2_block_manager = False
cache_config = CacheConfig( cache_config = CacheConfig(
block_size=self.block_size if self.device != "neuron" else block_size=self.block_size if self.device != "neuron" else
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment