Commit 52647592 authored by huangwb
Browse files

fix qwen2 sliding_window logic bug

parent aac64dda
...@@ -527,6 +527,8 @@ def get_model( ...@@ -527,6 +527,8 @@ def get_model(
if model_type == "qwen2": if model_type == "qwen2":
sliding_window = config_dict.get("sliding_window", -1) sliding_window = config_dict.get("sliding_window", -1)
use_sliding_window = config_dict.get("use_sliding_window", False)
sliding_window = sliding_window if use_sliding_window else None
if ( if (
(sliding_window is None or sliding_window == -1) and FLASH_ATTENTION (sliding_window is None or sliding_window == -1) and FLASH_ATTENTION
) or HAS_FLASH_ATTN_V2_CUDA: ) or HAS_FLASH_ATTN_V2_CUDA:
......
...@@ -54,6 +54,7 @@ class FlashQwen2(BaseFlashMistral): ...@@ -54,6 +54,7 @@ class FlashQwen2(BaseFlashMistral):
) )
config.quantize = quantize config.quantize = quantize
config.use_medusa = use_medusa config.use_medusa = use_medusa
config.sliding_window = config.sliding_window if config.use_sliding_window else None
# Set context windows # Set context windows
if config.sliding_window is not None: if config.sliding_window is not None:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment