Unverified Commit f5d72b2f authored by sroy745's avatar sroy745 Committed by GitHub
Browse files

[Core] Make BlockSpaceManagerV2 the default BlockManager to use. (#8678)

parent 83caf35e
...@@ -970,7 +970,7 @@ class SchedulerConfig: ...@@ -970,7 +970,7 @@ class SchedulerConfig:
max_num_batched_tokens: Optional[int], max_num_batched_tokens: Optional[int],
max_num_seqs: int, max_num_seqs: int,
max_model_len: int, max_model_len: int,
use_v2_block_manager: bool = False, use_v2_block_manager: bool = True,
num_lookahead_slots: int = 0, num_lookahead_slots: int = 0,
delay_factor: float = 0.0, delay_factor: float = 0.0,
enable_chunked_prefill: bool = False, enable_chunked_prefill: bool = False,
......
...@@ -107,7 +107,7 @@ class EngineArgs: ...@@ -107,7 +107,7 @@ class EngineArgs:
block_size: int = 16 block_size: int = 16
enable_prefix_caching: bool = False enable_prefix_caching: bool = False
disable_sliding_window: bool = False disable_sliding_window: bool = False
use_v2_block_manager: bool = False use_v2_block_manager: bool = True
swap_space: float = 4 # GiB swap_space: float = 4 # GiB
cpu_offload_gb: float = 0 # GiB cpu_offload_gb: float = 0 # GiB
gpu_memory_utilization: float = 0.90 gpu_memory_utilization: float = 0.90
...@@ -369,9 +369,12 @@ class EngineArgs: ...@@ -369,9 +369,12 @@ class EngineArgs:
action='store_true', action='store_true',
help='Disables sliding window, ' help='Disables sliding window, '
'capping to sliding window size') 'capping to sliding window size')
parser.add_argument('--use-v2-block-manager', parser.add_argument(
'--use-v2-block-manager',
default=EngineArgs.use_v2_block_manager,
action='store_true', action='store_true',
help='Use BlockSpaceMangerV2.') help='Use BlockSpaceMangerV2. By default this is set to True. '
'Set to False to use BlockSpaceManagerV1')
parser.add_argument( parser.add_argument(
'--num-lookahead-slots', '--num-lookahead-slots',
type=int, type=int,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment