Unverified commit 685c99ee, authored by Yue Zhang, committed by GitHub
Browse files

[KV offload] Offloading connector async scheduling support (#27648)


Signed-off-by: KevinCheung2259 <2651309292@qq.com>
Co-authored-by: Nick Hill <nhill@redhat.com>
parent 1e88fb75
...@@ -274,8 +274,8 @@ class OffloadingConnectorScheduler: ...@@ -274,8 +274,8 @@ class OffloadingConnectorScheduler:
if num_new_blocks <= 0: if num_new_blocks <= 0:
continue continue
num_gpu_blocks = num_blocks * self.block_size_factor # NOTE: In async scheduling, placeholders may temporarily make
assert len(req.block_hashes) >= num_gpu_blocks # len(req.block_hashes) < num_blocks * self.block_size_factor.
new_block_hashes = self._get_block_hashes( new_block_hashes = self._get_block_hashes(
req, start_idx=start_block_idx, end_idx=num_blocks req, start_idx=start_block_idx, end_idx=num_blocks
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment