Minor

d359cda5 · Woosuk Kwon · 2f49f155 · d359cda5 · d359cda5 · d359cda5
Commit d359cda5 authored Mar 26, 2023 by Woosuk Kwon
Showing with 5 additions and 4 deletions

cacheflow/master/block_manager.py +3 -3

cacheflow/models/sample.py +1 -0

cacheflow/sequence.py +1 -1

No files found.
--- a/cacheflow/master/block_manager.py
+++ b/cacheflow/master/block_manager.py
@@ -7,7 +7,7 @@ from cacheflow.sequence import SequenceStatus
 from cacheflow.utils import Device


-class BlockManager:
+class BlockAllocator:

    def __init__(
        self,
@@ -65,8 +65,8 @@ class BlockSpaceManager:
        self.num_total_gpu_blocks = num_gpu_blocks
        self.num_total_cpu_blocks = num_cpu_blocks

-        self.gpu_allocator = BlockManager(Device.GPU, block_size, num_gpu_blocks)
-        self.cpu_allocator = BlockManager(Device.CPU, block_size, num_cpu_blocks)
+        self.gpu_allocator = BlockAllocator(Device.GPU, block_size, num_gpu_blocks)
+        self.cpu_allocator = BlockAllocator(Device.CPU, block_size, num_cpu_blocks)

        # Mapping: seq_id -> BlockTable.
        self.block_tables: Dict[int, BlockTable] = {}

--- a/cacheflow/models/sample.py
+++ b/cacheflow/models/sample.py
@@ -8,6 +8,7 @@ from cacheflow.sampling_params import SamplingParams
 from cacheflow.sequence import SequenceOutputs
 from cacheflow.parallel_utils.tensor_parallel import gather_from_tensor_model_parallel_region

+
 class Sampler(nn.Module):

    def __init__(self) -> None:

--- a/cacheflow/sequence.py
+++ b/cacheflow/sequence.py
@@ -30,7 +30,7 @@ class Sequence:

        self.status = SequenceStatus.PENDING
        self.output_logprobs: List[Dict[int, float]] = []
-        self.cumulative_logprobs = 1.0
+        self.cumulative_logprobs = 0.0

    def add_block(self) -> None:
        block = LogicalTokenBlock(