"""Token block containers: LogicalTokenBlock and PhysicalTokenBlock."""

from typing import List

from cacheflow.utils import Device

BLANK_TOKEN_ID = -1


class LogicalTokenBlock:
    """A fixed-capacity buffer of token IDs that is filled front to back.

    Slots that have not been written yet hold ``BLANK_TOKEN_ID``;
    ``num_tokens`` counts how many leading slots contain real tokens.
    """

    def __init__(
        self,
        block_number: int,
        block_size: int,
    ) -> None:
        """Create an empty block.

        Args:
            block_number: Identifier stored on the block unchanged.
            block_size: Number of token slots the block provides.
        """
        self.block_number = block_number
        self.block_size = block_size

        # Every slot starts out blank; appends overwrite them in order.
        self.token_ids = [BLANK_TOKEN_ID] * block_size
        self.num_tokens = 0

    def is_empty(self) -> bool:
        """Return True when no token has been appended yet."""
        return self.num_tokens == 0

    def get_num_empty_slots(self) -> int:
        """Return how many more tokens fit into this block."""
        return self.block_size - self.num_tokens

    def is_full(self) -> bool:
        """Return True when every slot holds a token."""
        return self.num_tokens == self.block_size

    def append_tokens(self, token_ids: List[int]) -> None:
        """Write ``token_ids`` into the next free slots, in order.

        Args:
            token_ids: Tokens to store; must not exceed the free capacity.

        Raises:
            AssertionError: If more tokens are given than there are empty
                slots (only while assertions are enabled).
        """
        assert len(token_ids) <= self.get_num_empty_slots()
        start = self.num_tokens
        end = start + len(token_ids)
        # Equal-length slice assignment overwrites blank slots in place, so
        # the list keeps exactly `block_size` entries.
        self.token_ids[start:end] = token_ids
        self.num_tokens = end

    def get_token_ids(self) -> List[int]:
        """Return a new list with the stored tokens, excluding blank slots."""
        return self.token_ids[:self.num_tokens]

    def get_last_token_id(self) -> int:
        """Return the most recently appended token.

        Raises:
            AssertionError: If the block is empty (only while assertions are
                enabled).
        """
        assert self.num_tokens > 0
        return self.token_ids[self.num_tokens - 1]


class PhysicalTokenBlock:
    """Record describing one block on a device.

    Holds the device, the block's number and size, and a reference counter.
    The class itself never changes ``ref_count`` after construction;
    presumably an external allocator maintains it (confirm against callers).
    """

    def __init__(
        self,
        device: Device,
        block_number: int,
        block_size: int,
    ) -> None:
        """Store the block's identity with a reference count of zero.

        Args:
            device: Device value stored on the block unchanged.
            block_number: Identifier stored on the block unchanged.
            block_size: Size value stored on the block unchanged.
        """
        self.device = device
        self.block_number = block_number
        self.block_size = block_size

        # A new block starts with no references.
        self.ref_count = 0

    def __repr__(self) -> str:
        """Return a debug string with device, block number and ref count."""
        return (f'PhysicalTokenBlock(device={self.device}, '
                f'block_number={self.block_number}, '
                f'ref_count={self.ref_count})')