Commit a2a9869c authored by Woosuk Kwon
Browse files

SERVING -> RUNNING

parent 46958cf9
......@@ -95,7 +95,7 @@ class BlockSpaceManager:
# Simple heuristic: If there is at least one free block
# for each sequence, we can append.
num_free_gpu_blocks = self.gpu_allocator.get_num_free_blocks()
num_seqs = seq_group.num_seqs(status=SequenceStatus.SERVING)
num_seqs = seq_group.num_seqs(status=SequenceStatus.RUNNING)
return num_seqs <= num_free_gpu_blocks
def append(self, seq: Sequence) -> Optional[Tuple[int, int]]:
......
......@@ -7,7 +7,7 @@ from cacheflow.decoding import DecodingParams
class SequenceStatus(enum.Enum):
PENDING = enum.auto()
SERVING = enum.auto()
RUNNING = enum.auto()
SWAPPED = enum.auto()
FINISHED = enum.auto()
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment