"git@developer.sourcefind.cn:norm/vllm.git" did not exist on "4858f3bb45ec62fab1fc32dc26eb1e2a8e1df14b"
Unverified Commit ba69c153 authored by Nan Jiang, committed by GitHub
Browse files

[RL]: Fix error tagging in multi-stage wake up (#7812)


Co-authored-by: hebiao064 <hebiaobuaa@gmail.com>
parent 3589aa79
...@@ -2333,9 +2333,8 @@ class Scheduler( ...@@ -2333,9 +2333,8 @@ class Scheduler(
def release_memory_occupation(self, recv_req: ReleaseMemoryOccupationReqInput): def release_memory_occupation(self, recv_req: ReleaseMemoryOccupationReqInput):
tags = recv_req.tags tags = recv_req.tags
import subprocess
if tags is None: if tags is None or len(tags) == 0:
tags = [GPU_MEMORY_TYPE_WEIGHTS, GPU_MEMORY_TYPE_KV_CACHE] tags = [GPU_MEMORY_TYPE_WEIGHTS, GPU_MEMORY_TYPE_KV_CACHE]
if GPU_MEMORY_TYPE_KV_CACHE in tags: if GPU_MEMORY_TYPE_KV_CACHE in tags:
...@@ -2353,6 +2352,7 @@ class Scheduler( ...@@ -2353,6 +2352,7 @@ class Scheduler(
def resume_memory_occupation(self, recv_req: ResumeMemoryOccupationReqInput): def resume_memory_occupation(self, recv_req: ResumeMemoryOccupationReqInput):
tags = recv_req.tags tags = recv_req.tags
if tags is None or len(tags) == 0: if tags is None or len(tags) == 0:
tags = [GPU_MEMORY_TYPE_WEIGHTS, GPU_MEMORY_TYPE_KV_CACHE] tags = [GPU_MEMORY_TYPE_WEIGHTS, GPU_MEMORY_TYPE_KV_CACHE]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment