Unverified commit 7de2ce45, authored by Baizhou Zhang and committed by GitHub
Browse files

Disable radix cache in test_lora_update.py for better stability (#9852)

parent 8c2ffaaf
...@@ -824,6 +824,7 @@ class LoRAUpdateEngineTestSession(LoRAUpdateTestSessionBase): ...@@ -824,6 +824,7 @@ class LoRAUpdateEngineTestSession(LoRAUpdateTestSessionBase):
disable_cuda_graph=self.disable_cuda_graph, disable_cuda_graph=self.disable_cuda_graph,
cuda_graph_max_bs=self.cuda_graph_max_bs, cuda_graph_max_bs=self.cuda_graph_max_bs,
enable_lora=self.enable_lora, enable_lora=self.enable_lora,
disable_radix_cache=True,
) )
self.handle.__enter__() self.handle.__enter__()
return self return self
...@@ -958,6 +959,7 @@ class LoRAUpdateServerTestSession(LoRAUpdateTestSessionBase): ...@@ -958,6 +959,7 @@ class LoRAUpdateServerTestSession(LoRAUpdateTestSessionBase):
"1", "1",
"--mem-fraction-static", "--mem-fraction-static",
str(MEM_FRACTION_STATIC), str(MEM_FRACTION_STATIC),
"--disable-radix-cache",
] ]
if self.enable_lora: if self.enable_lora:
other_args.append("--enable-lora") other_args.append("--enable-lora")
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment