Unverified Commit aaa4ac1c authored by cascade's avatar cascade Committed by GitHub
Browse files

Disable prefix cache by default for benchmark (#18639)


Signed-off-by: cascade812 <cascade812@outlook.com>
parent 06a03380
......@@ -189,5 +189,8 @@ if __name__ == "__main__":
)
parser = EngineArgs.add_cli_args(parser)
# V1 enables prefix caching by default which skews the latency
# numbers. We need to disable prefix caching by default.
parser.set_defaults(enable_prefix_caching=False)
args = parser.parse_args()
main(args)
......@@ -80,6 +80,9 @@ def add_cli_args(parser: argparse.ArgumentParser):
)
parser = EngineArgs.add_cli_args(parser)
# V1 enables prefix caching by default which skews the latency
# numbers. We need to disable prefix caching by default, so the
# parser-level default for this benchmark is overridden to False.
parser.set_defaults(enable_prefix_caching=False)
def main(args: argparse.Namespace):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment