Unverified Commit aaa4ac1c authored by cascade's avatar cascade Committed by GitHub
Browse files

Disable prefix cache by default for benchmark (#18639)


Signed-off-by: cascade812 <cascade812@outlook.com>
parent 06a03380
...@@ -189,5 +189,8 @@ if __name__ == "__main__": ...@@ -189,5 +189,8 @@ if __name__ == "__main__":
) )
parser = EngineArgs.add_cli_args(parser) parser = EngineArgs.add_cli_args(parser)
# V1 enables prefix caching by default which skews the latency
# numbers. We need to disable prefix caching by default.
parser.set_defaults(enable_prefix_caching=False)
args = parser.parse_args() args = parser.parse_args()
main(args) main(args)
...@@ -80,6 +80,9 @@ def add_cli_args(parser: argparse.ArgumentParser): ...@@ -80,6 +80,9 @@ def add_cli_args(parser: argparse.ArgumentParser):
) )
parser = EngineArgs.add_cli_args(parser) parser = EngineArgs.add_cli_args(parser)
# V1 enables prefix caching by default which skews the latency
# numbers. We need to disable prefix caching by default.
parser.set_defaults(enable_prefix_caching=False)
def main(args: argparse.Namespace): def main(args: argparse.Namespace):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment