Unverified commit 21c4739b, authored by Jacky, committed by GitHub
Browse files

test: Increase Cancellation Tests sequence and long prompt length (#4608)


Signed-off-by: Jacky <18255193+kthui@users.noreply.github.com>
parent 5652d670
......@@ -47,7 +47,9 @@ class DynamoWorkerProcess(ManagedProcess):
"--free-gpu-memory-fraction",
"0.45",
"--max-seq-len",
"8192",
"16384",
"--max-num-tokens",
"16384",
"--migration-limit",
migration_limit,
]
......
......@@ -35,7 +35,7 @@ class DynamoWorkerProcess(ManagedProcess):
"--gpu-memory-utilization",
"0.45",
"--max-model-len",
"8192",
"16384",
"--migration-limit",
"3",
]
......
......@@ -253,14 +253,14 @@ def send_cancellable_request(
"""
prompt = "Tell me a very long and detailed story about the history of artificial intelligence, including all major milestones, researchers, and breakthroughs?"
if use_long_prompt:
prompt += " Make sure it is" + " long" * 8000 + "!"
prompt += " Make sure it is" + " long" * 16000 + "!"
if request_type == "completion":
return send_completion_request(prompt, 8192)
return send_completion_request(prompt, 16384)
elif request_type == "chat_completion":
return send_chat_completion_request(prompt, 8192, stream=False)
return send_chat_completion_request(prompt, 16384, stream=False)
elif request_type == "chat_completion_stream":
return send_chat_completion_request(prompt, 8192, stream=True)
return send_chat_completion_request(prompt, 16384, stream=True)
else:
raise ValueError(f"Unknown request type: {request_type}")
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment