"...ssh:/git@developer.sourcefind.cn:2222/OpenDAS/dynamo.git" did not exist on "5e326d6f3ec28d5e1f814a4991450fc0414db46e"
Unverified commit 21c4739b, authored by Jacky, committed by GitHub
Browse files

test: Increase Cancellation Tests sequence and long prompt length (#4608)


Signed-off-by: Jacky <18255193+kthui@users.noreply.github.com>
parent 5652d670
...@@ -47,7 +47,9 @@ class DynamoWorkerProcess(ManagedProcess): ...@@ -47,7 +47,9 @@ class DynamoWorkerProcess(ManagedProcess):
"--free-gpu-memory-fraction", "--free-gpu-memory-fraction",
"0.45", "0.45",
"--max-seq-len", "--max-seq-len",
"8192", "16384",
"--max-num-tokens",
"16384",
"--migration-limit", "--migration-limit",
migration_limit, migration_limit,
] ]
......
...@@ -35,7 +35,7 @@ class DynamoWorkerProcess(ManagedProcess): ...@@ -35,7 +35,7 @@ class DynamoWorkerProcess(ManagedProcess):
"--gpu-memory-utilization", "--gpu-memory-utilization",
"0.45", "0.45",
"--max-model-len", "--max-model-len",
"8192", "16384",
"--migration-limit", "--migration-limit",
"3", "3",
] ]
......
...@@ -253,14 +253,14 @@ def send_cancellable_request( ...@@ -253,14 +253,14 @@ def send_cancellable_request(
""" """
prompt = "Tell me a very long and detailed story about the history of artificial intelligence, including all major milestones, researchers, and breakthroughs?" prompt = "Tell me a very long and detailed story about the history of artificial intelligence, including all major milestones, researchers, and breakthroughs?"
if use_long_prompt: if use_long_prompt:
prompt += " Make sure it is" + " long" * 8000 + "!" prompt += " Make sure it is" + " long" * 16000 + "!"
if request_type == "completion": if request_type == "completion":
return send_completion_request(prompt, 8192) return send_completion_request(prompt, 16384)
elif request_type == "chat_completion": elif request_type == "chat_completion":
return send_chat_completion_request(prompt, 8192, stream=False) return send_chat_completion_request(prompt, 16384, stream=False)
elif request_type == "chat_completion_stream": elif request_type == "chat_completion_stream":
return send_chat_completion_request(prompt, 8192, stream=True) return send_chat_completion_request(prompt, 16384, stream=True)
else: else:
raise ValueError(f"Unknown request type: {request_type}") raise ValueError(f"Unknown request type: {request_type}")
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment