"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nToday is a sunny day and I like[/INST]"
'[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nWhat are the mental triggers in Jeff Walker\'s Product Launch Formula and "Launch" book?[/INST]',
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nSummarize Russell Brunson's Perfect Webinar Script...[/INST]",
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nwho are you?[/INST]",
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nwhere are you from?[/INST]",
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nToday is a sunny day and I like[/INST]"
'[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nWhat are the mental triggers in Jeff Walker\'s Product Launch Formula and "Launch" book?[/INST]',
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nSummarize Russell Brunson's Perfect Webinar Script...[/INST]",
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nwho are you?[/INST]",
"[INST] <<SYS>>\\nYou are a helpful assistant.\\n<</SYS>>\\nwhere are you from?[/INST]",
]
@classmethod
defsetUpClass(cls):
cls.base_url=DEFAULT_URL_FOR_TEST
...
...
@@ -127,17 +176,17 @@ class TestEAGLEServer(unittest.TestCase):
"--speculative-draft-model-path",
DEFAULT_EAGLE_DRAFT_MODEL_FOR_TEST,
"--speculative-num-steps",
"5",
5,
"--speculative-eagle-topk",
"8",
8,
"--speculative-num-draft-tokens",
"64",
64,
"--mem-fraction-static",
"0.7",
0.7,
"--chunked-prefill-size",
"128",
"--cuda-graph-max-bs",
"32",
128,
"--max-running-requests",
8,
],
)
...
...
@@ -147,7 +196,7 @@ class TestEAGLEServer(unittest.TestCase):
defsend_request(self):
time.sleep(random.uniform(0,2))
forpromptinprompts:
forpromptinself.PROMPTS:
url=self.base_url+"/generate"
data={
"text":prompt,
...
...
@@ -160,7 +209,7 @@ class TestEAGLEServer(unittest.TestCase):
assertresponse.status_code==200
defsend_requests_abort(self):
forpromptinprompts:
forpromptinself.PROMPTS:
try:
time.sleep(random.uniform(0,2))
url=self.base_url+"/generate"
...
...
@@ -192,6 +241,8 @@ class TestEAGLEServer(unittest.TestCase):