"vscode:/vscode.git/clone" did not exist on "34a8559be7473e3ba34e9b9e13827e60651e3b41"
Commit aa389394 authored by zhuwenwen's avatar zhuwenwen
Browse files

update torch version

parent 3bb51ca2
...@@ -11,7 +11,7 @@ pytest-asyncio ...@@ -11,7 +11,7 @@ pytest-asyncio
tensorizer>=2.9.0 tensorizer>=2.9.0
setuptools_scm>=8 setuptools_scm>=8
torch == 2.4.0 torch == 2.4.1
triton == 3.0.0 triton == 3.0.0
flash_attn == 2.6.1 flash_attn == 2.6.1
lmslim == 0.2.0 lmslim == 0.2.0
\ No newline at end of file
...@@ -10,7 +10,7 @@ def run_and_test_dummy_opt_api_server(model, tp=1): ...@@ -10,7 +10,7 @@ def run_and_test_dummy_opt_api_server(model, tp=1):
"--gpu-memory-utilization", "--gpu-memory-utilization",
"0.10", "0.10",
"--dtype", "--dtype",
"float32", "float16",# "float32",
"--chat-template", "--chat-template",
str(chatml_jinja_path), str(chatml_jinja_path),
"--load-format", "--load-format",
...@@ -33,7 +33,7 @@ def run_and_test_dummy_opt_api_server(model, tp=1): ...@@ -33,7 +33,7 @@ def run_and_test_dummy_opt_api_server(model, tp=1):
) )
generated_text = completion.choices[0].message.content generated_text = completion.choices[0].message.content
assert generated_text is not None assert generated_text is not None
# make sure only the first token is generated # make sure only the first token is generatedvim
rest = generated_text.replace("<s>", "") rest = generated_text.replace("<s>", "")
assert rest == "" assert rest == ""
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment