Unverified Commit 53179026 authored by Ke Bao's avatar Ke Bao Committed by GitHub
Browse files

Add test for fp8 torch compile (#3246)

parent d7c0b32f
......@@ -62,7 +62,12 @@ class TestDeepseekV3(unittest.TestCase):
cls.model,
cls.base_url,
timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
other_args=["--trust-remote-code"],
other_args=[
"--trust-remote-code",
"--enable-torch-compile",
"--cuda-graph-max-bs",
"2",
],
)
@classmethod
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment