Unverified commit ea34350d, authored by Lianmin Zheng and committed by GitHub
Browse files

Rename double sparsity config file (#2188)

parent 1605ae12
...@@ -84,7 +84,7 @@ jobs: ...@@ -84,7 +84,7 @@ jobs:
timeout-minutes: 25 timeout-minutes: 25
run: | run: |
cd test/srt cd test/srt
python3 run_suite.py --suite minimal --range-begin 14 --range-end 21 python3 run_suite.py --suite minimal --range-begin 14 --range-end 23
unit-test-backend-part-4: unit-test-backend-part-4:
if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request' if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
...@@ -101,7 +101,7 @@ jobs: ...@@ -101,7 +101,7 @@ jobs:
timeout-minutes: 25 timeout-minutes: 25
run: | run: |
cd test/srt cd test/srt
python3 run_suite.py --suite minimal --range-begin 21 python3 run_suite.py --suite minimal --range-begin 23
unit-test-backend-2-gpu-part-1: unit-test-backend-2-gpu-part-1:
if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request' if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
......
...@@ -18,7 +18,9 @@ class TestDoubleSparsity(unittest.TestCase): ...@@ -18,7 +18,9 @@ class TestDoubleSparsity(unittest.TestCase):
cls.model = DEFAULT_MODEL_NAME_FOR_TEST cls.model = DEFAULT_MODEL_NAME_FOR_TEST
cls.base_url = DEFAULT_URL_FOR_TEST cls.base_url = DEFAULT_URL_FOR_TEST
dirpath = os.path.dirname(__file__) dirpath = os.path.dirname(__file__)
config_file = os.path.join(dirpath, "Llama-3.1-8B-Instruct.json") config_file = os.path.join(
dirpath, "double-sparsity-config-Llama-3.1-8B-Instruct.json"
)
# NOTE: Generate the config file by running https://github.com/andy-yang-1/DoubleSparse/blob/main/evaluation/group_channel_config.py # NOTE: Generate the config file by running https://github.com/andy-yang-1/DoubleSparse/blob/main/evaluation/group_channel_config.py
cls.process = popen_launch_server( cls.process = popen_launch_server(
cls.model, cls.model,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment