Unverified Commit e322a94d authored by Lifu Huang's avatar Lifu Huang Committed by GitHub
Browse files

Reduce CI duration of test_lora_update. (#9024)

parent 2c7f01bc
...@@ -229,6 +229,53 @@ BASIC_TESTS = [ ...@@ -229,6 +229,53 @@ BASIC_TESTS = [
] ]
), ),
), ),
Operation(
type=OperationType.UNLOAD,
data="Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16",
),
Operation(
type=OperationType.UNLOAD,
data="pbevan11/llama-3.1-8b-ocr-correction",
),
Operation(
type=OperationType.FORWARD,
data=create_batch_data(
"Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16"
),
expected_error="not loaded",
),
Operation(
type=OperationType.FORWARD,
data=create_batch_data("pbevan11/llama-3.1-8b-ocr-correction"),
expected_error="not loaded",
),
Operation(
type=OperationType.FORWARD,
data=create_batch_data(None),
),
Operation(
type=OperationType.LOAD,
data="philschmid/code-llama-3-1-8b-text-to-sql-lora",
),
Operation(
type=OperationType.LOAD,
data="Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16",
),
Operation(
type=OperationType.LOAD,
data="pbevan11/llama-3.1-8b-ocr-correction",
),
Operation(
type=OperationType.FORWARD,
data=create_batch_data(
[
"philschmid/code-llama-3-1-8b-text-to-sql-lora",
"Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16",
"pbevan11/llama-3.1-8b-ocr-correction",
None,
]
),
),
], ],
), ),
] ]
...@@ -1194,7 +1241,7 @@ class TestLoRADynamicUpdate(CustomTestCase): ...@@ -1194,7 +1241,7 @@ class TestLoRADynamicUpdate(CustomTestCase):
""" """
Test dynamic LoRA updates in engine mode. Test dynamic LoRA updates in engine mode.
""" """
test_cases = ALL_TESTS test_cases = BASIC_TESTS if is_in_ci() else ALL_TESTS
self._run_dynamic_adapter_updates( self._run_dynamic_adapter_updates(
mode=LoRAUpdateTestSessionMode.ENGINE, mode=LoRAUpdateTestSessionMode.ENGINE,
test_cases=test_cases, test_cases=test_cases,
...@@ -1204,9 +1251,7 @@ class TestLoRADynamicUpdate(CustomTestCase): ...@@ -1204,9 +1251,7 @@ class TestLoRADynamicUpdate(CustomTestCase):
""" """
Test dynamic LoRA updates in server mode. Test dynamic LoRA updates in server mode.
""" """
# In CI, we only run the first test case to save time, as the engine test should be mostly sufficient for ensuring correctness.
test_cases = BASIC_TESTS if is_in_ci() else ALL_TESTS test_cases = BASIC_TESTS if is_in_ci() else ALL_TESTS
self._run_dynamic_adapter_updates( self._run_dynamic_adapter_updates(
mode=LoRAUpdateTestSessionMode.SERVER, test_cases=test_cases mode=LoRAUpdateTestSessionMode.SERVER, test_cases=test_cases
) )
......
...@@ -21,7 +21,7 @@ suites = { ...@@ -21,7 +21,7 @@ suites = {
TestFile("lora/test_lora_backend.py", 99), TestFile("lora/test_lora_backend.py", 99),
TestFile("lora/test_multi_lora_backend.py", 60), TestFile("lora/test_multi_lora_backend.py", 60),
TestFile("lora/test_lora_cuda_graph.py", 250), TestFile("lora/test_lora_cuda_graph.py", 250),
TestFile("lora/test_lora_update.py", 800), TestFile("lora/test_lora_update.py", 400),
TestFile("lora/test_lora_qwen3.py", 97), TestFile("lora/test_lora_qwen3.py", 97),
TestFile("models/test_embedding_models.py", 73), TestFile("models/test_embedding_models.py", 73),
# TestFile("models/test_clip_models.py", 52), # TestFile("models/test_clip_models.py", 52),
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment