fix: trtllm has moved to version 1.2+ to enable cuda graph testing; fixed path...

fix: trtllm has moved to version 1.2+ to enable cuda graph testing; fixed path to config.yaml (#5133)

fix: trtllm has moved to version 1.2+ to enable cuda graph testing; fixed path...
fix: trtllm has moved to version 1.2+ to enable cuda graph testing; fixed path to config.yaml (#5133)
6be9c9a4 · Kyle McGill · GitHub · 5a158552 · 6be9c9a4
Unverified Commit 6be9c9a4 authored Jan 05, 2026 by Kyle McGill Committed by GitHub Jan 05, 2026
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 10 deletions

tests/kvbm_integration/test_cuda_graph.py tests/kvbm_integration/test_cuda_graph.py +4 -10

No files found.
--- a/tests/kvbm_integration/test_cuda_graph.py
+++ b/tests/kvbm_integration/test_cuda_graph.py
@@ -151,9 +151,6 @@ def send_completion_request(
 @pytest.mark.nightly
 @pytest.mark.slow
 @pytest.mark.gpu_1
-@pytest.mark.skip(
-    reason="Enable these tests once `main` dynamo upgrades to TRTLLM 1.2+"
-)
 def test_kvbm_without_cuda_graph_enabled(request, runtime_services):
    """
    End-to-end test for TRTLLM worker with cuda_graph_config not defined and
@@ -168,12 +165,12 @@ def test_kvbm_without_cuda_graph_enabled(request, runtime_services):
    with DynamoFrontendProcess(request):
        logger.info("Frontend started.")
-        engine_config_with_cuda_graph_and_kvbm = (
+        engine_config_without_cuda_graph_and_kvbm = (
-            "tests/kvbm/engine_config_without_cuda_graph_and_kvbm.yaml"
+            "tests/kvbm_integration/engine_config_without_cuda_graph_and_kvbm.yaml"
        )
        logger.info("Starting worker...")
        with DynamoWorkerProcess(
-            request, "decode", engine_config_with_cuda_graph_and_kvbm
+            request, "decode", engine_config_without_cuda_graph_and_kvbm
        ) as worker:
            logger.info(f"Worker PID: {worker.get_pid()}")
@@ -190,9 +187,6 @@ def test_kvbm_without_cuda_graph_enabled(request, runtime_services):
 @pytest.mark.slow
 @pytest.mark.nightly
 @pytest.mark.gpu_1
-@pytest.mark.skip(
-    reason="Enable these tests once dynamo `main` upgrades to TRTLLM 1.2+"
-)
 def test_kvbm_with_cuda_graph_enabled(request, runtime_services):
    """
    End-to-end test for TRTLLM worker with cuda_graph_config defined and
@@ -208,7 +202,7 @@ def test_kvbm_with_cuda_graph_enabled(request, runtime_services):
        logger.info("Frontend started.")
        engine_config_with_cuda_graph_and_kvbm = (
-            "tests/kvbm/engine_config_with_cuda_graph_and_kvbm.yaml"
+            "tests/kvbm_integration/engine_config_with_cuda_graph_and_kvbm.yaml"
        )
        logger.info("Starting worker...")
        with DynamoWorkerProcess(