Unverified commit 70f99382, authored by Anant Sharma, committed by GitHub
Browse files

build: enable kvbm in trtllm container (#2956)


Signed-off-by: Anant Sharma <anants@nvidia.com>
parent 2ae20102
...@@ -693,8 +693,8 @@ if [ ! -z ${RELEASE_BUILD} ]; then ...@@ -693,8 +693,8 @@ if [ ! -z ${RELEASE_BUILD} ]; then
BUILD_ARGS+=" --build-arg RELEASE_BUILD=${RELEASE_BUILD} " BUILD_ARGS+=" --build-arg RELEASE_BUILD=${RELEASE_BUILD} "
fi fi
if [[ $FRAMEWORK == "VLLM" ]]; then if [[ $FRAMEWORK == "VLLM" ]] || [[ $FRAMEWORK == "TRTLLM" ]]; then
echo "Forcing enable_kvbm to true in vLLM image build" echo "Forcing enable_kvbm to true in ${FRAMEWORK} image build"
ENABLE_KVBM=true ENABLE_KVBM=true
fi fi
......
...@@ -775,7 +775,6 @@ class TestDeterminism: ...@@ -775,7 +775,6 @@ class TestDeterminism:
], ],
indirect=True, indirect=True,
) )
@pytest.mark.vllm
def test_determinism_with_cache_reset(self, tester, llm_server, runtime_services): def test_determinism_with_cache_reset(self, tester, llm_server, runtime_services):
"""Test determinism across cache reset: run test with warmup, reset cache, run again without warmup.""" """Test determinism across cache reset: run test with warmup, reset cache, run again without warmup."""
print("\n" + "=" * 70) print("\n" + "=" * 70)
...@@ -916,6 +915,7 @@ class TestDeterminism: ...@@ -916,6 +915,7 @@ class TestDeterminism:
"num_prompts", "num_prompts",
[int(x) for x in os.environ.get("KVBM_IFEVAL_PROMPTS", "120").split(",")], [int(x) for x in os.environ.get("KVBM_IFEVAL_PROMPTS", "120").split(",")],
) )
@pytest.mark.skip(reason="Flaky test: DIS-665")
def test_concurrent_determinism_with_ifeval( def test_concurrent_determinism_with_ifeval(
self, self,
tester, tester,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment