Unverified commit 70f99382, authored by Anant Sharma, committed by GitHub
Browse files

build: enable kvbm in trtllm container (#2956)


Signed-off-by: Anant Sharma <anants@nvidia.com>
parent 2ae20102
......@@ -693,8 +693,8 @@ if [ ! -z ${RELEASE_BUILD} ]; then
BUILD_ARGS+=" --build-arg RELEASE_BUILD=${RELEASE_BUILD} "
fi
-if [[ $FRAMEWORK == "VLLM" ]]; then
-echo "Forcing enable_kvbm to true in vLLM image build"
+if [[ $FRAMEWORK == "VLLM" ]] || [[ $FRAMEWORK == "TRTLLM" ]]; then
+echo "Forcing enable_kvbm to true in ${FRAMEWORK} image build"
ENABLE_KVBM=true
fi
......
......@@ -775,7 +775,6 @@ class TestDeterminism:
],
indirect=True,
)
-@pytest.mark.vllm
def test_determinism_with_cache_reset(self, tester, llm_server, runtime_services):
"""Test determinism across cache reset: run test with warmup, reset cache, run again without warmup."""
print("\n" + "=" * 70)
......@@ -916,6 +915,7 @@ class TestDeterminism:
"num_prompts",
[int(x) for x in os.environ.get("KVBM_IFEVAL_PROMPTS", "120").split(",")],
)
+@pytest.mark.skip(reason="Flaky test: DIS-665")
def test_concurrent_determinism_with_ifeval(
self,
tester,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment