Unverified commit 03025c02, authored by Isotr0py, committed by GitHub
Browse files

[CI/Build] Fix CPU CI online inference timeout (#10314)


Signed-off-by: Isotr0py <2037008807@qq.com>
parent 29f3ef26
...@@ -61,7 +61,7 @@ function cpu_tests() { ...@@ -61,7 +61,7 @@ function cpu_tests() {
docker exec cpu-test bash -c " docker exec cpu-test bash -c "
set -e set -e
export VLLM_CPU_KVCACHE_SPACE=10 export VLLM_CPU_KVCACHE_SPACE=10
export VLLM_CPU_OMP_THREADS_BIND=$CORE_RANGE export VLLM_CPU_OMP_THREADS_BIND=$1
python3 -m vllm.entrypoints.openai.api_server --model facebook/opt-125m --dtype half & python3 -m vllm.entrypoints.openai.api_server --model facebook/opt-125m --dtype half &
timeout 600 bash -c 'until curl localhost:8000/v1/models; do sleep 1; done' || exit 1 timeout 600 bash -c 'until curl localhost:8000/v1/models; do sleep 1; done' || exit 1
python3 benchmarks/benchmark_serving.py \ python3 benchmarks/benchmark_serving.py \
...@@ -75,4 +75,4 @@ function cpu_tests() { ...@@ -75,4 +75,4 @@ function cpu_tests() {
# All of CPU tests are expected to be finished less than 25 mins. # All of CPU tests are expected to be finished less than 25 mins.
export -f cpu_tests export -f cpu_tests
timeout 25m bash -c "cpu_tests" timeout 25m bash -c "cpu_tests $CORE_RANGE"
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment