[CI/Build] Fix CPU CI online inference timeout (#10314)

Signed-off-by: Isotr0py <2037008807@qq.com>
This commit is contained in:
Isotr0py 2024-11-14 16:45:32 +08:00 committed by GitHub
parent 29f3ef26a3
commit 03025c023f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -61,7 +61,7 @@ function cpu_tests() {
docker exec cpu-test bash -c " docker exec cpu-test bash -c "
set -e set -e
export VLLM_CPU_KVCACHE_SPACE=10 export VLLM_CPU_KVCACHE_SPACE=10
export VLLM_CPU_OMP_THREADS_BIND=$CORE_RANGE export VLLM_CPU_OMP_THREADS_BIND=$1
python3 -m vllm.entrypoints.openai.api_server --model facebook/opt-125m --dtype half & python3 -m vllm.entrypoints.openai.api_server --model facebook/opt-125m --dtype half &
timeout 600 bash -c 'until curl localhost:8000/v1/models; do sleep 1; done' || exit 1 timeout 600 bash -c 'until curl localhost:8000/v1/models; do sleep 1; done' || exit 1
python3 benchmarks/benchmark_serving.py \ python3 benchmarks/benchmark_serving.py \
@@ -75,4 +75,4 @@ function cpu_tests() {
# All of CPU tests are expected to be finished less than 25 mins. # All of CPU tests are expected to be finished less than 25 mins.
export -f cpu_tests export -f cpu_tests
timeout 25m bash -c "cpu_tests" timeout 25m bash -c "cpu_tests $CORE_RANGE"