From 68cf1601d3ccac7b7a661390d972a2469a7b4c61 Mon Sep 17 00:00:00 2001
From: Kunshang Ji
Date: Wed, 19 Mar 2025 01:29:25 -0700
Subject: [PATCH] [CI][Intel GPU] update XPU dockerfile and CI script (#15109)

Signed-off-by: Kunshang Ji
---
 .buildkite/run-xpu-test.sh |  9 +++++----
 Dockerfile.xpu             | 12 +++---------
 2 files changed, 8 insertions(+), 13 deletions(-)

diff --git a/.buildkite/run-xpu-test.sh b/.buildkite/run-xpu-test.sh
index a9c71201..3a0e6bdb 100644
--- a/.buildkite/run-xpu-test.sh
+++ b/.buildkite/run-xpu-test.sh
@@ -12,10 +12,11 @@ docker build -t ${image_name} -f Dockerfile.xpu .
 
 # Setup cleanup
 remove_docker_container() {
-  docker rm -f "${container_name}" || docker image rm -f "${image_name}" || true;
+  docker rm -f "${container_name}" || true;
+  docker image rm -f "${image_name}" || true;
+  docker system prune -f || true;
 }
 trap remove_docker_container EXIT
-remove_docker_container
 
 # Run the image and test offline inference/tensor parallel
 docker run \
@@ -25,6 +26,6 @@ docker run \
     --name "${container_name}" \
     "${image_name}" \
     sh -c '
-    python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m
-    python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m -tp 2
+    VLLM_USE_V1=0 python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m
+    VLLM_USE_V1=0 python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m -tp 2
 '
diff --git a/Dockerfile.xpu b/Dockerfile.xpu
index 672a494e..ad4abf16 100644
--- a/Dockerfile.xpu
+++ b/Dockerfile.xpu
@@ -1,11 +1,7 @@
-FROM intel/deep-learning-essentials:2025.0.1-0-devel-ubuntu22.04 AS vllm-base
+# oneapi 2025.0.2 docker base image use rolling 2448 package. https://dgpu-docs.intel.com/releases/packages.html?release=Rolling+2448.13&os=Ubuntu+22.04, and we don't need install driver manually. 
+FROM intel/deep-learning-essentials:2025.0.2-0-devel-ubuntu22.04 AS vllm-base
 
-RUN wget -O- https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB | gpg --dearmor | tee /usr/share/keyrings/intel-oneapi-archive-keyring.gpg > /dev/null && \
-    echo "deb [signed-by=/usr/share/keyrings/intel-oneapi-archive-keyring.gpg] https://apt.repos.intel.com/oneapi all main " | tee /etc/apt/sources.list.d/oneAPI.list && \
-    chmod 644 /usr/share/keyrings/intel-oneapi-archive-keyring.gpg && \
-    wget -O- https://repositories.intel.com/graphics/intel-graphics.key | gpg --dearmor | tee /usr/share/keyrings/intel-graphics.gpg > /dev/null && \
-    echo "deb [arch=amd64,i386 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/graphics/ubuntu jammy arc" | tee /etc/apt/sources.list.d/intel.gpu.jammy.list && \
-    chmod 644 /usr/share/keyrings/intel-graphics.gpg
+RUN rm /etc/apt/sources.list.d/intel-graphics.list
 
 RUN apt-get update -y && \
     apt-get install -y --no-install-recommends --fix-missing \
@@ -21,8 +17,6 @@ RUN apt-get update -y && \
     python3 \
     python3-dev \
     python3-pip \
-    libze-intel-gpu-dev \
-    libze-intel-gpu1 \
     wget
 
 WORKDIR /workspace/vllm