# vllm/Dockerfile.xpu

# Base stage: Intel oneAPI Base Kit (devel, Ubuntu 22.04), pinned to an exact tag.
FROM intel/oneapi-basekit:2024.2.1-0-devel-ubuntu22.04 AS vllm-base

# Register Intel's oneAPI and graphics apt repositories together with their
# signing keys. Each key is downloaded to a temporary file first and only then
# de-armored, so a failed download stops the build at this step; piping wget
# straight into gpg would hide that failure because the default /bin/sh only
# reports the exit status of the last command in a pipeline.
# The keyrings are made world-readable (644); the temporary key files are
# removed in the same layer so they do not end up in the image.
RUN wget -O /tmp/intel-oneapi.pub https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB && \
    gpg --dearmor < /tmp/intel-oneapi.pub > /usr/share/keyrings/intel-oneapi-archive-keyring.gpg && \
    echo "deb [signed-by=/usr/share/keyrings/intel-oneapi-archive-keyring.gpg] https://apt.repos.intel.com/oneapi all main " | tee /etc/apt/sources.list.d/oneAPI.list && \
    chmod 644 /usr/share/keyrings/intel-oneapi-archive-keyring.gpg && \
    wget -O /tmp/intel-graphics.key https://repositories.intel.com/graphics/intel-graphics.key && \
    gpg --dearmor < /tmp/intel-graphics.key > /usr/share/keyrings/intel-graphics.gpg && \
    echo "deb [arch=amd64,i386 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/graphics/ubuntu jammy arc" | tee /etc/apt/sources.list.d/intel.gpu.jammy.list && \
    chmod 644 /usr/share/keyrings/intel-graphics.gpg && \
    rm -f /tmp/intel-oneapi.pub /tmp/intel-graphics.key

# Install the OS-level packages needed by the later build steps.
# update + install run in one layer so the package index is never stale, and
# the downloaded package lists are removed in that same layer so they are not
# baked into the image (deleting them in a later RUN would not shrink it).
RUN apt-get update -y && \
    apt-get install -y --no-install-recommends --fix-missing \
    curl \
    ffmpeg \
    git \
    libsndfile1 \
    libsm6 \
    libxext6 \
    libgl1 \
    lsb-release \
    numactl \
    python3 \
    python3-dev \
    python3-pip \
    # vim \
    wget && \
    rm -rf /var/lib/apt/lists/*

# All following relative paths resolve against the vLLM workspace.
WORKDIR /workspace/vllm
# Copy only the requirement manifests ahead of the full source tree so the
# dependency layer below is rebuilt only when these files change.
# NOTE(review): common.txt is presumably pulled in by xpu.txt — confirm.
COPY requirements/xpu.txt /workspace/vllm/requirements/xpu.txt
COPY requirements/common.txt /workspace/vllm/requirements/common.txt

# Install the XPU Python requirements. pip's cache directory is a BuildKit
# cache mount, which lives on the build host and is never part of the image,
# so pip is allowed to use it. Passing --no-cache-dir here would leave the
# mount unused and force a full re-download on every rebuild.
RUN --mount=type=cache,target=/root/.cache/pip \
    pip install \
    -r requirements/xpu.txt

# Build the pti-gpu SDK from source at a pinned commit and install it under
# /usr/local. The clone lands inside the current working directory.
# The build uses the icpx toolchain file shipped in the pti-gpu tree, with its
# tests disabled. Parallelism is capped at the number of available CPUs: a bare
# `make -j` places no limit on concurrent jobs and can exhaust memory on the
# build host.
RUN git clone https://github.com/intel/pti-gpu && \
    cd pti-gpu/sdk && \
    git checkout 6c491f07a777ed872c2654ca9942f1d0dde0a082 && \
    mkdir build && \
    cd build && \
    cmake -DCMAKE_BUILD_TYPE=Release -DCMAKE_TOOLCHAIN_FILE=../cmake/toolchains/icpx_toolchain.cmake -DBUILD_TESTING=OFF .. && \
    make -j"$(nproc)" && \
    cmake --install . --config Release --prefix "/usr/local"

# Append /usr/local/lib/ to the dynamic loader search path inherited from the
# base image.
# NOTE(review): presumably so the libraries installed under the /usr/local
# prefix by the pti-gpu build are found at runtime — confirm.
ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/usr/local/lib/"

# Bring the whole build context into the working directory.
COPY . .
# Build argument gating the repository check below; passing 0 skips it, any
# other value (including leaving it unset) runs it.
ARG GIT_REPO_CHECK
# .git is bind-mounted from the build context for this step only.
RUN --mount=type=bind,source=.git,target=.git \
    [ "$GIT_REPO_CHECK" = 0 ] || bash tools/check_repo.sh

# Set for the build step below and kept in the environment of the resulting image.
# NOTE(review): presumably read by setup.py to select the XPU backend — confirm.
ENV VLLM_TARGET_DEVICE=xpu

# Build and install the project from the sources in the working directory.
# The pip cache directory is a cache mount, and .git is bind-mounted from the
# build context for the duration of this step only.
# NOTE(review): the .git mount is likely needed so the package version can be
# derived from git metadata — confirm against setup.py.
RUN --mount=type=cache,target=/root/.cache/pip \
    --mount=type=bind,source=.git,target=.git \
    python3 setup.py install

# Default command for this stage: start a bash shell.
CMD ["/bin/bash"]

# Serving stage, layered directly on top of the vllm-base stage.
FROM vllm-base AS vllm-openai

# Extra Python packages for the OpenAI-compatible API server image.
# modelscope release 1.15.0 is explicitly excluded.
RUN --mount=type=cache,target=/root/.cache/pip \
    pip install \
        accelerate \
        hf_transfer \
        'modelscope!=1.15.0'

# Runtime environment for the serving image.
# key=value form is required to set two variables in one ENV instruction: the
# legacy space-separated form treats everything after the first name as a
# single value, which would leave TRITON_XPU_PROFILE undefined and fold its
# text into VLLM_USAGE_SOURCE.
ENV VLLM_USAGE_SOURCE=production-docker-image \
    TRITON_XPU_PROFILE=1
# Install development dependencies (for testing): the vllm_test_utils package
# from the copied source tree, in editable mode.
RUN python3 -m pip install -e tests/vllm_test_utils
# Containers from this stage run the vLLM OpenAI-compatible API server module
# (exec form, so the Python process is started directly without a shell).
ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00			`FROM intel/oneapi-basekit:2024.2.1-0-devel-ubuntu22.04 AS vllm-base`
[Hardware][Intel GPU] Add Intel GPU(XPU) inference backend (#3814) Co-authored-by: Jiang Li <jiang1.li@intel.com> Co-authored-by: Abhilash Majumder <abhilash.majumder@intel.com> Co-authored-by: Abhilash Majumder <30946547+abhilash1910@users.noreply.github.com> 2024-06-18 02:01:25 +08:00
			`RUN wget -O- https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB \| gpg --dearmor \| tee /usr/share/keyrings/intel-oneapi-archive-keyring.gpg > /dev/null && \`
			`echo "deb [signed-by=/usr/share/keyrings/intel-oneapi-archive-keyring.gpg] https://apt.repos.intel.com/oneapi all main " \| tee /etc/apt/sources.list.d/oneAPI.list && \`
			`chmod 644 /usr/share/keyrings/intel-oneapi-archive-keyring.gpg && \`
			`wget -O- https://repositories.intel.com/graphics/intel-graphics.key \| gpg --dearmor \| tee /usr/share/keyrings/intel-graphics.gpg > /dev/null && \`
			`echo "deb [arch=amd64,i386 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/graphics/ubuntu jammy arc" \| tee /etc/apt/sources.list.d/intel.gpu.jammy.list && \`
			`chmod 644 /usr/share/keyrings/intel-graphics.gpg`

[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00			`RUN apt-get update -y && \`
			`apt-get install -y --no-install-recommends --fix-missing \`
			`curl \`
			`ffmpeg \`
			`git \`
			`libsndfile1 \`
			`libsm6 \`
			`libxext6 \`
			`libgl1 \`
			`lsb-release \`
			`numactl \`
			`python3 \`
			`python3-dev \`
			`python3-pip \`
			`# vim \`
			`wget`
[Hardware][Intel GPU] Add Intel GPU(XPU) inference backend (#3814) Co-authored-by: Jiang Li <jiang1.li@intel.com> Co-authored-by: Abhilash Majumder <abhilash.majumder@intel.com> Co-authored-by: Abhilash Majumder <30946547+abhilash1910@users.noreply.github.com> 2024-06-18 02:01:25 +08:00
			`WORKDIR /workspace/vllm`
Move requirements into their own directory (#12547) Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com> 2025-03-08 17:44:35 +01:00			`COPY requirements/xpu.txt /workspace/vllm/requirements/xpu.txt`
			`COPY requirements/common.txt /workspace/vllm/requirements/common.txt`
[Hardware][Intel GPU] Add Intel GPU(XPU) inference backend (#3814) Co-authored-by: Jiang Li <jiang1.li@intel.com> Co-authored-by: Abhilash Majumder <abhilash.majumder@intel.com> Co-authored-by: Abhilash Majumder <30946547+abhilash1910@users.noreply.github.com> 2024-06-18 02:01:25 +08:00
[CI/Build] use setuptools-scm to set __version__ (#4738) Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-23 18:44:26 +02:00			`RUN --mount=type=cache,target=/root/.cache/pip \`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00			`pip install --no-cache-dir \`
Move requirements into their own directory (#12547) Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com> 2025-03-08 17:44:35 +01:00			`-r requirements/xpu.txt`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00
[Misc][XPU] Upgrade to Pytorch 2.5 for xpu backend (#9823) Signed-off-by: Kunshang Ji <kunshang.ji@intel.com> Signed-off-by: yan ma <yan.ma@intel.com> Co-authored-by: Kunshang Ji <kunshang.ji@intel.com> 2024-11-07 09:29:03 +08:00			`RUN git clone https://github.com/intel/pti-gpu && \`
			`cd pti-gpu/sdk && \`
			`git checkout 6c491f07a777ed872c2654ca9942f1d0dde0a082 && \`
			`mkdir build && \`
			`cd build && \`
			`cmake -DCMAKE_BUILD_TYPE=Release -DCMAKE_TOOLCHAIN_FILE=../cmake/toolchains/icpx_toolchain.cmake -DBUILD_TESTING=OFF .. && \`
			`make -j && \`
			`cmake --install . --config Release --prefix "/usr/local"`

			`ENV LD_LIBRARY_PATH="$LD_LIBRARY_PATH:/usr/local/lib/"`

[CI/Build] remove .github from .dockerignore, add dirty repo check (#9375) 2024-10-17 19:25:06 +02:00			`COPY . .`
			`ARG GIT_REPO_CHECK`
			`RUN --mount=type=bind,source=.git,target=.git \`
			`if [ "$GIT_REPO_CHECK" != 0 ]; then bash tools/check_repo.sh; fi`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00
			`ENV VLLM_TARGET_DEVICE=xpu`
[Hardware][Intel GPU] Add Intel GPU(XPU) inference backend (#3814) Co-authored-by: Jiang Li <jiang1.li@intel.com> Co-authored-by: Abhilash Majumder <abhilash.majumder@intel.com> Co-authored-by: Abhilash Majumder <30946547+abhilash1910@users.noreply.github.com> 2024-06-18 02:01:25 +08:00
[CI/Build] use setuptools-scm to set __version__ (#4738) Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-23 18:44:26 +02:00			`RUN --mount=type=cache,target=/root/.cache/pip \`
			`--mount=type=bind,source=.git,target=.git \`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00			`python3 setup.py install`
[Hardware][Intel GPU] Add Intel GPU(XPU) inference backend (#3814) Co-authored-by: Jiang Li <jiang1.li@intel.com> Co-authored-by: Abhilash Majumder <abhilash.majumder@intel.com> Co-authored-by: Abhilash Majumder <30946547+abhilash1910@users.noreply.github.com> 2024-06-18 02:01:25 +08:00
			`CMD ["/bin/bash"]`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00
			`FROM vllm-base AS vllm-openai`

			`# install additional dependencies for openai api server`
			`RUN --mount=type=cache,target=/root/.cache/pip \`
			`pip install accelerate hf_transfer 'modelscope!=1.15.0'`

			`ENV VLLM_USAGE_SOURCE production-docker-image \`
			`TRITON_XPU_PROFILE 1`
[ci] add vllm_test_utils (#10659) Signed-off-by: youkaichao <youkaichao@gmail.com> 2024-11-26 00:20:04 -08:00			`# install development dependencies (for testing)`
			`RUN python3 -m pip install -e tests/vllm_test_utils`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-27 23:45:50 -07:00			`ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]`