Add documentation on how to do incremental builds (#2796)

2024-02-07 14:42:02 -08:00 · 2024-02-07 14:42:02 -08:00 · 931746bc6d
commit 931746bc6d
parent c81dddb45c
2 changed files with 15 additions and 0 deletions
--- a/docs/source/getting_started/installation.rst
+++ b/docs/source/getting_started/installation.rst
@@ -67,3 +67,13 @@ You can also build and install vLLM from source:
        $ # Use `--ipc=host` to make sure the shared memory is large enough.
        $ docker run --gpus all -it --rm --ipc=host nvcr.io/nvidia/pytorch:23.10-py3
 .. note::
    If you are developing the C++ backend of vLLM, consider building vLLM with:

    .. code-block:: console

        $ python setup.py develop

    since it will give you incremental builds. The downside is that this method
    is `deprecated by setuptools <https://github.com/pypa/setuptools/issues/917>`_.
--- a/setup.py
+++ b/setup.py
@@ -15,6 +15,11 @@ from torch.utils.cpp_extension import BuildExtension, CUDAExtension, CUDA_HOME,
 ROOT_DIR = os.path.dirname(__file__)
 # If you are developing the C++ backend of vLLM, consider building vLLM with
 # `python setup.py develop`, since it will give you incremental builds.
 # The downside is that this method is deprecated by setuptools; see
 # https://github.com/pypa/setuptools/issues/917
 MAIN_CUDA_VERSION = "12.1"
 # Supported NVIDIA GPU architectures.