Add documentation on how to do incremental builds (#2796)

This commit is contained in:
Philipp Moritz 2024-02-07 14:42:02 -08:00 committed by GitHub
parent c81dddb45c
commit 931746bc6d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 15 additions and 0 deletions

View File

@@ -67,3 +67,13 @@ You can also build and install vLLM from source:
$ # Use `--ipc=host` to make sure the shared memory is large enough.
$ docker run --gpus all -it --rm --ipc=host nvcr.io/nvidia/pytorch:23.10-py3
.. note::
    If you are developing the C++ backend of vLLM, consider building vLLM with

    .. code-block:: console

        $ python setup.py develop

    since it will give you incremental builds. The downside is that this method
    is `deprecated by setuptools <https://github.com/pypa/setuptools/issues/917>`_.

View File

@@ -15,6 +15,11 @@ from torch.utils.cpp_extension import BuildExtension, CUDAExtension, CUDA_HOME,
ROOT_DIR = os.path.dirname(__file__)
# If you are developing the C++ backend of vLLM, consider building vLLM with
# `python setup.py develop` since it will give you incremental builds.
# The downside is that this method is deprecated, see
# https://github.com/pypa/setuptools/issues/917
MAIN_CUDA_VERSION = "12.1"
# Supported NVIDIA GPU architectures.