2024-06-18 11:00:36 -07:00
|
|
|
steps:
|
2025-02-26 22:06:37 -05:00
|
|
|
# Wheel build for CUDA 12.4.0: builds the `build` target of docker/Dockerfile,
# copies `dist` out of the resulting image into ./artifacts (bind-mounted at
# /artifacts_host), then runs the wheel upload script.
- label: 'Build wheel - CUDA 12.4'
  agents:
    queue: cpu_queue_postmerge
  env:
    DOCKER_BUILDKIT: '1'
  commands:
  # Folded scalar: the lines below are joined with single spaces into one command.
  - >-
    DOCKER_BUILDKIT=1 docker build
    --build-arg max_jobs=16
    --build-arg USE_SCCACHE=1
    --build-arg GIT_REPO_CHECK=1
    --build-arg CUDA_VERSION=12.4.0
    --tag vllm-ci:build-image
    --target build
    --progress plain
    -f docker/Dockerfile .
  - 'mkdir artifacts'
  # chmod runs inside the container; presumably so the agent user on the host
  # can read and clean up the copied files afterwards.
  - >-
    docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image
    bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'
  - 'bash .buildkite/scripts/upload-wheels.sh'
|
|
|
|
|
2024-08-07 11:34:25 -07:00
|
|
|
# Wheel build for CUDA 12.1.0: builds the `build` target of docker/Dockerfile,
# copies `dist` out of the resulting image into ./artifacts (bind-mounted at
# /artifacts_host), then runs the wheel upload script.
- label: 'Build wheel - CUDA 12.1'
  agents:
    queue: cpu_queue_postmerge
  env:
    DOCKER_BUILDKIT: '1'
  commands:
  # Folded scalar: the lines below are joined with single spaces into one command.
  - >-
    DOCKER_BUILDKIT=1 docker build
    --build-arg max_jobs=16
    --build-arg USE_SCCACHE=1
    --build-arg GIT_REPO_CHECK=1
    --build-arg CUDA_VERSION=12.1.0
    --tag vllm-ci:build-image
    --target build
    --progress plain
    -f docker/Dockerfile .
  - 'mkdir artifacts'
  # chmod runs inside the container; presumably so the agent user on the host
  # can read and clean up the copied files afterwards.
  - >-
    docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image
    bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'
  - 'bash .buildkite/scripts/upload-wheels.sh'
|
|
|
|
|
2024-11-14 23:31:52 -08:00
|
|
|
# Note(simon): We always build the CUDA 11.8 wheel to ensure the build keeps working.
# However, the block step below (together with the matching `depends_on` line in the CUDA 11.8 step) can be uncommented to save some compute hours.
|
|
|
|
# - block: "Build CUDA 11.8 wheel"
|
|
|
|
# key: block-build-cu118-wheel
|
|
|
|
|
2024-08-07 11:34:25 -07:00
|
|
|
# Wheel build for CUDA 11.8.0: builds the `build` target of docker/Dockerfile,
# copies `dist` out of the resulting image into ./artifacts (bind-mounted at
# /artifacts_host), then runs the wheel upload script.
- label: 'Build wheel - CUDA 11.8'
  # Disabled dependency on the commented-out block step `block-build-cu118-wheel`:
  # depends_on: block-build-cu118-wheel
  agents:
    queue: cpu_queue_postmerge
  env:
    DOCKER_BUILDKIT: '1'
  commands:
  # Folded scalar: the lines below are joined with single spaces into one command.
  - >-
    DOCKER_BUILDKIT=1 docker build
    --build-arg max_jobs=16
    --build-arg USE_SCCACHE=1
    --build-arg GIT_REPO_CHECK=1
    --build-arg CUDA_VERSION=11.8.0
    --tag vllm-ci:build-image
    --target build
    --progress plain
    -f docker/Dockerfile .
  - 'mkdir artifacts'
  # chmod runs inside the container; presumably so the agent user on the host
  # can read and clean up the copied files afterwards.
  - >-
    docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image
    bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'
  - 'bash .buildkite/scripts/upload-wheels.sh'
|
2024-12-03 23:02:40 -08:00
|
|
|
|
|
|
|
# Manual gate for the release image: the "Build release image" command step
# names this step's key in its `depends_on`.
- block: 'Build release image'
  key: block-release-image-build
  # Explicit null (same value as `~`): this step declares no dependencies.
  depends_on: null
|
|
|
|
|
|
|
|
# Builds the `vllm-openai` target of docker/Dockerfile with CUDA 12.4.0 and
# pushes it to the public ECR release repo, tagged with the build's commit.
# Runs only after the `block-release-image-build` step.
- label: 'Build release image'
  depends_on: block-release-image-build
  agents:
    queue: cpu_queue_postmerge
  commands:
  # Log Docker in to the public ECR registry before building/pushing.
  - >-
    aws ecr-public get-login-password --region us-east-1 |
    docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7
  # Folded scalar: the lines below are joined with single spaces into one command.
  - >-
    DOCKER_BUILDKIT=1 docker build
    --build-arg max_jobs=16
    --build-arg USE_SCCACHE=1
    --build-arg GIT_REPO_CHECK=1
    --build-arg CUDA_VERSION=12.4.0
    --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT
    --target vllm-openai
    --progress plain
    -f docker/Dockerfile .
  - 'docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT'
|
2024-12-09 15:07:48 -08:00
|
|
|
|
|
|
|
# Builds docker/Dockerfile.tpu and pushes it as vllm/vllm-tpu under two tags:
# `nightly` and the build's commit. Only runs when the build's NIGHTLY
# environment variable equals "1".
- label: 'Build and publish TPU release image'
  # Explicit null (same value as `~`): this step declares no dependencies.
  depends_on: null
  if: 'build.env("NIGHTLY") == "1"'
  agents:
    queue: tpu_queue_postmerge
  plugins:
  # Registry login via the docker-login plugin; the password is read from the
  # DOCKERHUB_TOKEN environment variable.
  - docker-login#v3.0.0:
      username: vllm
      password-env: DOCKERHUB_TOKEN
  env:
    DOCKER_BUILDKIT: '1'
  commands:
  # Folded scalar: the lines below are joined with single spaces into one command.
  - >-
    DOCKER_BUILDKIT=1 docker build
    --build-arg max_jobs=16
    --build-arg USE_SCCACHE=1
    --build-arg GIT_REPO_CHECK=1
    --tag vllm/vllm-tpu:nightly
    --tag vllm/vllm-tpu:$BUILDKITE_COMMIT
    --progress plain
    -f docker/Dockerfile.tpu .
  - 'docker push vllm/vllm-tpu:nightly'
  - 'docker push vllm/vllm-tpu:$BUILDKITE_COMMIT'
|
2024-12-20 03:46:55 +08:00
|
|
|
|
2025-01-31 13:39:36 -08:00
|
|
|
# Asks for the release version; the answer is stored under the field key
# `release-version`, which the CPU release image step reads back with
# `buildkite-agent meta-data get release-version`.
- input: 'Provide Release version here'
  fields:
  - key: release-version
    text: 'What is the release version?'
|
|
|
|
|
2024-12-20 03:46:55 +08:00
|
|
|
# Manual gate for the CPU release image: the "Build and publish CPU release
# image" command step names this step's key in its `depends_on`.
- block: 'Build CPU release image'
  # Explicit null (same value as `~`): this step declares no dependencies.
  depends_on: null
  key: block-cpu-release-image-build
|
|
|
|
|
|
|
|
# Builds the `vllm-openai` target of docker/Dockerfile.cpu and publishes it to
# the public ECR CPU release repo under two tags: the release version and
# `latest`. Runs only after the `block-cpu-release-image-build` step.
#
# The version tag comes from the `release-version` build meta-data key, the
# same key used by the "Provide Release version here" input step.
# NOTE(review): this step has no dependency on that input, so the input
# presumably has to be answered before the block step is unblocked - confirm.
- label: 'Build and publish CPU release image'
  depends_on: block-cpu-release-image-build
  agents:
    queue: cpu_queue_postmerge
  env:
    DOCKER_BUILDKIT: '1'
  commands:
  # Log Docker in to the public ECR registry before building/pushing.
  - >-
    aws ecr-public get-login-password --region us-east-1 |
    docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7
  # Folded scalar: the lines below are joined with single spaces into one command.
  - >-
    DOCKER_BUILDKIT=1 docker build
    --build-arg max_jobs=16
    --build-arg GIT_REPO_CHECK=1
    --tag public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:$(buildkite-agent meta-data get release-version)
    --tag public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:latest
    --progress plain
    --target vllm-openai
    -f docker/Dockerfile.cpu .
  - 'docker push public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:$(buildkite-agent meta-data get release-version)'
  # The build also tags the image as `latest`; push that tag as well, otherwise
  # it only ever exists on the build agent. Pushed after the version tag so
  # `latest` moves only once the versioned image has been published.
  - 'docker push public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:latest'
|