# vllm/.buildkite/test-pipeline.yaml
# Test pipeline definition. To run more tests, either add a new step or add a
# new command to an existing step; the existing steps show the available
# options.
# This file is fed into the Jinja template `test-template.j2`, which generates
# the final pipeline YAML file.
# Keys used by the steps in this file: label, command / commands, working_dir,
# num_gpus, no_gpu, parallelism, soft_fail.
steps:
# Runs pytest on test_regression.py from /vllm-workspace/tests.
- label: Regression Test
  command: pytest -v -s test_regression.py
  working_dir: "/vllm-workspace/tests"  # optional
# Runs pytest on `async_engine`.
- label: AsyncEngine Test
  command: pytest -v -s async_engine
# Runs pytest on `basic_correctness` with `--forked`.
- label: Basic Correctness Test
  command: pytest -v -s --forked basic_correctness
# Runs pytest on `core`.
- label: Core Test
  command: pytest -v -s core
# Runs pytest on test_comm_ops.py (with `--forked`) from the distributed tests
# directory, requesting 2 GPUs.
- label: Distributed Comm Ops Test
  command: pytest -v -s --forked test_comm_ops.py
  working_dir: "/vllm-workspace/tests/distributed"
  num_gpus: 2  # only 1 or 2 are supported for now
# Runs the distributed tests from the distributed tests directory, requesting
# 2 GPUs: test_pynccl.py first, then test_basic_distributed_correctness.py
# once per model, with the model passed through TEST_DIST_MODEL.
- label: Distributed Tests
  working_dir: "/vllm-workspace/tests/distributed"
  num_gpus: 2  # only 1 or 2 are supported for now
  commands:
  - pytest -v -s --forked test_pynccl.py
  - TEST_DIST_MODEL=facebook/opt-125m pytest -v -s --forked test_basic_distributed_correctness.py
  - TEST_DIST_MODEL=meta-llama/Llama-2-7b-hf pytest -v -s --forked test_basic_distributed_correctness.py
# Runs pytest on `engine`, `tokenization`, test_sequence.py and test_config.py
# in a single invocation.
- label: Engine Test
  command: pytest -v -s engine tokenization test_sequence.py test_config.py
# Runs pytest on `entrypoints`.
- label: Entrypoints Test
  command: pytest -v -s entrypoints
# Runs pytest on `kernels`, split across `parallelism` jobs. Each job passes
# $$BUILDKITE_PARALLEL_JOB as its shard id and $$BUILDKITE_PARALLEL_JOB_COUNT
# as the number of shards.
# NOTE(review): `$$` and the `%N` in the label are presumably Buildkite
# escapes/placeholders resolved per parallel job -- confirm in Buildkite docs.
- label: Kernels Test %N
  command: pytest -v -s kernels --shard-id=$$BUILDKITE_PARALLEL_JOB --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
  parallelism: 4
# Runs download-images.sh, then pytest on `models` with `--forked`, skipping
# models/test_llava.py (which has its own step in this pipeline).
# This step is marked soft_fail.
- label: Models Test
  commands:
  - bash ../.buildkite/download-images.sh
  - pytest -v -s models --ignore=models/test_llava.py --forked
  soft_fail: true
# Runs download-images.sh, then pytest on models/test_llava.py.
- label: Llava Test
  commands:
  - bash ../.buildkite/download-images.sh
  - pytest -v -s models/test_llava.py
# Runs pytest on `prefix_caching`.
- label: Prefix Caching Test
  commands:
  - pytest -v -s prefix_caching
# Runs pytest on `samplers`.
- label: Samplers Test
  command: pytest -v -s samplers
# Runs pytest on test_logits_processor.py.
- label: LogitsProcessor Test
  command: pytest -v -s test_logits_processor.py
# Runs pytest on `worker`.
- label: Worker Test
  command: pytest -v -s worker
# Runs pytest on `spec_decode`.
- label: Speculative decoding tests
  command: pytest -v -s spec_decode
# Runs pytest on `lora`, split across `parallelism` jobs. Each job passes
# $$BUILDKITE_PARALLEL_JOB as its shard id and $$BUILDKITE_PARALLEL_JOB_COUNT
# as the number of shards.
# NOTE(review): `$$` and the `%N` in the label are presumably Buildkite
# escapes/placeholders resolved per parallel job -- confirm in Buildkite docs.
- label: LoRA Test %N
  command: pytest -v -s lora --shard-id=$$BUILDKITE_PARALLEL_JOB --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
  parallelism: 4
# Runs pytest on `metrics`.
- label: Metrics Test
  command: pytest -v -s metrics
# From /vllm-workspace/.buildkite: installs aiohttp with pip, then runs
# run-benchmarks.sh.
- label: Benchmarks
  working_dir: "/vllm-workspace/.buildkite"
  commands:
  - pip install aiohttp
  - bash run-benchmarks.sh
# From /vllm-workspace/docs: installs requirements-docs.txt, then runs
# `make html` with SPHINXOPTS set to -W. This step sets no_gpu.
# The backslash-escaped quotes around -W are part of the command text and are
# kept verbatim.
# NOTE(review): the escapes presumably survive substitution into the Jinja
# template -- confirm against test-template.j2 before changing them.
- label: Documentation Build
  working_dir: "/vllm-workspace/docs"
  no_gpu: true
  commands:
  - pip install -r requirements-docs.txt
  - SPHINXOPTS=\"-W\" make html