bootstrap
if [[ -n "" ]]; then VLLM_CI_BRANCH= curl -sSL "https://raw.githubusercontent.com/vllm-project/buildkite-ci//scripts/bootstrap.sh" | bash && exit 0; fi && curl -sSL "https://raw.githubusercontent.com/vllm-project/buildkite-ci/main/scripts/bootstrap.sh" | bash

Ran in 19s

build image
aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7 && #!/bin/bash && if [[ -z $(docker manifest inspect public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb) ]]; then && echo "Image not found, proceeding with build..." && else && echo "Image found" && exit 0 && fi && docker build --file docker/Dockerfile --build-arg max_jobs=16 --build-arg buildkite_commit=7172e726b7fccd763f7a157e95cbce13cecbc5bb --build-arg USE_SCCACHE=1 --tag public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb --target test --progress plain . && docker push public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb

Ran in 34m 5s

build image CUDA 12.1
aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7 && #!/bin/bash && if [[ -z $(docker manifest inspect public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb-cu121) ]]; then && echo "Image not found, proceeding with build..." && else && echo "Image found" && exit 0 && fi && docker build --file docker/Dockerfile --build-arg max_jobs=16 --build-arg buildkite_commit=7172e726b7fccd763f7a157e95cbce13cecbc5bb --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION=12.1.0 --tag public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb-cu121 --target test --progress plain . && docker push public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb-cu121

build image CUDA 11.8
aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7 && #!/bin/bash && if [[ -z $(docker manifest inspect public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb-cu118) ]]; then && echo "Image not found, proceeding with build..." && else && echo "Image found" && exit 0 && fi && docker build --file docker/Dockerfile --build-arg max_jobs=16 --build-arg buildkite_commit=7172e726b7fccd763f7a157e95cbce13cecbc5bb --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION=11.8.0 --tag public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb-cu118 --target test --progress plain . && docker push public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb-cu118

Documentation Build

Ran in 4m 37s

Async Engine, Inputs, Utils, Worker Test

Python-only Installation Test

Basic Correctness Test

Chunked Prefill Test

Core Test

Entrypoints Test

Distributed Tests (4 GPUs)

Metrics, Tracing Test

Regression Test

Engine Test

V1 Test

Examples Test

Prefix Caching Test

Samplers Test

LogitsProcessor Test

Speculative decoding tests

1/4

LoRA Test 1

2/4

LoRA Test 2

3/4

LoRA Test 3

4/4

LoRA Test 4

PyTorch Compilation Unit Tests

PyTorch Fullgraph Smoke Test

PyTorch Fullgraph Test

1/4

Kernels Test 1

2/4

Kernels Test 2

3/4

Kernels Test 3

4/4

Kernels Test 4

Tensorizer Test

Benchmarks

Quantization Test

LM Eval Small Models

OpenAI API correctness

Encoder Decoder tests

OpenAI-Compatible Tool Use

Basic Models Test

Language Models Test (Standard)

Language Models Test (Extended)

Multi-Modal Models Test (Standard)

Multi-Modal Models Test (Extended) 1

Multi-Modal Models Test (Extended) 2

Custom Models Test

Distributed Comm Ops Test

2 Node Tests (4 GPUs in total)
./.buildkite/scripts/run-multi-node-test.sh /vllm-workspace/tests 2 2 public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:7172e726b7fccd763f7a157e95cbce13cecbc5bb "VLLM_TEST_SAME_HOST=0 torchrun --nnodes 2 --nproc-per-node=2 --rdzv_backend=c10d --rdzv_endpoint=192.168.10.10 distributed/test_same_node.py | grep 'Same node test passed' && VLLM_MULTI_NODE=1 pytest -v -s distributed/test_multi_node_assignment.py && VLLM_MULTI_NODE=1 pytest -v -s distributed/test_pipeline_parallel.py" "VLLM_TEST_SAME_HOST=0 torchrun --nnodes 2 --nproc-per-node=2 --rdzv_backend=c10d --rdzv_endpoint=192.168.10.10 distributed/test_same_node.py | grep 'Same node test passed'"

Distributed Tests (2 GPUs)

Plugin Tests (2 GPUs)

Multi-step Tests (4 GPUs)

Pipeline Parallelism Test

LoRA TP Test (Distributed)

Weight Loading Multiple GPU Test

Weight Loading Multiple GPU Test - Large Models

Distributed Tests (A100)

LM Eval Large Models

AMD:

build image
grep -i 'from base as test' docker/Dockerfile.rocm && docker build --build-arg max_jobs=16 --tag rocm/vllm-ci:7172e726b7fccd763f7a157e95cbce13cecbc5bb -f docker/Dockerfile.rocm --target test --progress plain . || docker build --build-arg max_jobs=16 --tag rocm/vllm-ci:7172e726b7fccd763f7a157e95cbce13cecbc5bb -f docker/Dockerfile.rocm --progress plain . && docker push rocm/vllm-ci:7172e726b7fccd763f7a157e95cbce13cecbc5bb

Ran in 21m 56s

AMD: Core Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s core"

Ran in 20m 29s

AMD: Metrics, Tracing Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s metrics && pytest -v -s tracing"

Ran in 20m 28s

AMD: Engine Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s engine test_sequence.py test_config.py test_logger.py && pytest -v -s tokenization"

Ran in 22m 42s

AMD: Prefix Caching Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s prefix_caching"

Ran in 16m 38s

AMD: LogitsProcessor Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s test_logits_processor.py && pytest -v -s model_executor/test_guided_processors.py"

Ran in 10m 45s

AMD: Benchmarks
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/.buildkite ; bash scripts/run-benchmarks.sh"

Ran in 9m 38s

AMD: Custom Models Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; echo 'Testing custom models...'"

Ran in 7m 31s

AMD: Distributed Comm Ops Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s distributed/test_comm_ops.py && pytest -v -s distributed/test_shm_broadcast.py"

Ran in 4m 21s

Neuron Test
bash .buildkite/scripts/hardware_ci/run-neuron-test.sh

Ran in 3m 57s

Intel CPU Test
bash .buildkite/scripts/hardware_ci/run-cpu-test.sh

Intel HPU Test
bash .buildkite/scripts/hardware_ci/run-hpu-test.sh

Ran in 1m 20s

Intel GPU Test
bash .buildkite/scripts/hardware_ci/run-xpu-test.sh

Ran in 4m 1s

Harry Mellor unblocked Run IBM Power(ppc64le) CPU Test
Fri 11th Apr at 11:27 AM

IBM Power(ppc64le) CPU Test
bash .buildkite/scripts/hardware_ci/run-cpu-test-ppc64le.sh

Ran in 25m 16s

TPU V0 Test
yes | docker system prune -a && if [[ -f ".buildkite/scripts/hardware_ci/run-tpu-test.sh" ]]; then bash .buildkite/scripts/hardware_ci/run-tpu-test.sh; fi

Ran in 1s

TPU V1 Test
if [[ -f ".buildkite/scripts/hardware_ci/run-tpu-v1-test.sh" ]]; then bash .buildkite/scripts/hardware_ci/run-tpu-v1-test.sh; fi && yes | docker system prune -a

Ran in 35m 41s

Total Job Run Time: 4h 3m