bootstrap
if [[ -n "" ]]; then VLLM_CI_BRANCH= curl -sSL "https://raw.githubusercontent.com/vllm-project/buildkite-ci//scripts/bootstrap.sh" | bash && exit 0; fi && curl -sSL "https://raw.githubusercontent.com/vllm-project/buildkite-ci/main/scripts/bootstrap.sh" | bash

Ran in 18s

build image
aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7 && #!/bin/bash && if [[ -z $(docker manifest inspect public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e) ]]; then && echo "Image not found, proceeding with build..." && else && echo "Image found" && exit 0 && fi && docker build --file docker/Dockerfile --build-arg max_jobs=16 --build-arg buildkite_commit=89ea6a23db8695fa84b09d260a923c5be810443e --build-arg USE_SCCACHE=1 --tag public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e --target test --progress plain . && docker push public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e

Ran in 33m 43s

build image CUDA 12.1
aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7 && #!/bin/bash && if [[ -z $(docker manifest inspect public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e-cu121) ]]; then && echo "Image not found, proceeding with build..." && else && echo "Image found" && exit 0 && fi && docker build --file docker/Dockerfile --build-arg max_jobs=16 --build-arg buildkite_commit=89ea6a23db8695fa84b09d260a923c5be810443e --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION=12.1.0 --tag public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e-cu121 --target test --progress plain . && docker push public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e-cu121

build image CUDA 11.8
aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7 && #!/bin/bash && if [[ -z $(docker manifest inspect public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e-cu118) ]]; then && echo "Image not found, proceeding with build..." && else && echo "Image found" && exit 0 && fi && docker build --file docker/Dockerfile --build-arg max_jobs=16 --build-arg buildkite_commit=89ea6a23db8695fa84b09d260a923c5be810443e --build-arg USE_SCCACHE=1 --build-arg CUDA_VERSION=11.8.0 --tag public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e-cu118 --target test --progress plain . && docker push public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e-cu118

Documentation Build

Ran in 4m 45s

Async Engine, Inputs, Utils, Worker Test

Python-only Installation Test

Basic Correctness Test

Chunked Prefill Test

Core Test

Entrypoints Test

Distributed Tests (4 GPUs)

Metrics, Tracing Test

Regression Test

Engine Test

V1 Test

Examples Test

Prefix Caching Test

Samplers Test

LogitsProcessor Test

Speculative decoding tests

1/4

LoRA Test 1

2/4

LoRA Test 2

3/4

LoRA Test 3

4/4

LoRA Test 4

PyTorch Compilation Unit Tests

PyTorch Fullgraph Smoke Test

PyTorch Fullgraph Test

1/4

Kernels Test 1

2/4

Kernels Test 2

3/4

Kernels Test 3

4/4

Kernels Test 4

Tensorizer Test

Benchmarks

Quantization Test

LM Eval Small Models

OpenAI API correctness

Encoder Decoder tests

OpenAI-Compatible Tool Use

Basic Models Test

Language Models Test (Standard)

Language Models Test (Extended)

Multi-Modal Models Test (Standard)

Multi-Modal Models Test (Extended) 1

Multi-Modal Models Test (Extended) 2

Custom Models Test

Distributed Comm Ops Test

2 Node Tests (4 GPUs in total)
./.buildkite/scripts/run-multi-node-test.sh /vllm-workspace/tests 2 2 public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:89ea6a23db8695fa84b09d260a923c5be810443e "VLLM_TEST_SAME_HOST=0 torchrun --nnodes 2 --nproc-per-node=2 --rdzv_backend=c10d --rdzv_endpoint=192.168.10.10 distributed/test_same_node.py | grep 'Same node test passed' && VLLM_MULTI_NODE=1 pytest -v -s distributed/test_multi_node_assignment.py && VLLM_MULTI_NODE=1 pytest -v -s distributed/test_pipeline_parallel.py" "VLLM_TEST_SAME_HOST=0 torchrun --nnodes 2 --nproc-per-node=2 --rdzv_backend=c10d --rdzv_endpoint=192.168.10.10 distributed/test_same_node.py | grep 'Same node test passed'"

Distributed Tests (2 GPUs)

Plugin Tests (2 GPUs)

Multi-step Tests (4 GPUs)

Pipeline Parallelism Test

LoRA TP Test (Distributed)

Weight Loading Multiple GPU Test

Weight Loading Multiple GPU Test - Large Models

Distributed Tests (A100)

LM Eval Large Models

AMD:

build image
grep -i 'from base as test' docker/Dockerfile.rocm && docker build --build-arg max_jobs=16 --tag rocm/vllm-ci:89ea6a23db8695fa84b09d260a923c5be810443e -f docker/Dockerfile.rocm --target test --progress plain . || docker build --build-arg max_jobs=16 --tag rocm/vllm-ci:89ea6a23db8695fa84b09d260a923c5be810443e -f docker/Dockerfile.rocm --progress plain . && docker push rocm/vllm-ci:89ea6a23db8695fa84b09d260a923c5be810443e

Ran in 22m 23s

AMD: Core Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s core"

Ran in 22m 15s

AMD: Metrics, Tracing Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s metrics && pytest -v -s tracing"

Ran in 21m 19s

AMD: Engine Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s engine test_sequence.py test_config.py test_logger.py && pytest -v -s tokenization"

Ran in 24m 11s

AMD: Prefix Caching Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s prefix_caching"

Ran in 16m 52s

AMD: LogitsProcessor Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s test_logits_processor.py && pytest -v -s model_executor/test_guided_processors.py"

Ran in 11m 4s

AMD: Benchmarks
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/.buildkite ; bash scripts/run-benchmarks.sh"

Ran in 11m 26s

AMD: Custom Models Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; echo 'Testing custom models...'"

Ran in 8m 0s

AMD: Distributed Comm Ops Test
bash .buildkite/scripts/hardware_ci/run-amd-test.sh "(command rocm-smi || true) && export VLLM_LOGGING_LEVEL=DEBUG && export VLLM_ALLOW_DEPRECATED_BEAM_SEARCH=1 && cd /vllm-workspace/tests ; pytest -v -s distributed/test_comm_ops.py && pytest -v -s distributed/test_shm_broadcast.py"

Ran in 4m 3s

Neuron Test
bash .buildkite/scripts/hardware_ci/run-neuron-test.sh

Ran in 3m 48s

Intel CPU Test
bash .buildkite/scripts/hardware_ci/run-cpu-test.sh

Intel HPU Test
bash .buildkite/scripts/hardware_ci/run-hpu-test.sh

Ran in 1m 20s

Intel GPU Test
bash .buildkite/scripts/hardware_ci/run-xpu-test.sh

Ran in 2m 29s

Harry Mellor unblocked Run IBM Power(ppc64le) CPU Test
Friday at 6:13 PM

IBM Power(ppc64le) CPU Test
bash .buildkite/scripts/hardware_ci/run-cpu-test-ppc64le.sh

Ran in 33m 37s

TPU V0 Test
yes | docker system prune -a && if [[ -f ".buildkite/scripts/hardware_ci/run-tpu-test.sh" ]]; then bash .buildkite/scripts/hardware_ci/run-tpu-test.sh; fi

Ran in 1s

TPU V1 Test
if [[ -f ".buildkite/scripts/hardware_ci/run-tpu-v1-test.sh" ]]; then bash .buildkite/scripts/hardware_ci/run-tpu-v1-test.sh; fi && yes | docker system prune -a

Ran in 35m 15s

Total Job Run Time: 4h 16m