11steps :
2- # aarch64 + CUDA builds. PyTorch 2.8 aarch64 + CUDA wheel is only available on CUDA 12.9
2+ # aarch64 + CUDA builds
33 - label : " Build arm64 wheel - CUDA 12.9"
44 depends_on : ~
55 id : build-wheel-arm64-cuda-12-9
@@ -15,20 +15,21 @@ steps:
1515 env :
1616 DOCKER_BUILDKIT : " 1"
1717
18- # aarch64 build.
18+ # aarch64 build
1919 - label : " Build arm64 CPU wheel"
2020 depends_on : ~
2121 id : build-wheel-arm64-cpu
2222 agents :
2323 queue : arm64_cpu_queue_postmerge
2424 commands :
25- - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile.cpu ."
25+ - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg VLLM_BUILD_ACL=ON --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile.cpu ."
2626 - " mkdir artifacts"
2727 - " docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
2828 - " bash .buildkite/scripts/upload-wheels.sh"
2929 env :
3030 DOCKER_BUILDKIT : " 1"
3131
32+ # x86 + CUDA builds
3233 - label : " Build wheel - CUDA 12.8"
3334 depends_on : ~
3435 id : build-wheel-cuda-12-8
@@ -42,47 +43,46 @@ steps:
4243 env :
4344 DOCKER_BUILDKIT : " 1"
4445
45- - label : " Build wheel - CUDA 12.6 "
46+ - label : " Build wheel - CUDA 12.9 "
4647 depends_on : ~
47- id : build-wheel-cuda-12-6
48+ id : build-wheel-cuda-12-9
4849 agents :
4950 queue : cpu_queue_postmerge
5051 commands :
51- - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.6.3 --build-arg torch_cuda_arch_list='7.0 7.5 8.0 8.9 9.0+PTX' --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
52+ - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
5253 - " mkdir artifacts"
5354 - " docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
5455 - " bash .buildkite/scripts/upload-wheels.sh"
5556 env :
5657 DOCKER_BUILDKIT : " 1"
5758
58- # x86 + CUDA builds
59- - label : " Build wheel - CUDA 12.9"
59+ - label : " Build wheel - CUDA 13.0"
6060 depends_on : ~
61- id : build-wheel-cuda-12-9
61+ id : build-wheel-cuda-13-0
6262 agents :
6363 queue : cpu_queue_postmerge
6464 commands :
65- - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
65+ - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=13.0.1 --build-arg BUILD_BASE_IMAGE=nvidia/cuda:13.0.1-devel-ubuntu22.04 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
6666 - " mkdir artifacts"
6767 - " docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
6868 - " bash .buildkite/scripts/upload-wheels.sh"
6969 env :
7070 DOCKER_BUILDKIT : " 1"
7171
72+ # Build release images (12.9)
7273 - label : " Build release image (x86)"
7374 depends_on : ~
7475 id : build-release-image-x86
7576 agents :
7677 queue : cpu_queue_postmerge
7778 commands :
7879 - " aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7"
79- - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.8.1 --build-arg FLASHINFER_AOT_COMPILE=true --build-arg INSTALL_KV_CONNECTORS=true --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) --target vllm-openai --progress plain -f docker/Dockerfile ."
80+ - " DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --build-arg FLASHINFER_AOT_COMPILE=true --build-arg INSTALL_KV_CONNECTORS=true --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) --target vllm-openai --progress plain -f docker/Dockerfile ."
8081 - " docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m)"
8182 # re-tag to default image tag and push, just in case arm64 build fails
8283 - " docker tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT"
8384 - " docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT"
8485
85- # PyTorch 2.8 aarch64 + CUDA wheel is only available on CUDA 12.9
8686 - label : " Build release image (arm64)"
8787 depends_on : ~
8888 id : build-release-image-arm64
0 commit comments