Skip to content

Commit 5d80096

Browse files
huydhn authored and ilmarkov committed
Update release pipeline for PyTorch 2.9.0 (vllm-project#27303)
Signed-off-by: Huy Do <huydhn@gmail.com>
1 parent ce15379 commit 5d80096

File tree

3 files changed

+19
-27
lines changed

3 files changed

+19
-27
lines changed

.buildkite/release-pipeline.yaml

Lines changed: 12 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
steps:
2-
# aarch64 + CUDA builds. PyTorch 2.8 aarch64 + CUDA wheel is only available on CUDA 12.9
2+
# aarch64 + CUDA builds
33
- label: "Build arm64 wheel - CUDA 12.9"
44
depends_on: ~
55
id: build-wheel-arm64-cuda-12-9
@@ -15,20 +15,21 @@ steps:
1515
env:
1616
DOCKER_BUILDKIT: "1"
1717

18-
# aarch64 build.
18+
# aarch64 build
1919
- label: "Build arm64 CPU wheel"
2020
depends_on: ~
2121
id: build-wheel-arm64-cpu
2222
agents:
2323
queue: arm64_cpu_queue_postmerge
2424
commands:
25-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile.cpu ."
25+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg VLLM_BUILD_ACL=ON --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile.cpu ."
2626
- "mkdir artifacts"
2727
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
2828
- "bash .buildkite/scripts/upload-wheels.sh"
2929
env:
3030
DOCKER_BUILDKIT: "1"
3131

32+
# x86 + CUDA builds
3233
- label: "Build wheel - CUDA 12.8"
3334
depends_on: ~
3435
id: build-wheel-cuda-12-8
@@ -42,47 +43,46 @@ steps:
4243
env:
4344
DOCKER_BUILDKIT: "1"
4445

45-
- label: "Build wheel - CUDA 12.6"
46+
- label: "Build wheel - CUDA 12.9"
4647
depends_on: ~
47-
id: build-wheel-cuda-12-6
48+
id: build-wheel-cuda-12-9
4849
agents:
4950
queue: cpu_queue_postmerge
5051
commands:
51-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.6.3 --build-arg torch_cuda_arch_list='7.0 7.5 8.0 8.9 9.0+PTX' --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
52+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
5253
- "mkdir artifacts"
5354
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
5455
- "bash .buildkite/scripts/upload-wheels.sh"
5556
env:
5657
DOCKER_BUILDKIT: "1"
5758

58-
# x86 + CUDA builds
59-
- label: "Build wheel - CUDA 12.9"
59+
- label: "Build wheel - CUDA 13.0"
6060
depends_on: ~
61-
id: build-wheel-cuda-12-9
61+
id: build-wheel-cuda-13-0
6262
agents:
6363
queue: cpu_queue_postmerge
6464
commands:
65-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
65+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=13.0.1 --build-arg BUILD_BASE_IMAGE=nvidia/cuda:13.0.1-devel-ubuntu22.04 --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
6666
- "mkdir artifacts"
6767
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
6868
- "bash .buildkite/scripts/upload-wheels.sh"
6969
env:
7070
DOCKER_BUILDKIT: "1"
7171

72+
# Build release images (12.9)
7273
- label: "Build release image (x86)"
7374
depends_on: ~
7475
id: build-release-image-x86
7576
agents:
7677
queue: cpu_queue_postmerge
7778
commands:
7879
- "aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7"
79-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.8.1 --build-arg FLASHINFER_AOT_COMPILE=true --build-arg INSTALL_KV_CONNECTORS=true --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) --target vllm-openai --progress plain -f docker/Dockerfile ."
80+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --build-arg FLASHINFER_AOT_COMPILE=true --build-arg INSTALL_KV_CONNECTORS=true --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) --target vllm-openai --progress plain -f docker/Dockerfile ."
8081
- "docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m)"
8182
# re-tag to default image tag and push, just in case arm64 build fails
8283
- "docker tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT"
8384
- "docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT"
8485

85-
# PyTorch 2.8 aarch64 + CUDA wheel is only available on CUDA 12.9
8686
- label: "Build release image (arm64)"
8787
depends_on: ~
8888
id: build-release-image-arm64

.buildkite/scripts/upload-wheels.sh

Lines changed: 6 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -58,33 +58,25 @@ python3 .buildkite/generate_index.py --wheel "$normal_wheel"
5858
aws s3 cp "$wheel" "s3://vllm-wheels/$BUILDKITE_COMMIT/"
5959
aws s3 cp "$normal_wheel" "s3://vllm-wheels/$BUILDKITE_COMMIT/"
6060

61-
if [[ $normal_wheel == *"cu126"* ]]; then
62-
# if $normal_wheel matches cu126, do not upload the index.html
63-
echo "Skipping index files for cu126 wheels"
64-
elif [[ $normal_wheel == *"cu128"* ]]; then
65-
# if $normal_wheel matches cu128, do not upload the index.html
66-
echo "Skipping index files for cu128 wheels"
67-
else
61+
if [[ $normal_wheel == *"cu129"* ]]; then
6862
# only upload index.html for cu129 wheels (default wheels) as it
6963
# is available on both x86 and arm64
7064
aws s3 cp index.html "s3://vllm-wheels/$BUILDKITE_COMMIT/vllm/index.html"
7165
aws s3 cp "s3://vllm-wheels/nightly/index.html" "s3://vllm-wheels/$BUILDKITE_COMMIT/index.html"
66+
else
67+
echo "Skipping index files for non-cu129 wheels"
7268
fi
7369

7470
# generate index for nightly
7571
aws s3 cp "$wheel" "s3://vllm-wheels/nightly/"
7672
aws s3 cp "$normal_wheel" "s3://vllm-wheels/nightly/"
7773

78-
if [[ $normal_wheel == *"cu126"* ]]; then
79-
# if $normal_wheel matches cu126, do not upload the index.html
80-
echo "Skipping index files for cu126 wheels"
81-
elif [[ $normal_wheel == *"cu128"* ]]; then
82-
# if $normal_wheel matches cu128, do not upload the index.html
83-
echo "Skipping index files for cu128 wheels"
84-
else
74+
if [[ $normal_wheel == *"cu129"* ]]; then
8575
# only upload index.html for cu129 wheels (default wheels) as it
8676
# is available on both x86 and arm64
8777
aws s3 cp index.html "s3://vllm-wheels/nightly/vllm/index.html"
78+
else
79+
echo "Skipping index files for non-cu129 wheels"
8880
fi
8981

9082
aws s3 cp "$wheel" "s3://vllm-wheels/$version/"

docker/Dockerfile.cpu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -31,7 +31,7 @@ ARG PIP_EXTRA_INDEX_URL="https://download.pytorch.org/whl/cpu"
3131
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
3232
--mount=type=cache,target=/var/lib/apt,sharing=locked \
3333
apt-get update -y \
34-
&& apt-get install -y --no-install-recommends ccache git curl wget ca-certificates \
34+
&& apt-get install -y --no-install-recommends sudo ccache git curl wget ca-certificates \
3535
gcc-12 g++-12 libtcmalloc-minimal4 libnuma-dev ffmpeg libsm6 libxext6 libgl1 jq lsof \
3636
&& update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-12 10 --slave /usr/bin/g++ g++ /usr/bin/g++-12 \
3737
&& curl -LsSf https://astral.sh/uv/install.sh | sh

0 commit comments

Comments
 (0)