Skip to content

Commit 8ce8954

Browse files
youkaichao and huydhn
authored and committed
Update release pipeline post PyTorch 2.8.0 update (vllm-project#24073)
Signed-off-by: Huy Do <[email protected]> Signed-off-by: youkaichao <[email protected]> Co-authored-by: Huy Do <[email protected]>
1 parent 232fc8c commit 8ce8954

File tree

3 files changed

+29
-27
lines changed

3 files changed

+29
-27
lines changed

.buildkite/release-pipeline.yaml

Lines changed: 16 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -1,21 +1,24 @@
11
steps:
2-
# aarch64 + CUDA builds
3-
- label: "Build arm64 wheel - CUDA 12.8"
4-
id: build-wheel-arm64-cuda-12-8
2+
# aarch64 + CUDA builds. PyTorch 2.8 aarch64 + CUDA wheel is only available on CUDA 12.9
3+
- label: "Build arm64 wheel - CUDA 12.9"
4+
id: build-wheel-arm64-cuda-12-9
55
agents:
66
queue: arm64_cpu_queue_postmerge
77
commands:
88
# #NOTE: torch_cuda_arch_list is derived from upstream PyTorch build files here:
99
# https://github.com/pytorch/pytorch/blob/main/.ci/aarch64_linux/aarch64_ci_build.sh#L7
10-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.8.1 --build-arg torch_cuda_arch_list='8.7 9.0 10.0+PTX 12.0' --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
10+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --build-arg torch_cuda_arch_list='8.7 9.0 10.0+PTX 12.0' --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
1111
- "mkdir artifacts"
1212
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
1313
- "bash .buildkite/scripts/upload-wheels.sh"
1414
env:
1515
DOCKER_BUILDKIT: "1"
1616

17-
# x86 + CUDA builds
17+
- block: "Build CUDA 12.8 wheel"
18+
key: block-build-cu128-wheel
19+
1820
- label: "Build wheel - CUDA 12.8"
21+
depends_on: block-build-cu128-wheel
1922
id: build-wheel-cuda-12-8
2023
agents:
2124
queue: cpu_queue_postmerge
@@ -44,18 +47,14 @@ steps:
4447
env:
4548
DOCKER_BUILDKIT: "1"
4649

47-
# Note(simon): We can always build CUDA 11.8 wheel to ensure the build is working.
48-
# However, this block can be uncommented to save some compute hours.
49-
# - block: "Build CUDA 11.8 wheel"
50-
# key: block-build-cu118-wheel
51-
52-
- label: "Build wheel - CUDA 11.8"
53-
# depends_on: block-build-cu118-wheel
54-
id: build-wheel-cuda-11-8
50+
# x86 + CUDA builds
51+
- label: "Build wheel - CUDA 12.9"
52+
depends_on: ~
53+
id: build-wheel-cuda-12-9
5554
agents:
5655
queue: cpu_queue_postmerge
5756
commands:
58-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=11.8.0 --build-arg torch_cuda_arch_list='7.0 7.5 8.0 8.9 9.0+PTX' --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
57+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --build-arg torch_cuda_arch_list='7.0 7.5 8.0 8.9 9.0+PTX' --tag vllm-ci:build-image --target build --progress plain -f docker/Dockerfile ."
5958
- "mkdir artifacts"
6059
- "docker run --rm -v $(pwd)/artifacts:/artifacts_host vllm-ci:build-image bash -c 'cp -r dist /artifacts_host && chmod -R a+rw /artifacts_host'"
6160
- "bash .buildkite/scripts/upload-wheels.sh"
@@ -75,14 +74,15 @@ steps:
7574
- "docker tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT"
7675
- "docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT"
7776

77+
# PyTorch 2.8 aarch64 + CUDA wheel is only available on CUDA 12.9
7878
- label: "Build release image (arm64)"
7979
depends_on: ~
8080
id: build-release-image-arm64
8181
agents:
8282
queue: arm64_cpu_queue_postmerge
8383
commands:
8484
- "aws ecr-public get-login-password --region us-east-1 | docker login --username AWS --password-stdin public.ecr.aws/q9t5s3a7"
85-
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.8.1 --build-arg torch_cuda_arch_list='8.7 9.0 10.0+PTX 12.0' --build-arg INSTALL_KV_CONNECTORS=true --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) --target vllm-openai --progress plain -f docker/Dockerfile ."
85+
- "DOCKER_BUILDKIT=1 docker build --build-arg max_jobs=16 --build-arg USE_SCCACHE=1 --build-arg GIT_REPO_CHECK=1 --build-arg CUDA_VERSION=12.9.1 --build-arg torch_cuda_arch_list='8.7 9.0 10.0+PTX 12.0' --build-arg INSTALL_KV_CONNECTORS=true --tag public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m) --target vllm-openai --progress plain -f docker/Dockerfile ."
8686
- "docker push public.ecr.aws/q9t5s3a7/vllm-release-repo:$BUILDKITE_COMMIT-$(uname -m)"
8787

8888
# Add job to create multi-arch manifest
@@ -103,7 +103,7 @@ steps:
103103
- create-multi-arch-manifest
104104
- build-wheel-cuda-12-8
105105
- build-wheel-cuda-12-6
106-
- build-wheel-cuda-11-8
106+
- build-wheel-cuda-12-9
107107
id: annotate-release-workflow
108108
agents:
109109
queue: cpu_queue_postmerge

.buildkite/scripts/upload-wheels.sh

Lines changed: 12 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -58,14 +58,15 @@ python3 .buildkite/generate_index.py --wheel "$normal_wheel"
5858
aws s3 cp "$wheel" "s3://vllm-wheels/$BUILDKITE_COMMIT/"
5959
aws s3 cp "$normal_wheel" "s3://vllm-wheels/$BUILDKITE_COMMIT/"
6060

61-
if [[ $normal_wheel == *"cu118"* ]]; then
62-
# if $normal_wheel matches cu118, do not upload the index.html
63-
echo "Skipping index files for cu118 wheels"
64-
elif [[ $normal_wheel == *"cu126"* ]]; then
61+
if [[ $normal_wheel == *"cu126"* ]]; then
6562
# if $normal_wheel matches cu126, do not upload the index.html
6663
echo "Skipping index files for cu126 wheels"
64+
elif [[ $normal_wheel == *"cu128"* ]]; then
65+
# if $normal_wheel matches cu128, do not upload the index.html
66+
echo "Skipping index files for cu128 wheels"
6767
else
68-
# only upload index.html for cu128 wheels (default wheels)
68+
# only upload index.html for cu129 wheels (default wheels) as it
69+
# is available on both x86 and arm64
6970
aws s3 cp index.html "s3://vllm-wheels/$BUILDKITE_COMMIT/vllm/index.html"
7071
aws s3 cp "s3://vllm-wheels/nightly/index.html" "s3://vllm-wheels/$BUILDKITE_COMMIT/index.html"
7172
fi
@@ -74,14 +75,15 @@ fi
7475
aws s3 cp "$wheel" "s3://vllm-wheels/nightly/"
7576
aws s3 cp "$normal_wheel" "s3://vllm-wheels/nightly/"
7677

77-
if [[ $normal_wheel == *"cu118"* ]]; then
78-
# if $normal_wheel matches cu118, do not upload the index.html
79-
echo "Skipping index files for cu118 wheels"
80-
elif [[ $normal_wheel == *"cu126"* ]]; then
78+
if [[ $normal_wheel == *"cu126"* ]]; then
8179
# if $normal_wheel matches cu126, do not upload the index.html
8280
echo "Skipping index files for cu126 wheels"
81+
elif [[ $normal_wheel == *"cu128"* ]]; then
82+
# if $normal_wheel matches cu128, do not upload the index.html
83+
echo "Skipping index files for cu128 wheels"
8384
else
84-
# only upload index.html for cu128 wheels (default wheels)
85+
# only upload index.html for cu129 wheels (default wheels) as it
86+
# is available on both x86 and arm64
8587
aws s3 cp index.html "s3://vllm-wheels/nightly/vllm/index.html"
8688
fi
8789

tools/install_deepgemm.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -105,4 +105,4 @@ fi
105105

106106
popd
107107

108-
echo "✅ DeepGEMM installation completed successfully"
108+
echo "✅ DeepGEMM installation completed successfully"

0 commit comments

Comments
 (0)