Skip to content

Commit a2617b1

Browse files
committed
Update package version mapping
1 parent 8372362 commit a2617b1

File tree

2 files changed

+15
-21
lines changed

2 files changed

+15
-21
lines changed

.github/workflows/build-vllm.yaml

+9 -13
Original file line number | Diff line number | Diff line change
@@ -5,13 +5,12 @@ env:
55
TORCH_CUDA_ARCH_LIST: 9.0a
66
VLLM_FA_CMAKE_GPU_ARCHES: 90a-real
77
TRITON_REF: release/3.2.x
8-
TRITON_BUILD_VERSION: 3.2.0
8+
TRITON_BUILD_SUFFIX: +cu126
99
XFORMERS_REF: v0.0.29.post2
10-
XFORMERS_BUILD_VERSION: 0.0.29.post2
10+
XFORMERS_BUILD_VERSION: 0.0.29.post2+cu126
1111
FLASHINFER_REF: v0.2.2.post1
12-
FLASHINFER_BUILD_VERSION: 0.2.2.post1
13-
VLLM_REF: v0.8.0
14-
VLLM_BUILD_VERSION: 0.8.0
12+
FLASHINFER_BUILD_SUFFIX: cu126
13+
VLLM_REF: v0.8.0rc2
1514

1615
on:
1716
push:
@@ -54,25 +53,22 @@ jobs:
5453
build-args: |
5554
CUDA_VERSION=${{ matrix.cuda_version }}
5655
IMAGE_DISTRO=${{ matrix.image_distro }}
57-
MAX_JOBS=${{ env.MAX_JOBS }}
58-
NVCC_THREADS=${{ env.NVCC_THREADS }}
5956
TORCH_CUDA_ARCH_LIST=${{ env.TORCH_CUDA_ARCH_LIST }}
6057
VLLM_FA_CMAKE_GPU_ARCHES=${{ env.VLLM_FA_CMAKE_GPU_ARCHES }}
6158
TRITON_REF=${{ env.TRITON_REF }}
62-
TRITON_BUILD_VERSION=${{ env.TRITON_BUILD_VERSION }}
59+
TRITON_BUILD_SUFFIX=${{ env.TRITON_BUILD_SUFFIX }}
6360
XFORMERS_REF=${{ env.XFORMERS_REF }}
6461
XFORMERS_BUILD_VERSION=${{ env.XFORMERS_BUILD_VERSION }}
6562
FLASHINFER_REF=${{ env.FLASHINFER_REF }}
66-
FLASHINFER_BUILD_VERSION=${{ env.FLASHINFER_BUILD_VERSION }}
63+
FLASHINFER_BUILD_SUFFIX=${{ env.FLASHINFER_BUILD_SUFFIX }}
6764
VLLM_REF=${{ env.VLLM_REF }}
68-
VLLM_BUILD_VERSION=${{ env.VLLM_BUILD_VERSION }}
6965
cache-from: type=registry,ref=${{ env.GHCR_IMAGE }}:cache-cu${{ env.CUDA_TAG }}-${{ matrix.arch }}
7066
cache-to: type=registry,ref=${{ env.GHCR_IMAGE }}:cache-cu${{ env.CUDA_TAG }}-${{ matrix.arch }},mode=max
7167
context: .
7268
file: Dockerfile
7369
platforms: linux/${{ matrix.arch }}
7470
push: true
75-
tags: ${{ env.GHCR_IMAGE }}:${{ env.VLLM_BUILD_VERSION }}-cu${{ env.CUDA_TAG }}-${{ matrix.arch }}
71+
tags: ${{ env.GHCR_IMAGE }}:${{ env.VLLM_REF }}-cu${{ env.CUDA_TAG }}-${{ matrix.arch }}
7672

7773
# Fix this to use matrix and handle imagetools create --append
7874
ghcr:
@@ -93,6 +89,6 @@ jobs:
9389

9490
- name: Tag images
9591
run: |
96-
TAGS=(${VLLM_BUILD_VERSION}-cu${CUDA_TAG}-{amd,arm}64)
97-
docker buildx imagetools create -t ${GHCR_IMAGE}:${VLLM_BUILD_VERSION} ${TAGS[@]/#/${GHCR_IMAGE}:}
92+
TAGS=(${VLLM_REF}-cu${CUDA_TAG}-{amd,arm}64)
93+
docker buildx imagetools create -t ${GHCR_IMAGE}:${VLLM_REF} ${TAGS[@]/#/${GHCR_IMAGE}:}
9894
docker buildx imagetools create -t ${GHCR_IMAGE}:latest ${TAGS[@]/#/${GHCR_IMAGE}:}

Dockerfile

+6 -8
Original file line number | Diff line number | Diff line change
@@ -57,8 +57,8 @@ RUN uv pip install -U build cmake ninja pybind11 setuptools wheel
5757

5858
FROM build-base AS build-triton
5959
ARG TRITON_REF=release/3.2.x
60-
ARG TRITON_BUILD_VERSION=3.2.0
61-
ENV BUILD_VERSION=${TRITON_BUILD_VERSION:-${TRITON_REF#v}}
60+
ARG TRITON_BUILD_SUFFIX=+cu126
61+
ENV TRITON_WHEEL_VERSION_SUFFIX=${TRITON_BUILD_SUFFIX:-}
6262
RUN git clone https://github.com/triton-lang/triton.git
6363
RUN cd triton && \
6464
git checkout ${TRITON_REF} && \
@@ -68,7 +68,7 @@ RUN cd triton && \
6868

6969
FROM build-base AS build-xformers
7070
ARG XFORMERS_REF=v0.0.29.post2
71-
ARG XFORMERS_BUILD_VERSION=0.0.29.post2
71+
ARG XFORMERS_BUILD_VERSION=0.0.29.post2+cu126
7272
ENV BUILD_VERSION=${XFORMERS_BUILD_VERSION:-${XFORMERS_REF#v}}
7373
RUN git clone https://github.com/facebookresearch/xformers.git
7474
RUN cd xformers && \
@@ -80,8 +80,8 @@ RUN cd xformers && \
8080
FROM build-base AS build-flashinfer
8181
ARG FLASHINFER_ENABLE_AOT=1
8282
ARG FLASHINFER_REF=v0.2.2.post1
83-
ARG FLASHINFER_BUILD_VERSION=0.2.2.post1
84-
ENV FLASHINFER_LOCAL_VERSION=${FLASHINFER_BUILD_VERSION:-${FLASHINFER_REF#v}}
83+
ARG FLASHINFER_BUILD_SUFFIX=cu126
84+
ENV FLASHINFER_LOCAL_VERSION=${FLASHINFER_BUILD_SUFFIX:-}
8585
RUN git clone https://github.com/flashinfer-ai/flashinfer.git
8686
RUN cd flashinfer && \
8787
git checkout ${FLASHINFER_REF} && \
@@ -90,9 +90,7 @@ RUN cd flashinfer && \
9090
uv build --wheel --no-build-isolation -o /wheels
9191

9292
FROM build-base AS build-vllm
93-
ARG VLLM_REF=v0.8.0
94-
ARG VLLM_BUILD_VERSION=0.8.0
95-
ENV BUILD_VERSION=${VLLM_BUILD_VERSION:-${VLLM_REF#v}}
93+
ARG VLLM_REF=v0.8.0rc2
9694
RUN git clone https://github.com/vllm-project/vllm.git
9795
RUN cd vllm && \
9896
git checkout ${VLLM_REF} && \

0 commit comments

Comments
 (0)