|
5 | 5 | TORCH_CUDA_ARCH_LIST: 9.0a
|
6 | 6 | VLLM_FA_CMAKE_GPU_ARCHES: 90a-real
|
7 | 7 | TRITON_REF: release/3.2.x
|
8 |
| - TRITON_BUILD_VERSION: 3.2.0 |
| 8 | + TRITON_BUILD_SUFFIX: +cu126 |
9 | 9 | XFORMERS_REF: v0.0.29.post2
|
10 |
| - XFORMERS_BUILD_VERSION: 0.0.29.post2 |
| 10 | + XFORMERS_BUILD_VERSION: 0.0.29.post2+cu126 |
11 | 11 | FLASHINFER_REF: v0.2.2.post1
|
12 |
| - FLASHINFER_BUILD_VERSION: 0.2.2.post1 |
13 |
| - VLLM_REF: v0.8.0 |
14 |
| - VLLM_BUILD_VERSION: 0.8.0 |
| 12 | + FLASHINFER_BUILD_SUFFIX: cu126 |
| 13 | + VLLM_REF: v0.8.0rc2 |
15 | 14 |
|
16 | 15 | on:
|
17 | 16 | push:
|
@@ -54,25 +53,22 @@ jobs:
|
54 | 53 | build-args: |
|
55 | 54 | CUDA_VERSION=${{ matrix.cuda_version }}
|
56 | 55 | IMAGE_DISTRO=${{ matrix.image_distro }}
|
57 |
| - MAX_JOBS=${{ env.MAX_JOBS }} |
58 |
| - NVCC_THREADS=${{ env.NVCC_THREADS }} |
59 | 56 | TORCH_CUDA_ARCH_LIST=${{ env.TORCH_CUDA_ARCH_LIST }}
|
60 | 57 | VLLM_FA_CMAKE_GPU_ARCHES=${{ env.VLLM_FA_CMAKE_GPU_ARCHES }}
|
61 | 58 | TRITON_REF=${{ env.TRITON_REF }}
|
62 |
| - TRITON_BUILD_VERSION=${{ env.TRITON_BUILD_VERSION }} |
| 59 | + TRITON_BUILD_SUFFIX=${{ env.TRITON_BUILD_SUFFIX }} |
63 | 60 | XFORMERS_REF=${{ env.XFORMERS_REF }}
|
64 | 61 | XFORMERS_BUILD_VERSION=${{ env.XFORMERS_BUILD_VERSION }}
|
65 | 62 | FLASHINFER_REF=${{ env.FLASHINFER_REF }}
|
66 |
| - FLASHINFER_BUILD_VERSION=${{ env.FLASHINFER_BUILD_VERSION }} |
| 63 | + FLASHINFER_BUILD_SUFFIX=${{ env.FLASHINFER_BUILD_SUFFIX }} |
67 | 64 | VLLM_REF=${{ env.VLLM_REF }}
|
68 |
| - VLLM_BUILD_VERSION=${{ env.VLLM_BUILD_VERSION }} |
69 | 65 | cache-from: type=registry,ref=${{ env.GHCR_IMAGE }}:cache-cu${{ env.CUDA_TAG }}-${{ matrix.arch }}
|
70 | 66 | cache-to: type=registry,ref=${{ env.GHCR_IMAGE }}:cache-cu${{ env.CUDA_TAG }}-${{ matrix.arch }},mode=max
|
71 | 67 | context: .
|
72 | 68 | file: Dockerfile
|
73 | 69 | platforms: linux/${{ matrix.arch }}
|
74 | 70 | push: true
|
75 |
| - tags: ${{ env.GHCR_IMAGE }}:${{ env.VLLM_BUILD_VERSION }}-cu${{ env.CUDA_TAG }}-${{ matrix.arch }} |
| 71 | + tags: ${{ env.GHCR_IMAGE }}:${{ env.VLLM_REF }}-cu${{ env.CUDA_TAG }}-${{ matrix.arch }} |
76 | 72 |
|
77 | 73 | # Fix this to use matrix and handle imagetools create --append
|
78 | 74 | ghcr:
|
|
93 | 89 |
|
94 | 90 | - name: Tag images
|
95 | 91 | run: |
|
96 |
| - TAGS=(${VLLM_BUILD_VERSION}-cu${CUDA_TAG}-{amd,arm}64) |
97 |
| - docker buildx imagetools create -t ${GHCR_IMAGE}:${VLLM_BUILD_VERSION} ${TAGS[@]/#/${GHCR_IMAGE}:} |
| 92 | + TAGS=(${VLLM_REF}-cu${CUDA_TAG}-{amd,arm}64) |
| 93 | + docker buildx imagetools create -t ${GHCR_IMAGE}:${VLLM_REF} ${TAGS[@]/#/${GHCR_IMAGE}:} |
98 | 94 | docker buildx imagetools create -t ${GHCR_IMAGE}:latest ${TAGS[@]/#/${GHCR_IMAGE}:}
|
0 commit comments