-
Notifications
You must be signed in to change notification settings - Fork 53
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Separates the workflows for building the RAPIDS end user images and the cuVS images. The cuVS images do not depend on the RAPIDS end user images, so they can be built in parallel. This also allows for finer grained retries in case of failures. Also switches to using `rapids-mamba-retry` for installing conda packages. Finally, disables building the `cuvs-bench-datasets` images which are consistently failing (#724) until a better solution than the workaround in #723 is ready. 5adab54 can be reverted to re-enable this. Authors: - Ray Douglass (https://github.com/raydouglass) Approvers: - Jake Awe (https://github.com/AyodeAwe) URL: #725
- Loading branch information
1 parent
4f0424d
commit b2701d6
Showing
10 changed files
with
318 additions
and
159 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,110 @@ | ||
name: Build and push image variant | ||
|
||
on: | ||
workflow_call: | ||
inputs: | ||
ARCHES: | ||
required: true | ||
type: string | ||
CUDA_VER: | ||
required: true | ||
type: string | ||
LINUX_DISTRO: | ||
required: true | ||
type: string | ||
LINUX_DISTRO_VER: | ||
required: true | ||
type: string | ||
LINUX_VER: | ||
required: true | ||
type: string | ||
PYTHON_VER: | ||
required: true | ||
type: string | ||
RAPIDS_VER: | ||
required: true | ||
type: string | ||
BASE_TAG: | ||
required: true | ||
type: string | ||
NOTEBOOKS_TAG: | ||
required: true | ||
type: string | ||
|
||
jobs: | ||
build: | ||
strategy: | ||
matrix: | ||
ARCH: ${{ fromJSON(inputs.ARCHES) }} | ||
CUDA_VER: ["${{ inputs.CUDA_VER }}"] | ||
LINUX_VER: ["${{ inputs.LINUX_VER }}"] | ||
PYTHON_VER: ["${{ inputs.PYTHON_VER }}"] | ||
RAPIDS_VER: ["${{ inputs.RAPIDS_VER }}"] | ||
fail-fast: false | ||
runs-on: "linux-${{ matrix.ARCH }}-cpu4" | ||
steps: | ||
- name: Checkout | ||
uses: actions/checkout@v4 | ||
with: | ||
fetch-depth: 0 | ||
- name: Install gha-tools | ||
run: | | ||
mkdir -p /tmp/gha-tools | ||
curl -s -L 'https://github.com/rapidsai/gha-tools/releases/latest/download/tools.tar.gz' | tar -xz -C /tmp/gha-tools | ||
echo "/tmp/gha-tools" >> "${GITHUB_PATH}" | ||
- name: Clean up condarc for release builds | ||
run: | | ||
# Decide which conda channels the image build uses, based on the most recent
# git tag reachable from HEAD.
GIT_DESCRIBE_TAG="$(git describe --tags --abbrev=0)"
GIT_DESCRIBE_TAG="${GIT_DESCRIBE_TAG:1}" # remove leading 'v'
# After the first character is stripped, a tag that contains no lowercase
# letter is treated as a release tag; anything else is treated as an alpha.
if [[ ! $GIT_DESCRIBE_TAG =~ [a-z] ]]; then
  # Single quotes keep the backticks literal. Inside double quotes bash would
  # perform command substitution and try to execute `rapidsai`,
  # `rapidsai-nightly` and `dask/label/dev`, dropping them from the message.
  rapids-logger 'Most recent tag is for release, adding `rapidsai` channel and removing `rapidsai-nightly` and `dask/label/dev` channels.'
  # Replace the nightly channel with the release channel and delete the line
  # that mentions the dask dev label.
  sed -i 's|rapidsai-nightly|rapidsai|;\|dask/label/dev|d' context/condarc
else
  rapids-logger "Most recent tag is an alpha. Build will use nightly channels."
fi
- name: Login to DockerHub | ||
uses: docker/login-action@v3 | ||
with: | ||
username: ${{ secrets.GPUCIBOT_DOCKERHUB_USER }} | ||
password: ${{ secrets.GPUCIBOT_DOCKERHUB_TOKEN }} | ||
- name: Set up Docker Context for Buildx | ||
id: buildx-context | ||
run: | | ||
docker context create builders | ||
- name: Set up Docker Buildx | ||
uses: docker/setup-buildx-action@v3 | ||
with: | ||
driver: docker | ||
endpoint: builders | ||
- name: Build base image | ||
uses: docker/build-push-action@v6 | ||
with: | ||
context: context | ||
file: Dockerfile | ||
target: base | ||
push: true | ||
pull: true | ||
build-args: | | ||
CUDA_VER=${{ inputs.CUDA_VER }} | ||
LINUX_DISTRO=${{ inputs.LINUX_DISTRO }} | ||
LINUX_DISTRO_VER=${{ inputs.LINUX_DISTRO_VER }} | ||
LINUX_VER=${{ inputs.LINUX_VER }} | ||
PYTHON_VER=${{ inputs.PYTHON_VER }} | ||
RAPIDS_VER=${{ inputs.RAPIDS_VER }} | ||
tags: ${{ inputs.BASE_TAG }}-${{ matrix.ARCH }} | ||
- name: Build notebooks image | ||
uses: docker/build-push-action@v6 | ||
with: | ||
context: context | ||
file: Dockerfile | ||
target: notebooks | ||
push: true | ||
pull: true | ||
build-args: | | ||
CUDA_VER=${{ inputs.CUDA_VER }} | ||
LINUX_DISTRO=${{ inputs.LINUX_DISTRO }} | ||
LINUX_DISTRO_VER=${{ inputs.LINUX_DISTRO_VER }} | ||
LINUX_VER=${{ inputs.LINUX_VER }} | ||
PYTHON_VER=${{ inputs.PYTHON_VER }} | ||
RAPIDS_VER=${{ inputs.RAPIDS_VER }} | ||
tags: ${{ inputs.NOTEBOOKS_TAG }}-${{ matrix.ARCH }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -36,8 +36,10 @@ jobs: | |
needs: | ||
- checks | ||
- compute-matrix | ||
- build | ||
- build-multiarch-manifest | ||
- build-rapids | ||
- build-rapids-multiarch-manifest | ||
- build-cuvs | ||
- build-cuvs-multiarch-manifest | ||
- test | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
|
@@ -137,13 +139,13 @@ jobs: | |
export TEST_MATRIX | ||
echo "TEST_MATRIX=$(yq -n -o json 'env(TEST_MATRIX)' | jq -c '{include: .}')" | tee --append "${GITHUB_OUTPUT}" | ||
build: | ||
build-rapids: | ||
needs: [checks, compute-matrix] | ||
strategy: | ||
matrix: ${{ fromJSON(needs.compute-matrix.outputs.MATRIX) }} | ||
fail-fast: false | ||
secrets: inherit | ||
uses: ./.github/workflows/build-image.yml | ||
uses: ./.github/workflows/build-rapids-image.yml | ||
with: | ||
ARCHES: ${{ toJSON(matrix.ARCHES) }} | ||
CUDA_VER: ${{ matrix.CUDA_VER }} | ||
|
@@ -152,7 +154,6 @@ jobs: | |
LINUX_VER: ${{ matrix.LINUX_VER }} | ||
PYTHON_VER: ${{ matrix.PYTHON_VER }} | ||
RAPIDS_VER: ${{ needs.compute-matrix.outputs.RAPIDS_VER }} | ||
BUILD_CUVS_BENCH_CPU_IMAGE: ${{ matrix.BUILD_CUVS_BENCH_CPU_IMAGE }} | ||
BASE_TAG: | ||
"rapidsai/${{ needs.compute-matrix.outputs.BASE_IMAGE_REPO }}:\ | ||
${{ needs.compute-matrix.outputs.BASE_TAG_PREFIX }}\ | ||
|
@@ -167,6 +168,22 @@ jobs: | |
${{ needs.compute-matrix.outputs.ALPHA_TAG }}-\ | ||
cuda${{ matrix.CUDA_TAG }}-\ | ||
py${{ matrix.PYTHON_VER }}" | ||
build-cuvs: | ||
needs: [checks, compute-matrix] | ||
strategy: | ||
matrix: ${{ fromJSON(needs.compute-matrix.outputs.MATRIX) }} | ||
fail-fast: false | ||
secrets: inherit | ||
uses: ./.github/workflows/build-cuvs-image.yml | ||
with: | ||
ARCHES: ${{ toJSON(matrix.ARCHES) }} | ||
CUDA_VER: ${{ matrix.CUDA_VER }} | ||
LINUX_DISTRO: ${{ matrix.LINUX_DISTRO }} | ||
LINUX_DISTRO_VER: ${{ matrix.LINUX_DISTRO_VER }} | ||
LINUX_VER: ${{ matrix.LINUX_VER }} | ||
PYTHON_VER: ${{ matrix.PYTHON_VER }} | ||
RAPIDS_VER: ${{ needs.compute-matrix.outputs.RAPIDS_VER }} | ||
BUILD_CUVS_BENCH_CPU_IMAGE: ${{ matrix.BUILD_CUVS_BENCH_CPU_IMAGE }} | ||
CUVS_BENCH_TAG: | ||
"rapidsai/${{ needs.compute-matrix.outputs.CUVS_BENCH_IMAGE_REPO }}:\ | ||
${{ needs.compute-matrix.outputs.CUVS_BENCH_TAG_PREFIX }}\ | ||
|
@@ -187,8 +204,8 @@ jobs: | |
${{ needs.compute-matrix.outputs.RAPIDS_VER }}\ | ||
${{ needs.compute-matrix.outputs.ALPHA_TAG }}-\ | ||
py${{ matrix.PYTHON_VER }}" | ||
build-multiarch-manifest: | ||
needs: [build, compute-matrix] | ||
build-rapids-multiarch-manifest: | ||
needs: [build-rapids, compute-matrix] | ||
strategy: | ||
matrix: ${{ fromJSON(needs.compute-matrix.outputs.MATRIX) }} | ||
fail-fast: false | ||
|
@@ -206,7 +223,6 @@ jobs: | |
- name: Create multiarch manifest | ||
shell: bash | ||
env: | ||
CUVS_BENCH_CPU_IMAGE_BUILT: ${{ matrix.BUILD_CUVS_BENCH_CPU_IMAGE }} | ||
BASE_IMAGE_REPO: ${{ needs.compute-matrix.outputs.BASE_IMAGE_REPO }} | ||
BASE_TAG_PREFIX: ${{ needs.compute-matrix.outputs.BASE_TAG_PREFIX }} | ||
RAPIDS_VER: ${{ needs.compute-matrix.outputs.RAPIDS_VER }} | ||
|
@@ -215,6 +231,34 @@ jobs: | |
PYTHON_VER: ${{ matrix.PYTHON_VER }} | ||
NOTEBOOKS_IMAGE_REPO: ${{ needs.compute-matrix.outputs.NOTEBOOKS_IMAGE_REPO }} | ||
NOTEBOOKS_TAG_PREFIX: ${{ needs.compute-matrix.outputs.NOTEBOOKS_TAG_PREFIX }} | ||
GPUCIBOT_DOCKERHUB_USER: ${{ secrets.GPUCIBOT_DOCKERHUB_USER }} | ||
GPUCIBOT_DOCKERHUB_TOKEN: ${{ secrets.GPUCIBOT_DOCKERHUB_TOKEN }} | ||
ARCHES: ${{ toJSON(matrix.ARCHES) }} | ||
run: ci/create-rapids-multiarch-manifest.sh | ||
build-cuvs-multiarch-manifest: | ||
needs: [build-cuvs, compute-matrix] | ||
strategy: | ||
matrix: ${{ fromJSON(needs.compute-matrix.outputs.MATRIX) }} | ||
fail-fast: false | ||
runs-on: ubuntu-latest | ||
steps: | ||
- name: Checkout | ||
uses: actions/checkout@v4 | ||
with: | ||
fetch-depth: 0 | ||
- name: Login to DockerHub | ||
uses: docker/login-action@v3 | ||
with: | ||
username: ${{ secrets.GPUCIBOT_DOCKERHUB_USER }} | ||
password: ${{ secrets.GPUCIBOT_DOCKERHUB_TOKEN }} | ||
- name: Create multiarch manifest | ||
shell: bash | ||
env: | ||
RAPIDS_VER: ${{ needs.compute-matrix.outputs.RAPIDS_VER }} | ||
ALPHA_TAG: ${{ needs.compute-matrix.outputs.ALPHA_TAG }} | ||
CUDA_TAG: ${{ matrix.CUDA_TAG }} | ||
PYTHON_VER: ${{ matrix.PYTHON_VER }} | ||
CUVS_BENCH_CPU_IMAGE_BUILT: ${{ matrix.BUILD_CUVS_BENCH_CPU_IMAGE }} | ||
CUVS_BENCH_IMAGE_REPO: ${{ needs.compute-matrix.outputs.CUVS_BENCH_IMAGE_REPO }} | ||
CUVS_BENCH_TAG_PREFIX: ${{ needs.compute-matrix.outputs.CUVS_BENCH_TAG_PREFIX }} | ||
CUVS_BENCH_DATASETS_IMAGE_REPO: ${{ needs.compute-matrix.outputs.CUVS_BENCH_DATASETS_IMAGE_REPO }} | ||
|
@@ -224,9 +268,9 @@ jobs: | |
GPUCIBOT_DOCKERHUB_USER: ${{ secrets.GPUCIBOT_DOCKERHUB_USER }} | ||
GPUCIBOT_DOCKERHUB_TOKEN: ${{ secrets.GPUCIBOT_DOCKERHUB_TOKEN }} | ||
ARCHES: ${{ toJSON(matrix.ARCHES) }} | ||
run: ci/create-multiarch-manifest.sh | ||
run: ci/create-cuvs-multiarch-manifest.sh | ||
test: | ||
needs: [compute-matrix, build] | ||
needs: [compute-matrix, build-rapids] | ||
if: inputs.run_tests | ||
strategy: | ||
matrix: ${{ fromJSON(needs.compute-matrix.outputs.TEST_MATRIX) }} | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
#!/bin/bash | ||
|
||
set -eEuo pipefail | ||
|
||
# Authenticate against DockerHub and retrieve a JWT for later API calls.
# Required environment: GPUCIBOT_DOCKERHUB_USER, GPUCIBOT_DOCKERHUB_TOKEN.
#
# The request body is assembled by jq so that quotes or backslashes in the
# credentials cannot produce malformed JSON.
login_payload=$(
  jq -n -c \
    --arg username "${GPUCIBOT_DOCKERHUB_USER}" \
    --arg password "${GPUCIBOT_DOCKERHUB_TOKEN}" \
    '{username: $username, password: $password}'
)
# `.token // empty` yields an empty string instead of the literal "null" when
# the response carries no token (e.g. the login was rejected).
HUB_TOKEN=$(
  curl -s -H "Content-Type: application/json" \
    -X POST \
    -d "${login_payload}" \
    https://hub.docker.com/v2/users/login/ | jq -r '.token // empty'
)
if [[ -z "${HUB_TOKEN}" ]]; then
  echo "Error: DockerHub login did not return a token." >&2
  exit 1
fi
# Ask GitHub Actions to mask the token in subsequent log output.
echo "::add-mask::${HUB_TOKEN}"
export HUB_TOKEN
|
||
# Function to check if a Docker tag exists | ||
#######################################
# Verify that an image tag exists on DockerHub; abort the script otherwise.
# Globals:
#   org        (read) DockerHub organization that owns the repository
#   HUB_TOKEN  (read) JWT sent in the Authorization header
# Arguments:
#   $1 - repository name, without the organization prefix
#   $2 - tag to look up
# Outputs:
#   Writes an error message to stderr when the lookup does not return HTTP 200.
# Returns:
#   0 when the tags endpoint answers 200; otherwise exits the shell with 1.
#######################################
check_tag_exists() {
  local repo="$1"
  local tag="$2"
  local http_status
  # `|| true`: a curl transport failure must reach the explicit error below
  # instead of terminating the script silently under `set -e`.
  http_status=$(curl -s -o /dev/null -w "%{http_code}" -H "Authorization: JWT $HUB_TOKEN" \
    "https://hub.docker.com/v2/repositories/${org}/${repo}/tags/${tag}/") || true

  # String comparison: an empty or non-numeric status would make `[ ... -ne ]`
  # error out, which an `if` treats as false and would let the check pass.
  if [[ "${http_status}" != "200" ]]; then
    echo "Error: Required image tag ${repo}:${tag} does not exist. This implies that the image was not built successfully in the build job." >&2
    exit 1
  fi
}
|
||
export org="rapidsai" |
Oops, something went wrong.