-
Notifications
You must be signed in to change notification settings - Fork 532
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
1 changed file
with
146 additions
and
28 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -9,7 +9,60 @@ concurrency: | |
group: ${{ github.workflow }}-${{ github.ref }} | ||
cancel-in-progress: true | ||
|
||
# Workflow-level environment: OpenTelemetry (OTEL_*) exporter settings used by the jobs below. | ||
env: | ||
# Service name for this workflow's telemetry; telemetry-setup re-exports it as `service_name`. | ||
# TODO: put this in a shared org-wide secret? | ||
OTEL_SERVICE_NAME: 'pr-cuml' | ||
# OTLP endpoint; telemetry-setup re-exports it as `endpoint`. | ||
# TODO: this should be set as an org-wide variable | ||
OTEL_EXPORTER_OTLP_ENDPOINT: https://tempo.gha-runners.nvidia.com:4318 | ||
# Paths of the mTLS certificate/key files. The files do not exist until a step writes | ||
# the corresponding GitHub secrets to them explicitly. | ||
# These variables tell the OpenTelemetry tools where to find the files; the | ||
# "Write certificate files for mTLS" steps also reuse them as the write destinations. | ||
OTEL_EXPORTER_OTLP_CERTIFICATE: "/tmp/certs/ca.crt" | ||
OTEL_EXPORTER_OTLP_CLIENT_CERTIFICATE: "/tmp/certs/client.crt" | ||
OTEL_EXPORTER_OTLP_CLIENT_KEY: "/tmp/certs/client.key" | ||
OTEL_EXPORTER_OTLP_PROTOCOL: "http/protobuf" | ||
# Exporter headers come from a repository/organization secret. | ||
OTEL_EXPORTER_OTLP_HEADERS: ${{ secrets.OTEL_EXPORTER_OTLP_HEADERS }} | ||
|
||
jobs: | ||
# telemetry-setup: records the workflow start time, re-exports the OTel endpoint and service | ||
# name, writes the mTLS certificate files, obtains a traceparent and starts the root span. | ||
# Its outputs (start_time, traceparent, endpoint, top_level_service_name) are read by later jobs. | ||
telemetry-setup: | ||
runs-on: ubuntu-latest | ||
outputs: | ||
start_time: ${{ steps.timestamp.outputs.START_TIME }} | ||
traceparent: ${{ steps.telemetry-setup.outputs.traceparent }} | ||
endpoint: ${{ steps.var-reexports.outputs.endpoint }} | ||
top_level_service_name: ${{ steps.var-reexports.outputs.service_name }} | ||
steps: | ||
# Seconds since the epoch with nanosecond fraction, published as the START_TIME step output. | ||
- name: Get starting timestamp | ||
id: timestamp | ||
run: | | ||
echo "START_TIME=$(date +%s.%N)" >> "${GITHUB_OUTPUT}" | ||
# Workflow-level env values are republished as step outputs so they can become job outputs. | ||
- name: Echo endpoint to make it available to shared workflows | ||
id: var-reexports | ||
run: | | ||
echo "endpoint=${OTEL_EXPORTER_OTLP_ENDPOINT}" >> "${GITHUB_OUTPUT}" | ||
echo "service_name=${OTEL_SERVICE_NAME}" >> "${GITHUB_OUTPUT}" | ||
# The secrets are substituted into the script text by Actions before the shell runs. | ||
# The heredoc delimiters are quoted ('EOF') so the shell writes that text verbatim | ||
# instead of expanding any `$` or backtick sequences it may contain. | ||
- name: Write certificate files for mTLS | ||
run: | | ||
mkdir -p /tmp/certs | ||
cat << 'EOF' > "${OTEL_EXPORTER_OTLP_CERTIFICATE}" | ||
${{ secrets.OTEL_EXPORTER_OTLP_CA_CERTIFICATE }} | ||
EOF | ||
cat << 'EOF' > "${OTEL_EXPORTER_OTLP_CLIENT_CERTIFICATE}" | ||
${{ secrets.OTEL_EXPORTER_OTLP_CLIENT_CERTIFICATE }} | ||
EOF | ||
cat << 'EOF' > "${OTEL_EXPORTER_OTLP_CLIENT_KEY}" | ||
${{ secrets.OTEL_EXPORTER_OTLP_CLIENT_KEY }} | ||
EOF | ||
- name: Telemetry setup | ||
id: telemetry-setup | ||
uses: rapidsai/shared-actions/telemetry-traceparent@add-telemetry | ||
# The root span starts at the timestamp captured by the first step of this job. | ||
- name: Start root span | ||
uses: rapidsai/shared-actions/telemetry-create-span@add-telemetry | ||
with: | ||
name: "root span" | ||
traceparent: ${{ steps.telemetry-setup.outputs.traceparent }} | ||
start_time: ${{ steps.timestamp.outputs.START_TIME }} | ||
pr-builder: | ||
needs: | ||
- changed-files | ||
|
@@ -27,13 +80,14 @@ jobs: | |
- wheel-tests-cuml | ||
- devcontainer | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/pr-builder.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/pr-builder.yaml@add-telemetry | ||
if: always() | ||
with: | ||
needs: ${{ toJSON(needs) }} | ||
changed-files: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/changed-files.yaml@branch-24.12 | ||
needs: telemetry-setup | ||
uses: rapidsai/shared-workflows/.github/workflows/changed-files.yaml@add-telemetry | ||
with: | ||
files_yaml: | | ||
test_cpp: | ||
|
@@ -66,120 +120,184 @@ jobs: | |
- '!thirdparty/LICENSES/**' | ||
# checks: calls the shared checks workflow. The two `uses:` rows appear to be the before | ||
# (branch-24.12) and after (add-telemetry) sides of the diff; the change also adds | ||
# telemetry-setup as a dependency and passes its outputs as telemetry inputs. | ||
checks: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/checks.yaml@branch-24.12 | ||
needs: telemetry-setup | ||
uses: rapidsai/shared-workflows/.github/workflows/checks.yaml@add-telemetry | ||
with: | ||
enable_check_generated_files: false | ||
# Entries must match job ids exactly: the span-closing job in this workflow is | ||
# `final_span_update` (underscores), so it is listed with that spelling. | ||
ignored_pr_jobs: >- | ||
optional-job-conda-python-tests-cudf-pandas-integration | ||
final_span_update | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# clang-tidy: runs ci/run_clang_tidy.sh through the shared custom-job workflow. | ||
# The paired `needs:` / `uses:` rows appear to be the before and after sides of the diff: | ||
# the change adds telemetry-setup as a dependency and switches the ref to add-telemetry. | ||
clang-tidy: | ||
needs: checks | ||
needs: [checks, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@add-telemetry | ||
with: | ||
build_type: pull-request | ||
node_type: "cpu8" | ||
arch: "amd64" | ||
container_image: "rapidsai/ci-conda:cuda11.8.0-ubuntu22.04-py3.10" | ||
run_script: "ci/run_clang_tidy.sh" | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-cpp-build: calls the shared conda-cpp-build workflow after `checks`. | ||
# The paired `needs:` / `uses:` rows appear to be the before and after sides of the diff. | ||
conda-cpp-build: | ||
needs: checks | ||
needs: [checks, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-build.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-build.yaml@add-telemetry | ||
with: | ||
build_type: pull-request | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-cpp-tests: calls the shared conda-cpp-tests workflow after conda-cpp-build. | ||
# The paired `needs:` / `uses:` rows appear to be the before and after sides of the diff. | ||
conda-cpp-tests: | ||
needs: [conda-cpp-build, changed-files] | ||
needs: [conda-cpp-build, changed-files, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-tests.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-tests.yaml@add-telemetry | ||
# Runs only when the changed-files job reports the `test_cpp` file group as true. | ||
if: fromJSON(needs.changed-files.outputs.changed_file_groups).test_cpp | ||
with: | ||
build_type: pull-request | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-cpp-checks: calls the shared conda-cpp-post-build-checks workflow after conda-cpp-build. | ||
# The paired `needs:` / `uses:` rows appear to be the before and after sides of the diff. | ||
conda-cpp-checks: | ||
needs: conda-cpp-build | ||
needs: [conda-cpp-build, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-post-build-checks.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-cpp-post-build-checks.yaml@add-telemetry | ||
with: | ||
build_type: pull-request | ||
# Symbol checking is enabled, with `raft_cutlass` passed as the exclusion. | ||
enable_check_symbols: true | ||
symbol_exclusions: raft_cutlass | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-python-build: calls the shared conda-python-build workflow after conda-cpp-build. | ||
# The paired `needs:` / `uses:` rows appear to be the before and after sides of the diff. | ||
conda-python-build: | ||
needs: conda-cpp-build | ||
needs: [conda-cpp-build, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-build.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-build.yaml@add-telemetry | ||
with: | ||
build_type: pull-request | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-python-tests-singlegpu: runs ci/test_python_singlegpu.sh through the shared | ||
# conda-python-tests workflow. The paired `needs:` / `uses:` rows appear to be the | ||
# before and after sides of the diff. | ||
conda-python-tests-singlegpu: | ||
needs: [conda-python-build, changed-files] | ||
needs: [conda-python-build, changed-files, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@add-telemetry | ||
# Runs only when the changed-files job reports the `test_python` file group as true. | ||
if: fromJSON(needs.changed-files.outputs.changed_file_groups).test_python | ||
with: | ||
build_type: pull-request | ||
script: "ci/test_python_singlegpu.sh" | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# optional-job-conda-python-tests-cudf-pandas-integration: runs ci/test_python_integration.sh | ||
# through the shared conda-python-tests workflow. This job id is also listed in the | ||
# `ignored_pr_jobs` input of the `checks` job. The paired `needs:` / `uses:` rows appear | ||
# to be the before and after sides of the diff. | ||
optional-job-conda-python-tests-cudf-pandas-integration: | ||
needs: [conda-python-build, changed-files] | ||
needs: [conda-python-build, changed-files, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@add-telemetry | ||
# Runs only when the changed-files job reports the `test_python` file group as true. | ||
if: fromJSON(needs.changed-files.outputs.changed_file_groups).test_python | ||
with: | ||
# Filter expression that keeps only matrix entries whose ARCH is "amd64". | ||
matrix_filter: map(select(.ARCH == "amd64")) | ||
build_type: pull-request | ||
script: "ci/test_python_integration.sh" | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-python-tests-dask: runs ci/test_python_dask.sh through the shared conda-python-tests | ||
# workflow. The paired `needs:` / `uses:` rows appear to be the before and after sides | ||
# of the diff. | ||
conda-python-tests-dask: | ||
needs: [conda-python-build, changed-files] | ||
needs: [conda-python-build, changed-files, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/conda-python-tests.yaml@add-telemetry | ||
# Runs only when the changed-files job reports the `test_python` file group as true. | ||
if: fromJSON(needs.changed-files.outputs.changed_file_groups).test_python | ||
with: | ||
build_type: pull-request | ||
script: "ci/test_python_dask.sh" | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# conda-notebook-tests: runs ci/test_notebooks.sh through the shared custom-job workflow. | ||
# The paired `needs:` / `uses:` rows appear to be the before and after sides of the diff. | ||
conda-notebook-tests: | ||
needs: [conda-python-build, changed-files] | ||
needs: [conda-python-build, changed-files, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@add-telemetry | ||
# Runs only when the changed-files job reports the `test_notebooks` file group as true. | ||
if: fromJSON(needs.changed-files.outputs.changed_file_groups).test_notebooks | ||
with: | ||
build_type: pull-request | ||
node_type: "gpu-v100-latest-1" | ||
arch: "amd64" | ||
container_image: "rapidsai/ci-conda:latest" | ||
run_script: "ci/test_notebooks.sh" | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# docs-build: runs ci/build_docs.sh through the shared custom-job workflow after | ||
# conda-python-build. The paired `needs:` / `uses:` rows appear to be the before and | ||
# after sides of the diff. | ||
docs-build: | ||
needs: conda-python-build | ||
needs: [conda-python-build, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/custom-job.yaml@add-telemetry | ||
with: | ||
build_type: pull-request | ||
node_type: "gpu-v100-latest-1" | ||
arch: "amd64" | ||
container_image: "rapidsai/ci-conda:latest" | ||
run_script: "ci/build_docs.sh" | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# wheel-build-cuml: runs ci/build_wheel.sh through the shared wheels-build workflow after | ||
# `checks`. The paired `needs:` / `uses:` rows appear to be the before and after sides | ||
# of the diff. | ||
wheel-build-cuml: | ||
needs: checks | ||
needs: [checks, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/wheels-build.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/wheels-build.yaml@add-telemetry | ||
with: | ||
build_type: pull-request | ||
script: ci/build_wheel.sh | ||
# Extra repository inputs: rapidsai/cumlprims_mg at branch-24.12. The deploy-key value | ||
# is the name of a secret, not key material. | ||
extra-repo: rapidsai/cumlprims_mg | ||
extra-repo-sha: branch-24.12 | ||
extra-repo-deploy-key: CUMLPRIMS_SSH_PRIVATE_DEPLOY_KEY | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# wheel-tests-cuml: runs ci/test_wheel.sh through the shared wheels-test workflow after | ||
# wheel-build-cuml. The paired `needs:` / `uses:` rows appear to be the before and after | ||
# sides of the diff. | ||
wheel-tests-cuml: | ||
needs: [wheel-build-cuml, changed-files] | ||
needs: [wheel-build-cuml, changed-files, telemetry-setup] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/wheels-test.yaml@branch-24.12 | ||
uses: rapidsai/shared-workflows/.github/workflows/wheels-test.yaml@add-telemetry | ||
# Runs only when the changed-files job reports the `test_python` file group as true. | ||
if: fromJSON(needs.changed-files.outputs.changed_file_groups).test_python | ||
with: | ||
build_type: pull-request | ||
script: ci/test_wheel.sh | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# devcontainer: calls the shared build-in-devcontainer workflow for amd64 / CUDA 12.5. | ||
# The two `uses:` rows appear to be the before (branch-24.12) and after (add-telemetry) | ||
# sides of the diff; the change also adds telemetry-setup as a dependency. | ||
devcontainer: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/build-in-devcontainer.yaml@branch-24.12 | ||
needs: telemetry-setup | ||
uses: rapidsai/shared-workflows/.github/workflows/build-in-devcontainer.yaml@add-telemetry | ||
with: | ||
# arch and cuda are JSON-encoded lists passed as strings. | ||
arch: '["amd64"]' | ||
cuda: '["12.5"]' | ||
extra-repo-deploy-key: CUMLPRIMS_SSH_PRIVATE_DEPLOY_KEY | ||
# Telemetry inputs taken from the telemetry-setup job's outputs. | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{ needs.telemetry-setup.outputs.traceparent }} | ||
# The build is bracketed by `sccache -z` before and `sccache -s` after `build-all`. | ||
build_command: | | ||
sccache -z; | ||
build-all --verbose; | ||
sccache -s; | ||
# final_span_update: after pr-builder finishes, records the end time and re-sends the root | ||
# span with the start time captured by telemetry-setup and the end time captured here. | ||
final_span_update: | ||
runs-on: ubuntu-latest | ||
needs: [pr-builder, telemetry-setup] | ||
# Job-level condition. Without it the job is skipped whenever pr-builder fails, and the | ||
# step-level `if: always()` below never gets a chance to run on failing PRs. | ||
if: always() | ||
steps: | ||
# Seconds since the epoch with nanosecond fraction, published as the FINAL_TIME step output. | ||
- name: Get final timestamp | ||
id: timestamp | ||
run: | | ||
echo "FINAL_TIME=$(date +%s.%N)" >> "${GITHUB_OUTPUT}" | ||
# Main purpose of this traceparent step is to ensure that otel-cli is installed. | ||
- name: Get job traceparent | ||
uses: rapidsai/shared-actions/telemetry-traceparent@add-telemetry | ||
# Each job starts without the certificate files, so they are written again here. | ||
# The heredoc delimiters are quoted ('EOF') so the shell writes the substituted secret | ||
# text verbatim; redirect targets are quoted to match the telemetry-setup job. | ||
- name: Write certificate files for mTLS | ||
run: | | ||
mkdir -p /tmp/certs | ||
cat << 'EOF' > "${OTEL_EXPORTER_OTLP_CERTIFICATE}" | ||
${{ secrets.OTEL_EXPORTER_OTLP_CA_CERTIFICATE }} | ||
EOF | ||
cat << 'EOF' > "${OTEL_EXPORTER_OTLP_CLIENT_CERTIFICATE}" | ||
${{ secrets.OTEL_EXPORTER_OTLP_CLIENT_CERTIFICATE }} | ||
EOF | ||
cat << 'EOF' > "${OTEL_EXPORTER_OTLP_CLIENT_KEY}" | ||
${{ secrets.OTEL_EXPORTER_OTLP_CLIENT_KEY }} | ||
EOF | ||
# Runs even if an earlier step in this job failed. | ||
- name: Update root span with final completion time | ||
if: always() | ||
uses: rapidsai/shared-actions/telemetry-create-span@add-telemetry | ||
with: | ||
service: ${{needs.telemetry-setup.outputs.top_level_service_name}} | ||
name: "end-of-job update" | ||
default_endpoint: "${{needs.telemetry-setup.outputs.endpoint}}" | ||
traceparent: ${{needs.telemetry-setup.outputs.traceparent}} | ||
start_time: ${{needs.telemetry-setup.outputs.start_time}} | ||
end_time: ${{steps.timestamp.outputs.FINAL_TIME}} | ||