This repository has been archived by the owner on Jul 23, 2024. It is now read-only.
[Task Submission] ICL consistency test (icl_consistency_test
)
#100
Workflow file for this run
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Adapted from https://github.com/huggingface/evaluate/blob/main/.github/workflows/ci.yml | |
name: CI | |
on: | |
pull_request: | |
types: | |
- labeled | |
branches: | |
- main | |
jobs: | |
check_code_quality: | |
if: github.event.label.name == 'task-submission' | |
runs-on: ubuntu-latest | |
steps: | |
- uses: actions/checkout@v3 | |
- name: Set up Python | |
uses: actions/setup-python@v4 | |
with: | |
python-version: "3.9" | |
cache: 'pip' | |
cache-dependency-path: setup.py | |
- name: Install dependencies | |
run: | | |
python -m pip install --upgrade pip | |
pip install .[quality] | |
- name: Check quality | |
run: | | |
make check-quality | |
test_genbench_impl: | |
needs: check_code_quality | |
runs-on: ubuntu-latest | |
steps: | |
- uses: actions/checkout@v3 | |
with: | |
fetch-depth: 0 | |
- name: Set up Python 3.9 | |
uses: actions/setup-python@v4 | |
with: | |
python-version: "3.9" | |
cache: 'pip' | |
cache-dependency-path: setup.py | |
- name: Upgrade pip | |
run: python -m pip install --upgrade pip | |
- name: Install dependencies | |
run: | | |
pip install .[tests] | |
- name: Test with pytest | |
run: | | |
pytest -xrpP tests/ --ignore=./tests/test_task.py | |
test_task: | |
needs: test_genbench_impl | |
runs-on: ubuntu-latest | |
steps: | |
# Pattern: '[Task Submission] Task Name (`task_id`) with optional description' | |
# Fail if the PR title does not match the pattern | |
- name: Parse the Task ID from PR's title | |
id: pr_task_id | |
run: | | |
task_id=$(echo '${{ github.event.pull_request.title }}' | sed -n -e 's/^\[Task Submission\][[:alnum:][:space:]()_-]\+[[:space:]]*(`\([^`]*\)`)[[:space:]]*.*/\1/p') | |
echo "Task ID: $task_id" | |
echo "task_id=$task_id" >> $GITHUB_OUTPUT | |
shell: bash | |
- name: Check if the Task ID is valid | |
id: check_task_id | |
run: | | |
if [[ -z "${{ steps.pr_task_id.outputs.task_id }}" ]]; then | |
echo "Could not parse the Task ID from the PR title." | |
exit 1 | |
fi | |
shell: bash | |
- uses: actions/checkout@v3 | |
with: | |
fetch-depth: 0 | |
- name: Detect New Task ID | |
id: task_id | |
# Get the most recent modified task directory and extract the task ID | |
run: | | |
task_id=$(ls -td src/genbench/tasks/*/ | head -n 1 | cut -d'/' -f4) | |
echo "Task ID: $task_id" | |
echo "task_id=$task_id" >> $GITHUB_OUTPUT | |
- name: Check if PR task ID matches | |
id: check_pr_task_id | |
run: | | |
if [[ "${{ steps.pr_task_id.outputs.task_id }}" != "${{ steps.task_id.outputs.task_id }}" ]]; then | |
echo "Task ID in PR title does not match the most recent task ID." | |
echo "PR Task ID: ${{ steps.pr_task_id.outputs.task_id }}" | |
echo "Most Recent Task ID: ${{ steps.task_id.outputs.task_id }}" | |
echo "Continuing with the PR Task ID..." | |
fi | |
- name: Set up Python 3.9 | |
uses: actions/setup-python@v4 | |
with: | |
python-version: "3.9" | |
cache: 'pip' | |
cache-dependency-path: setup.py | |
- name: Upgrade pip | |
run: python -m pip install --upgrade pip | |
- name: Install dependencies | |
run: | | |
pip install .[tests] | |
- name: Test Task | |
run: | | |
genbench-cli test-task -i ${{ steps.pr_task_id.outputs.task_id }} --tests-dir ./tests |