From bc0e31548e61f678bcbf1bc9e44bbb6d23163b1b Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 13:34:53 -0700 Subject: [PATCH 01/52] Create validate_docker_image.yml Add a file to print a statement. --- .github/workflows/validate_docker_image.yml | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 .github/workflows/validate_docker_image.yml diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml new file mode 100644 index 000000000..999318980 --- /dev/null +++ b/.github/workflows/validate_docker_image.yml @@ -0,0 +1,3 @@ +steps: + - name: Validate docker image + run: echo "Validating docker image." From 51944423ae9c837f913f904a6694e7755d2813f2 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 13:39:44 -0700 Subject: [PATCH 02/52] Update validate_docker_image.yml --- .github/workflows/validate_docker_image.yml | 17 ++++++++++++++--- 1 file changed, 14 insertions(+), 3 deletions(-) diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml index 999318980..6fa6e3ad8 100644 --- a/.github/workflows/validate_docker_image.yml +++ b/.github/workflows/validate_docker_image.yml @@ -1,3 +1,14 @@ -steps: - - name: Validate docker image - run: echo "Validating docker image." +name: Validate docker image + +on: + push: + branches: + - '*' +jobs: + build: + runs-on: ubuntu-latest + + steps: + - name: print a statement + run: echo "Validating docker image." + From 8c775c024924d70eb9925ad293e1eb409cedff06 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 13:48:08 -0700 Subject: [PATCH 03/52] Update validate_docker_image.yml --- .github/workflows/validate_docker_image.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml index 6fa6e3ad8..ca03317ba 100644 --- a/.github/workflows/validate_docker_image.yml +++ b/.github/workflows/validate_docker_image.yml @@ -1,7 +1,7 @@ name: Validate docker image on: - push: + pull_request: branches: - '*' jobs: From 32911b3a9c7f302d8f798fd219cb820d392114f9 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 13:57:46 -0700 Subject: [PATCH 04/52] Add docker pull command --- .github/workflows/validate_docker_image.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml index ca03317ba..cf98eea84 100644 --- a/.github/workflows/validate_docker_image.yml +++ b/.github/workflows/validate_docker_image.yml @@ -11,4 +11,5 @@ jobs: steps: - name: print a statement run: echo "Validating docker image." - + - name: Pull Docker image + run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel From e630f17dfb69410da573c8bb0e83821c910854db Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 13:59:21 -0700 Subject: [PATCH 05/52] Update validate_docker_image.yml --- .github/workflows/validate_docker_image.yml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml index cf98eea84..48d2e897b 100644 --- a/.github/workflows/validate_docker_image.yml +++ b/.github/workflows/validate_docker_image.yml @@ -13,3 +13,5 @@ jobs: run: echo "Validating docker image." - name: Pull Docker image run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + - name: print a statement + run: echo "Done pulling docker image." From 8645bc7a46ee90e47b900a7a631ca9b0f18c6d91 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 14:04:07 -0700 Subject: [PATCH 06/52] Update validate_docker_image.yml --- .github/workflows/validate_docker_image.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml index 48d2e897b..3d7a6376f 100644 --- a/.github/workflows/validate_docker_image.yml +++ b/.github/workflows/validate_docker_image.yml @@ -1,7 +1,7 @@ name: Validate docker image on: - pull_request: + push: branches: - '*' jobs: From 674ea86064a79f5765088877e37672980d0e11e4 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:29:26 -0700 Subject: [PATCH 07/52] Add more steps in validate_docker_images.yml --- .github/workflows/validate_docker_image.yml | 17 ---------------- .github/workflows/validate_docker_images.yml | 21 ++++++++++++++++++++ 2 files changed, 21 insertions(+), 17 deletions(-) delete mode 100644 .github/workflows/validate_docker_image.yml create mode 100644 .github/workflows/validate_docker_images.yml diff --git a/.github/workflows/validate_docker_image.yml b/.github/workflows/validate_docker_image.yml deleted file mode 100644 index 3d7a6376f..000000000 --- a/.github/workflows/validate_docker_image.yml +++ /dev/null @@ -1,17 +0,0 @@ -name: Validate docker image - -on: - push: - branches: - - '*' -jobs: - build: - runs-on: ubuntu-latest - - steps: - - name: print a statement - run: echo "Validating docker image." - - name: Pull Docker image - run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - - name: print a statement - run: echo "Done pulling docker image." diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml new file mode 100644 index 000000000..6d9938d35 --- /dev/null +++ b/.github/workflows/validate_docker_images.yml @@ -0,0 +1,21 @@ +name: Validate docker images + +on: + push: + branches: + - '*' +jobs: + build: + runs-on: ubuntu-latest + + steps: + - name: Print a statement + run: echo "Validating docker images." + - name: Pull Docker image + run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + - name: Print a statement + run: echo "Done pulling docker image." + - name: Checkout the branch + uses: pytorch/builder/test/smoke_test/smoke_test.py@main + - name: Run smoke tests + run: python pytorch/builder/test/smoke_test/smoke_test.py --package torch_only --runtime-error-check enabled From ab428ce587b44f57a302b0c5ce48b56c5502b923 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:30:21 -0700 Subject: [PATCH 08/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 6d9938d35..a3a3befb3 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -18,4 +18,4 @@ jobs: - name: Checkout the branch uses: pytorch/builder/test/smoke_test/smoke_test.py@main - name: Run smoke tests - run: python pytorch/builder/test/smoke_test/smoke_test.py --package torch_only --runtime-error-check enabled + run: python -c "import torch;print(torch.__version__)" From e7065ce805e42d2058421b631c01ffc9eeee9041 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:31:41 -0700 Subject: [PATCH 09/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index a3a3befb3..50985fdcf 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -17,5 +17,4 @@ jobs: run: echo "Done pulling docker image." - name: Checkout the branch uses: pytorch/builder/test/smoke_test/smoke_test.py@main - - name: Run smoke tests - run: python -c "import torch;print(torch.__version__)" + From 671db734b12055477bd95c9b90c5ad9299286f42 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:32:39 -0700 Subject: [PATCH 10/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 50985fdcf..05a25a5ea 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -16,5 +16,7 @@ jobs: - name: Print a statement run: echo "Done pulling docker image." - name: Checkout the branch - uses: pytorch/builder/test/smoke_test/smoke_test.py@main + uses: pytorch/builder@main + - name: Run smoke tests + run: python -c "import torch;print(torch.__version__)" From 87b8ecdacf68d1d99a95a4d84b0b4302c0dfe629 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:34:26 -0700 Subject: [PATCH 11/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 05a25a5ea..e3df69cf6 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -15,8 +15,8 @@ jobs: run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Print a statement run: echo "Done pulling docker image." - - name: Checkout the branch - uses: pytorch/builder@main + - name: Checkout PyTorch builder + uses: actions/checkout@v3 - name: Run smoke tests run: python -c "import torch;print(torch.__version__)" From e52e864311fdd44adfba1563325d16e16f05e78d Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:34:37 -0700 Subject: [PATCH 12/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index e3df69cf6..ec78ef99e 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -16,7 +16,7 @@ jobs: - name: Print a statement run: echo "Done pulling docker image." - name: Checkout PyTorch builder - uses: actions/checkout@v3 + uses: actions/checkout@v3 - name: Run smoke tests run: python -c "import torch;print(torch.__version__)" From a65f44c2a7ed26d2037eef00e31ef9e64be7b33c Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:40:07 -0700 Subject: [PATCH 13/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index ec78ef99e..13aa2fa7a 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -10,13 +10,13 @@ jobs: steps: - name: Print a statement - run: echo "Validating docker images." + run: echo "Validating docker images." - name: Pull Docker image - run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Print a statement - run: echo "Done pulling docker image." + run: echo "Done pulling docker image." - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests - run: python -c "import torch;print(torch.__version__)" + run: python -c "import math; print(math.sqrt(16))" From 5f7828660244a651fe008fc23f6abede6c2fedd5 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:45:28 -0700 Subject: [PATCH 14/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 13aa2fa7a..7ff0c9400 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -18,5 +18,5 @@ jobs: - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests - run: python -c "import math; print(math.sqrt(16))" + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 37fea378fce5b2306b2fa808a77d3d2b4c99be54 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:50:25 -0700 Subject: [PATCH 15/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 7ff0c9400..bb0d56e3c 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -15,6 +15,8 @@ jobs: run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Print a statement run: echo "Done pulling docker image." + - name: Install Torch + run: conda install -c pytorch pytorch - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests From d928903527b4071d21f19569375bf2664c515013 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 15:55:34 -0700 Subject: [PATCH 16/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 -- 1 file changed, 2 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index bb0d56e3c..7ff0c9400 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -15,8 +15,6 @@ jobs: run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Print a statement run: echo "Done pulling docker image." - - name: Install Torch - run: conda install -c pytorch pytorch - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests From 6b9e1934fea1ace7da7b084f57a0453a41597f07 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 16:03:38 -0700 Subject: [PATCH 17/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 7ff0c9400..0af60226d 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -18,5 +18,6 @@ jobs: - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests - run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + run: docker run -it ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel python -c "import torch; print(torch.__version__)" + From 91a25855a00292d376c4bb5fc5ed562e84f06d23 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 16:08:02 -0700 Subject: [PATCH 18/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 0af60226d..06d11f533 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -18,6 +18,6 @@ jobs: - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests - run: docker run -it ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel python -c "import torch; print(torch.__version__)" + run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel python -c "import torch; print(torch.__version__)" From 521cdadf7af2b80f85a212af011621d4210cd4f3 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 16:14:26 -0700 Subject: [PATCH 19/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 06d11f533..38e59be28 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -13,11 +13,11 @@ jobs: run: echo "Validating docker images." - name: Pull Docker image run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - - name: Print a statement - run: echo "Done pulling docker image." + - name: Run docker image + run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Checkout PyTorch builder uses: actions/checkout@v3 - name: Run smoke tests - run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel python -c "import torch; print(torch.__version__)" + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 1f7de120c5ed6522a4788380d908b94767be38be Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 16:22:31 -0700 Subject: [PATCH 20/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 12 ++++-------- 1 file changed, 4 insertions(+), 8 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 38e59be28..d8d41acc8 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -11,13 +11,9 @@ jobs: steps: - name: Print a statement run: echo "Validating docker images." - - name: Pull Docker image - run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - - name: Run docker image - run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Checkout PyTorch builder uses: actions/checkout@v3 - - name: Run smoke tests - run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled - - + - name: Pull Docker image + run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + - name: Run docker image and run smoke tests + run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From eea99f1bea28f93b553a56dd2c38ea4cbb0dc8e1 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 18:13:32 -0700 Subject: [PATCH 21/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index d8d41acc8..631ebb0b4 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -16,4 +16,4 @@ jobs: - name: Pull Docker image run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - name: Run docker image and run smoke tests - run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel From 31229e96ad988fff6f944c685fcc4ff2e4b0f713 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 18:36:48 -0700 Subject: [PATCH 22/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 631ebb0b4..a7e317fc1 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -11,9 +11,11 @@ jobs: steps: - name: Print a statement run: echo "Validating docker images." - - name: Checkout PyTorch builder - uses: actions/checkout@v3 - name: Pull Docker image run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - - name: Run docker image and run smoke tests + - name: Run docker image run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + - name: Checkout PyTorch builder + uses: actions/checkout@v3 + - name: Run smoke tests + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 6a5f1b5fd8743b23a8c43502e4ef226ee4d3251c Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 18:46:40 -0700 Subject: [PATCH 23/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 33 ++++++++++++-------- 1 file changed, 20 insertions(+), 13 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index a7e317fc1..fb59e667e 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -5,17 +5,24 @@ on: branches: - '*' jobs: - build: - runs-on: ubuntu-latest - + run_tests: + runs-on: ubuntu-latest + container: ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel steps: - - name: Print a statement - run: echo "Validating docker images." - - name: Pull Docker image - run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - - name: Run docker image - run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - - name: Checkout PyTorch builder - uses: actions/checkout@v3 - - name: Run smoke tests - run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + - uses: actions/checkout@v3 + - name: Run tests + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + + # steps: + # - name: Print a statement + # run: echo "Validating docker images." + # - name: Pull Docker image + # run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + # - name: Run docker image + # run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + # - name: Checkout PyTorch builder + # uses: actions/checkout@v3 + # - name: Run smoke tests + # run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + + From 712dbc16cb862efe46b74b6a6f71c7375bbc9123 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Thu, 4 Apr 2024 18:53:33 -0700 Subject: [PATCH 24/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 14 +------------- 1 file changed, 1 insertion(+), 13 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index fb59e667e..78ed84e45 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -10,19 +10,7 @@ jobs: container: ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel steps: - uses: actions/checkout@v3 - - name: Run tests + - name: Run smoke tests run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled - - # steps: - # - name: Print a statement - # run: echo "Validating docker images." - # - name: Pull Docker image - # run: docker pull ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - # - name: Run docker image - # run: docker run ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel - # - name: Checkout PyTorch builder - # uses: actions/checkout@v3 - # - name: Run smoke tests - # run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 3ecd72b78afe17613092b8382153141dd7077a9d Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Sat, 6 Apr 2024 13:09:09 -0700 Subject: [PATCH 25/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 38 +++++++++++++++----- 1 file changed, 30 insertions(+), 8 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 78ed84e45..16fad0807 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -1,16 +1,38 @@ -name: Validate docker images +name: Validate Docker Images (with Matrix Generation) on: + workflow_dispatch: + inputs: + channel: + description: 'PyTorch channel to use (nightly, test, release, all)' + required: true + type: choice + default: 'all' + options: + - 'nightly' + - 'test' + - 'release' + - 'all' push: branches: - '*' + jobs: - run_tests: - runs-on: ubuntu-latest - container: ghcr.io/pytorch/pytorch:2.2.2-cuda11.8-cudnn8-devel + generate-matrix: + uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main + with: + channel: ${{ inputs.channel }} + secrets: inherit + + run-tests: + needs: generate-matrix + runs-on: ubuntu-latest + strategy: + matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} + container: + image: ghcr.io/pytorch/pytorch:${{ matrix.cuda_full_version }}-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + platform: ${{ matrix.platform }} steps: - - uses: actions/checkout@v3 + - uses: actions/checkout@v3 - name: Run smoke tests - run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled - - + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 4e7bbc7f4f81093e80fc12a53b31603d543b9657 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Sat, 6 Apr 2024 13:10:51 -0700 Subject: [PATCH 26/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 16fad0807..7368a9939 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -31,7 +31,6 @@ jobs: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} container: image: ghcr.io/pytorch/pytorch:${{ matrix.cuda_full_version }}-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - platform: ${{ matrix.platform }} steps: - uses: actions/checkout@v3 - name: Run smoke tests From 2dcff31a59d24bc77eeed1ae3e7ee585ab470859 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Sat, 6 Apr 2024 13:15:18 -0700 Subject: [PATCH 27/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 7368a9939..cfbbc338f 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -30,7 +30,7 @@ jobs: strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} container: - image: ghcr.io/pytorch/pytorch:${{ matrix.cuda_full_version }}-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} steps: - uses: actions/checkout@v3 - name: Run smoke tests From e32a8033c0c9c09de3eb89323e6cd16624650dcc Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Sat, 6 Apr 2024 13:20:03 -0700 Subject: [PATCH 28/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index cfbbc338f..3013e3acc 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -32,6 +32,8 @@ jobs: container: image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} steps: - - uses: actions/checkout@v3 + - uses: actions/setup-python@v4 + with: + python-version: '3.10' - name: Run smoke tests run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From d02f074a83e9e182c8d61461a5fbcabdb750c3b6 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Sat, 6 Apr 2024 13:23:23 -0700 Subject: [PATCH 29/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 3013e3acc..cfbbc338f 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -32,8 +32,6 @@ jobs: container: image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} steps: - - uses: actions/setup-python@v4 - with: - python-version: '3.10' + - uses: actions/checkout@v3 - name: Run smoke tests run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From a75f640ea6010d542f17cc2c06809b3618d44026 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 10:32:56 -0700 Subject: [PATCH 30/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index cfbbc338f..4190692c5 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -20,13 +20,16 @@ on: jobs: generate-matrix: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main + strategy: + matrix: + runner_type: ["linux.g5.4xlarge.nvidia.gpu"] with: channel: ${{ inputs.channel }} secrets: inherit run-tests: needs: generate-matrix - runs-on: ubuntu-latest + runs-on: ${{ matrix.runner-type }} strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} container: @@ -34,4 +37,7 @@ jobs: steps: - uses: actions/checkout@v3 - name: Run smoke tests - run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + run: | + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From a4d5e8b6c91f10cdad4a5f6bff266b734223e103 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 10:38:09 -0700 Subject: [PATCH 31/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 4190692c5..c6f0896c9 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -20,16 +20,13 @@ on: jobs: generate-matrix: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main - strategy: - matrix: - runner_type: ["linux.g5.4xlarge.nvidia.gpu"] with: channel: ${{ inputs.channel }} secrets: inherit run-tests: needs: generate-matrix - runs-on: ${{ matrix.runner-type }} + runs-on: linux.g5.4xlarge.nvidia.gpu strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} container: From a0763084c6491c13787a900d2adaa00793af0bc9 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 15:57:15 -0700 Subject: [PATCH 32/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 25 ++++++++++++-------- 1 file changed, 15 insertions(+), 10 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index c6f0896c9..1a2651edb 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -26,15 +26,20 @@ jobs: run-tests: needs: generate-matrix - runs-on: linux.g5.4xlarge.nvidia.gpu strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} - container: - image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - steps: - - uses: actions/checkout@v3 - - name: Run smoke tests - run: | - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + fail-fast: false + uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + with: + runner: linux.g5.4xlarge.nvidia.gpu + repository: "pytorch/builder" + ref: ${{ inputs.ref || github.ref }} + job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + binary-matrix: ${{ toJSON(matrix) }} + docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + timeout: 180 + script: | + set -ex + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 041d904fc2690a1787a23e9715b474a170ec5f9e Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:04:40 -0700 Subject: [PATCH 33/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 1a2651edb..4829f3e2a 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -31,7 +31,7 @@ jobs: fail-fast: false uses: pytorch/test-infra/.github/workflows/linux_job.yml@main with: - runner: linux.g5.4xlarge.nvidia.gpu + runner: ubuntu-latest repository: "pytorch/builder" ref: ${{ inputs.ref || github.ref }} job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} From 67a56ac557b9c9b31702fa4fabd55974d4c289c8 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:07:58 -0700 Subject: [PATCH 34/52] Update validate_docker_images.yml From 9ba608803b2d6db914173e7fc7e4fa569a9bf485 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:16:11 -0700 Subject: [PATCH 35/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 30 +++++++++++--------- 1 file changed, 16 insertions(+), 14 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 4829f3e2a..03d172fe1 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -29,17 +29,19 @@ jobs: strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} fail-fast: false - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main - with: - runner: ubuntu-latest - repository: "pytorch/builder" - ref: ${{ inputs.ref || github.ref }} - job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - binary-matrix: ${{ toJSON(matrix) }} - docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - timeout: 180 - script: | - set -ex - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v3 + - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + with: + repository: "pytorch/builder" + ref: ${{ inputs.ref || github.ref }} + job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + binary-matrix: ${{ toJSON(matrix) }} + docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + timeout: 180 + script: | + set -ex + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 010759309d7fe70ab90f686830b55a1c34cd7e1d Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:17:14 -0700 Subject: [PATCH 36/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 03d172fe1..8b9a2723a 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -22,7 +22,7 @@ jobs: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main with: channel: ${{ inputs.channel }} - secrets: inherit + secrets: inherit run-tests: needs: generate-matrix @@ -32,7 +32,7 @@ jobs: runs-on: ubuntu-latest steps: - uses: actions/checkout@v3 - - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main with: repository: "pytorch/builder" ref: ${{ inputs.ref || github.ref }} From b6051921875ddd8a4daa6bc7d0b35de6df31fe69 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:21:00 -0700 Subject: [PATCH 37/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 32 +++++++++----------- 1 file changed, 15 insertions(+), 17 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 8b9a2723a..1a2651edb 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -22,26 +22,24 @@ jobs: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main with: channel: ${{ inputs.channel }} - secrets: inherit + secrets: inherit run-tests: needs: generate-matrix strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} fail-fast: false - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main - with: - repository: "pytorch/builder" - ref: ${{ inputs.ref || github.ref }} - job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - binary-matrix: ${{ toJSON(matrix) }} - docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - timeout: 180 - script: | - set -ex - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + with: + runner: linux.g5.4xlarge.nvidia.gpu + repository: "pytorch/builder" + ref: ${{ inputs.ref || github.ref }} + job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + binary-matrix: ${{ toJSON(matrix) }} + docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + timeout: 180 + script: | + set -ex + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 86c475550a81c38b5c177312ef987b52e75c00bd Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:25:05 -0700 Subject: [PATCH 38/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 30 +++++++++++--------- 1 file changed, 16 insertions(+), 14 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 1a2651edb..79e89b718 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -26,20 +26,22 @@ jobs: run-tests: needs: generate-matrix + runs-on: ubuntu-latest strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} fail-fast: false - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main - with: - runner: linux.g5.4xlarge.nvidia.gpu - repository: "pytorch/builder" - ref: ${{ inputs.ref || github.ref }} - job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - binary-matrix: ${{ toJSON(matrix) }} - docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - timeout: 180 - script: | - set -ex - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + steps: # Existing `linux_job.yml` content will be inlined or used here + - uses: actions/checkout@v3 + - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + with: + repository: "pytorch/builder" + ref: ${{ inputs.ref || github.ref }} + job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + binary-matrix: ${{ toJSON(matrix) }} + docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + timeout: 180 + script: | + set -ex + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 46561c0d4621fc54949233c26cbd29ddfe43d197 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:26:36 -0700 Subject: [PATCH 39/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 35 +++++++++++--------- 1 file changed, 19 insertions(+), 16 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 79e89b718..6fedca2d2 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -22,26 +22,29 @@ jobs: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main with: channel: ${{ inputs.channel }} - secrets: inherit + secrets: inherit run-tests: needs: generate-matrix - runs-on: ubuntu-latest + runs-on: ubuntu-latest strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} fail-fast: false - steps: # Existing `linux_job.yml` content will be inlined or used here + steps: - uses: actions/checkout@v3 - - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main - with: - repository: "pytorch/builder" - ref: ${{ inputs.ref || github.ref }} - job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - binary-matrix: ${{ toJSON(matrix) }} - docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - timeout: 180 - script: | - set -ex - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + + call-reusable-workflow: # New job to call the reusable workflow + needs: run-tests # Ensure the matrix is built first + uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + with: + repository: "pytorch/builder" + ref: ${{ inputs.ref || github.ref }} + job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + binary-matrix: ${{ toJSON(matrix) }} + docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cuda_version }}-${{ matrix.image_type }} + timeout: 180 + script: | + set -ex + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 9cc71adc985d97a0184a7d3e7a8692335fbce8d2 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 16:50:31 -0700 Subject: [PATCH 40/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 28 +++++--------------- 1 file changed, 6 insertions(+), 22 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 6fedca2d2..be4542315 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -1,5 +1,4 @@ name: Validate Docker Images (with Matrix Generation) - on: workflow_dispatch: inputs: @@ -16,35 +15,20 @@ on: push: branches: - '*' - jobs: generate-matrix: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main with: channel: ${{ inputs.channel }} - secrets: inherit - + secrets: inherit run-tests: needs: generate-matrix - runs-on: ubuntu-latest + runs-on: ubuntu-latest strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} - fail-fast: false + container: + image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} steps: - uses: actions/checkout@v3 - - call-reusable-workflow: # New job to call the reusable workflow - needs: run-tests # Ensure the matrix is built first - uses: pytorch/test-infra/.github/workflows/linux_job.yml@main - with: - repository: "pytorch/builder" - ref: ${{ inputs.ref || github.ref }} - job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} - binary-matrix: ${{ toJSON(matrix) }} - docker-image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cuda_version }}-${{ matrix.image_type }} - timeout: 180 - script: | - set -ex - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + - name: Run smoke tests + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From 99d11d0cf11d7675ce1f4830227ba3bb422fdeb0 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 17:18:20 -0700 Subject: [PATCH 41/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index be4542315..47259e5e4 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -31,4 +31,8 @@ jobs: steps: - uses: actions/checkout@v3 - name: Run smoke tests - run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + run: | + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled + From 0a99f1efe929da8ac42735cc783206cf27119b82 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Mon, 8 Apr 2024 17:24:24 -0700 Subject: [PATCH 42/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 47259e5e4..75d10abb8 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -31,8 +31,6 @@ jobs: steps: - uses: actions/checkout@v3 - name: Run smoke tests - run: | - export MATRIX_GPU_ARCH_TYPE="cuda" - export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From a11467f240745b63a87b5c63fc66fe83b9b42cca Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 09:28:57 -0700 Subject: [PATCH 43/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 75d10abb8..5e5befeb5 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -27,7 +27,7 @@ jobs: strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} container: - image: ghcr.io/pytorch/pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + image: ${{ fromJson(needs.generate-matrix.outputs.matrix.docker) }} steps: - uses: actions/checkout@v3 - name: Run smoke tests From 58085f55865d38f8ac1f0322e41051afc927510b Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 10:02:11 -0700 Subject: [PATCH 44/52] Update validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 5e5befeb5..d63545696 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -27,7 +27,7 @@ jobs: strategy: matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} container: - image: ${{ fromJson(needs.generate-matrix.outputs.matrix.docker) }} + image: ${{matrix.docker}} steps: - uses: actions/checkout@v3 - name: Run smoke tests From 42e036a193b5302c21315a16c76e66c3071445aa Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 10:55:35 -0700 Subject: [PATCH 45/52] Remove trigger on pushes to finalize the logic --- .github/workflows/validate_docker_images.yml | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index d63545696..8fdb1a964 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -12,9 +12,7 @@ on: - 'test' - 'release' - 'all' - push: - branches: - - '*' + jobs: generate-matrix: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main From c46f7bed2759a0b7127497528e3b652d79563353 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 12:24:12 -0700 Subject: [PATCH 46/52] Add gpu tests --- .github/workflows/validate_docker_images.yml | 22 ++++++++++++++++++-- 1 file changed, 20 insertions(+), 2 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 8fdb1a964..8d3ad01f4 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -19,7 +19,7 @@ jobs: with: channel: ${{ inputs.channel }} secrets: inherit - run-tests: + run-cpu-tests: needs: generate-matrix runs-on: ubuntu-latest strategy: @@ -31,4 +31,22 @@ jobs: - name: Run smoke tests run: python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled - + run-gpu-tests: + needs: generate-matrix + strategy: + matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} + fail-fast: false + uses: pytorch/test-infra/.github/workflows/linux_job.yml@main + with: + runner: linux.g5.4xlarge.nvidia.gpu + repository: "pytorch/builder" + ref: ${{ inputs.ref || github.ref }} + job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + binary-matrix: ${{ toJSON(matrix) }} + docker-image: ${{matrix.docker}} + timeout: 180 + script: | + set -ex + export MATRIX_GPU_ARCH_TYPE="cuda" + export MATRIX_GPU_ARCH_VERSION="${{ matrix.cuda }}" + python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled From d9ac7f328c9dfbbf96762c84dca444195e334f32 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 12:27:43 -0700 Subject: [PATCH 47/52] Testing using push --- .github/workflows/validate_docker_images.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 8d3ad01f4..99779e04f 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -13,6 +13,10 @@ on: - 'release' - 'all' + push: + branches: + - '*' + jobs: generate-matrix: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main From fcb32e0c12c53dee8bd52303a81a50e02056bb94 Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 12:33:31 -0700 Subject: [PATCH 48/52] Remove trigger on push --- .github/workflows/validate_docker_images.yml | 4 ---- 1 file changed, 4 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 99779e04f..8d3ad01f4 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -13,10 +13,6 @@ on: - 'release' - 'all' - push: - branches: - - '*' - jobs: generate-matrix: uses: pytorch/test-infra/.github/workflows/generate_docker_release_matrix.yml@main From 404cff893a684100847b5bca51872ad078f88abd Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 12:47:32 -0700 Subject: [PATCH 49/52] Remove run-cpu-tests --- .github/workflows/validate_docker_images.yml | 12 ------------ 1 file changed, 12 deletions(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 8d3ad01f4..4c1eacc5a 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -19,18 +19,6 @@ jobs: with: channel: ${{ inputs.channel }} secrets: inherit - run-cpu-tests: - needs: generate-matrix - runs-on: ubuntu-latest - strategy: - matrix: ${{ fromJson(needs.generate-matrix.outputs.matrix) }} - container: - image: ${{matrix.docker}} - steps: - - uses: actions/checkout@v3 - - name: Run smoke tests - run: - python test/smoke_test/smoke_test.py --package torchonly --runtime-error-check enabled run-gpu-tests: needs: generate-matrix strategy: From 30e49bda9fe8492be6d8aeb467d85e202345e97d Mon Sep 17 00:00:00 2001 From: Julia Guo <153684546+juliagmt-google@users.noreply.github.com> Date: Wed, 10 Apr 2024 12:48:23 -0700 Subject: [PATCH 50/52] Update job_name Co-authored-by: Andrey Talman --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 4c1eacc5a..3362a791c 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -29,7 +29,7 @@ jobs: runner: linux.g5.4xlarge.nvidia.gpu repository: "pytorch/builder" ref: ${{ inputs.ref || github.ref }} - job-name: pytorch:2.2.2-cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} + job-name: cuda${{ matrix.cuda }}-cudnn${{ matrix.cudnn_version }}-${{ matrix.image_type }} binary-matrix: ${{ toJSON(matrix) }} docker-image: ${{matrix.docker}} timeout: 180 From 1a49fe076ecbca8d8c7433c061efbfb500350abc Mon Sep 17 00:00:00 2001 From: Andrey Talman Date: Wed, 10 Apr 2024 15:49:32 -0400 Subject: [PATCH 51/52] Update .github/workflows/validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 3362a791c..04946e693 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -11,7 +11,6 @@ on: - 'nightly' - 'test' - 'release' - - 'all' jobs: generate-matrix: From 9089c5d34e0562d684bff7c94ac4728f3dff8341 Mon Sep 17 00:00:00 2001 From: Andrey Talman Date: Wed, 10 Apr 2024 15:49:59 -0400 Subject: [PATCH 52/52] Update .github/workflows/validate_docker_images.yml --- .github/workflows/validate_docker_images.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/validate_docker_images.yml b/.github/workflows/validate_docker_images.yml index 04946e693..b55b54d5c 100644 --- a/.github/workflows/validate_docker_images.yml +++ b/.github/workflows/validate_docker_images.yml @@ -6,7 +6,7 @@ on: description: 'PyTorch channel to use (nightly, test, release, all)' required: true type: choice - default: 'all' + default: 'nightly' options: - 'nightly' - 'test'