From a96b93183db6cf0d129a6bdb8e7628ce6eced017 Mon Sep 17 00:00:00 2001 From: Logan Adams Date: Wed, 3 Apr 2024 11:46:10 -0700 Subject: [PATCH 1/2] Update workflows that use cu116 to cu117 --- .github/workflows/nv-accelerate-v100.yml | 2 +- .github/workflows/nv-ds-chat.yml | 2 +- .github/workflows/nv-inference.yml | 2 +- .github/workflows/nv-mii.yml | 2 +- .github/workflows/nv-nightly.yml | 4 ++-- .github/workflows/nv-torch-latest-v100.yml | 2 +- .github/workflows/nv-torch-nightly-v100.yml | 2 +- .github/workflows/nv-transformers-v100.yml | 2 +- 8 files changed, 9 insertions(+), 9 deletions(-) diff --git a/.github/workflows/nv-accelerate-v100.yml b/.github/workflows/nv-accelerate-v100.yml index 93286b62610a..1fccbece2994 100644 --- a/.github/workflows/nv-accelerate-v100.yml +++ b/.github/workflows/nv-accelerate-v100.yml @@ -19,7 +19,7 @@ concurrency: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/nv-ds-chat.yml b/.github/workflows/nv-ds-chat.yml index 61011a85b92c..f61637be7e0e 100644 --- a/.github/workflows/nv-ds-chat.yml +++ b/.github/workflows/nv-ds-chat.yml @@ -21,7 +21,7 @@ permissions: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/nv-inference.yml b/.github/workflows/nv-inference.yml index 2b74e7e155df..6b339f457802 100644 --- a/.github/workflows/nv-inference.yml +++ b/.github/workflows/nv-inference.yml @@ -22,7 +22,7 @@ concurrency: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/nv-mii.yml b/.github/workflows/nv-mii.yml index 0b3f128be5a4..31379f7e758b 100644 --- a/.github/workflows/nv-mii.yml +++ b/.github/workflows/nv-mii.yml @@ -27,7 +27,7 @@ concurrency: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/nv-nightly.yml b/.github/workflows/nv-nightly.yml index e540b5acaf33..3de5adcaea73 100644 --- a/.github/workflows/nv-nightly.yml +++ b/.github/workflows/nv-nightly.yml @@ -15,7 +15,7 @@ permissions: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 @@ -25,7 +25,7 @@ jobs: - name: Install pytorch run: | - pip install -U --cache-dir $TORCH_CACHE torch==1.13.1 torchvision --index-url https://download.pytorch.org/whl/cu116 + pip install -U --cache-dir $TORCH_CACHE torch==1.13.1 torchvision --index-url https://download.pytorch.org/whl/cu117 python -c "import torch; print('torch:', torch.__version__, torch)" python -c "import torch; print('CUDA available:', torch.cuda.is_available())" diff --git a/.github/workflows/nv-torch-latest-v100.yml b/.github/workflows/nv-torch-latest-v100.yml index e2d0f172dcbf..14d33680521d 100644 --- a/.github/workflows/nv-torch-latest-v100.yml +++ b/.github/workflows/nv-torch-latest-v100.yml @@ -19,7 +19,7 @@ concurrency: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/nv-torch-nightly-v100.yml b/.github/workflows/nv-torch-nightly-v100.yml index f46c5089b241..bd13047f6078 100644 --- a/.github/workflows/nv-torch-nightly-v100.yml +++ b/.github/workflows/nv-torch-nightly-v100.yml @@ -15,7 +15,7 @@ permissions: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 diff --git a/.github/workflows/nv-transformers-v100.yml b/.github/workflows/nv-transformers-v100.yml index 4fbc42abec5f..75f53c95c235 100644 --- a/.github/workflows/nv-transformers-v100.yml +++ b/.github/workflows/nv-transformers-v100.yml @@ -18,7 +18,7 @@ concurrency: jobs: unit-tests: - runs-on: [self-hosted, nvidia, cu116, v100] + runs-on: [self-hosted, nvidia, cu117, v100] steps: - uses: actions/checkout@v3 From 0a780d9d533b79151c08682d4124a88a6acc67f3 Mon Sep 17 00:00:00 2001 From: Logan Adams Date: Thu, 4 Apr 2024 09:04:55 -0700 Subject: [PATCH 2/2] Update cuda version being checked --- .github/workflows/nv-nightly.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/nv-nightly.yml b/.github/workflows/nv-nightly.yml index 3de5adcaea73..ca091990cf4b 100644 --- a/.github/workflows/nv-nightly.yml +++ b/.github/workflows/nv-nightly.yml @@ -55,7 +55,7 @@ jobs: run: | unset TORCH_CUDA_ARCH_LIST # only jit compile for current arch cd tests - pytest $PYTEST_OPTS --forked -m 'nightly' unit/ --torch_ver="1.13" --cuda_ver="11.6" + pytest $PYTEST_OPTS --forked -m 'nightly' unit/ --torch_ver="1.13" --cuda_ver="11.7" - name: Open GitHub issue if nightly CI fails if: ${{ failure() && (github.event_name == 'schedule') }}