From 14b65941b08a9ceb479621394ae02059f8f1e1e7 Mon Sep 17 00:00:00 2001 From: Jirka Borovec <6035284+Borda@users.noreply.github.com> Date: Tue, 25 Jul 2023 10:30:09 -1000 Subject: [PATCH] ci: bump CUDA for nightly (#18162) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: Carlos Mocholí --- .azure/gpu-benchmarks.yml | 2 +- .azure/gpu-tests-fabric.yml | 6 +++--- .azure/gpu-tests-pytorch.yml | 6 +++--- .github/checkgroup.yml | 7 ++++--- .github/workflows/ci-dockers.yml | 8 ++++---- .github/workflows/release-docker.yml | 4 +++- 6 files changed, 18 insertions(+), 15 deletions(-) diff --git a/.azure/gpu-benchmarks.yml b/.azure/gpu-benchmarks.yml index 1859403af8..d03365ec17 100644 --- a/.azure/gpu-benchmarks.yml +++ b/.azure/gpu-benchmarks.yml @@ -46,7 +46,7 @@ jobs: variables: DEVICES: $( python -c 'print("$(Agent.Name)".split("_")[-1])' ) container: - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" options: "--gpus=all --shm-size=32g" strategy: matrix: diff --git a/.azure/gpu-tests-fabric.yml b/.azure/gpu-tests-fabric.yml index c32b92b8db..d1dd3b0b20 100644 --- a/.azure/gpu-tests-fabric.yml +++ b/.azure/gpu-tests-fabric.yml @@ -60,15 +60,15 @@ jobs: strategy: matrix: 'Fabric | latest': - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" IS_NIGHTLY: "false" PACKAGE_NAME: "fabric" 'Lightning | latest': - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" IS_NIGHTLY: "false" PACKAGE_NAME: "lightning" 'Lightning | nightly': - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: 
"pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" IS_NIGHTLY: "true" PACKAGE_NAME: "lightning" workspace: diff --git a/.azure/gpu-tests-pytorch.yml b/.azure/gpu-tests-pytorch.yml index e205588bee..4c9036cf4d 100644 --- a/.azure/gpu-tests-pytorch.yml +++ b/.azure/gpu-tests-pytorch.yml @@ -52,15 +52,15 @@ jobs: strategy: matrix: 'PyTorch | latest': - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" IS_NIGHTLY: "false" PACKAGE_NAME: "pytorch" 'Lightning | latest': - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" IS_NIGHTLY: "false" PACKAGE_NAME: "lightning" 'Lightning | nightly': - image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.7.1" + image: "pytorchlightning/pytorch_lightning:base-cuda-py3.10-torch2.0-cuda11.8.0" IS_NIGHTLY: "true" PACKAGE_NAME: "lightning" pool: lit-rtx-3090 diff --git a/.github/checkgroup.yml b/.github/checkgroup.yml index c278552aef..06f5da5b32 100644 --- a/.github/checkgroup.yml +++ b/.github/checkgroup.yml @@ -139,15 +139,16 @@ subprojects: - "!*.md" - "!**/*.md" checks: - - "build-cuda (3.9, 1.11, 11.3.1)" - "build-cuda (3.9, 1.12, 11.7.1)" + - "build-cuda (3.9, 1.13, 11.8.0)" - "build-cuda (3.9, 1.13, 12.0.1)" + - "build-cuda (3.10, 2.0, 11.8.0)" - "build-cuda (3.10, 2.0, 12.0.1)" - - "build-cuda (3.10, 2.0, 11.7.1)" #- "build-NGC" - - "build-pl (3.9, 1.11, 11.3.1)" - "build-pl (3.9, 1.12, 11.7.1)" + - "build-pl (3.9, 1.13, 11.8.0)" - "build-pl (3.9, 1.13, 12.0.1)" + - "build-pl (3.10, 2.0, 11.8.0)" - "build-pl (3.10, 2.0, 12.0.1)" # SECTIONS: lightning_data diff --git a/.github/workflows/ci-dockers.yml b/.github/workflows/ci-dockers.yml index d982539e6d..be23c28d46 100644 --- a/.github/workflows/ci-dockers.yml +++ b/.github/workflows/ci-dockers.yml @@ -42,9 
+42,10 @@ jobs: include: # We only release one docker image per PyTorch version. # The matrix here is the same as the one in release-docker.yml. - - {python_version: "3.9", pytorch_version: "1.11", cuda_version: "11.3.1"} - {python_version: "3.9", pytorch_version: "1.12", cuda_version: "11.7.1"} + - {python_version: "3.9", pytorch_version: "1.13", cuda_version: "11.8.0"} - {python_version: "3.9", pytorch_version: "1.13", cuda_version: "12.0.1"} + - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "11.8.0"} - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "12.0.1"} steps: - uses: actions/checkout@v3 @@ -70,12 +71,11 @@ jobs: include: # These are the base images for PL release docker images, # so include at least all of the combinations in release-dockers.yml. - - {python_version: "3.9", pytorch_version: "1.11", cuda_version: "11.3.1"} - {python_version: "3.9", pytorch_version: "1.12", cuda_version: "11.7.1"} + - {python_version: "3.9", pytorch_version: "1.13", cuda_version: "11.8.0"} - {python_version: "3.9", pytorch_version: "1.13", cuda_version: "12.0.1"} + - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "11.8.0"} - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "12.0.1"} - # these are used in Azure GPU CI - - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "11.7.1"} steps: - uses: actions/checkout@v3 - uses: docker/setup-buildx-action@v2 diff --git a/.github/workflows/release-docker.yml b/.github/workflows/release-docker.yml index a3a13e1f3f..41b7ac7c23 100644 --- a/.github/workflows/release-docker.yml +++ b/.github/workflows/release-docker.yml @@ -16,9 +16,11 @@ jobs: matrix: include: # We only release one docker image per PyTorch version. 
- - {python_version: "3.9", pytorch_version: "1.11", cuda_version: "11.3.1"} - {python_version: "3.9", pytorch_version: "1.12", cuda_version: "11.7.1"} + - {python_version: "3.9", pytorch_version: "1.13", cuda_version: "11.8.0"} - {python_version: "3.9", pytorch_version: "1.13", cuda_version: "12.0.1"} + - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "11.8.0"} + - {python_version: "3.10", pytorch_version: "2.0", cuda_version: "12.0.1"} steps: - name: Checkout uses: actions/checkout@v3