diff --git a/.github/workflows/check_failed_tests.yml b/.github/workflows/check_failed_tests.yml index 478f9d0ae2a..adafd5c046b 100644 --- a/.github/workflows/check_failed_tests.yml +++ b/.github/workflows/check_failed_tests.yml @@ -41,7 +41,7 @@ jobs: check_new_failures: name: " " runs-on: - group: aws-g4dn-4xlarge-cache + group: aws-g5-4xlarge-cache container: image: ${{ inputs.docker }} options: --gpus all --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ diff --git a/.github/workflows/doctest_job.yml b/.github/workflows/doctest_job.yml index b881bc38e59..86368b0f4ca 100644 --- a/.github/workflows/doctest_job.yml +++ b/.github/workflows/doctest_job.yml @@ -28,7 +28,7 @@ jobs: matrix: split_keys: ${{ fromJson(inputs.split_keys) }} runs-on: - group: aws-g4dn-4xlarge-cache + group: aws-g5-4xlarge-cache container: image: huggingface/transformers-all-latest-gpu options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ diff --git a/.github/workflows/doctests.yml b/.github/workflows/doctests.yml index bdf967a6d9e..925701a4c10 100644 --- a/.github/workflows/doctests.yml +++ b/.github/workflows/doctests.yml @@ -15,7 +15,7 @@ jobs: setup: name: Setup runs-on: - group: aws-g4dn-4xlarge-cache + group: aws-g5-4xlarge-cache container: image: huggingface/transformers-all-latest-gpu options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ diff --git a/.github/workflows/model_jobs.yml b/.github/workflows/model_jobs.yml index c9096bec3c6..b7818d798d5 100644 --- a/.github/workflows/model_jobs.yml +++ b/.github/workflows/model_jobs.yml @@ -107,9 +107,9 @@ jobs: run: | echo "${{ inputs.machine_type }}" - if [ "${{ inputs.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ inputs.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ inputs.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ inputs.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ inputs.machine_type }} diff --git a/.github/workflows/self-comment-ci.yml b/.github/workflows/self-comment-ci.yml index d2883e19425..e9f07cd591a 100644 --- a/.github/workflows/self-comment-ci.yml +++ b/.github/workflows/self-comment-ci.yml @@ -185,7 +185,7 @@ jobs: fail-fast: false matrix: folders: ${{ fromJson(needs.get-tests.outputs.models) }} - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -239,9 +239,9 @@ jobs: shell: bash run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -292,7 +292,7 @@ jobs: fail-fast: false matrix: folders: ${{ fromJson(needs.get-tests.outputs.quantizations) }} - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -338,9 +338,9 @@ jobs: shell: bash run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} diff --git a/.github/workflows/self-push.yml b/.github/workflows/self-push.yml index 3b3be41e3e9..3ce1ae55992 100644 --- a/.github/workflows/self-push.yml +++ b/.github/workflows/self-push.yml @@ -31,7 +31,7 @@ jobs: name: Setup strategy: matrix: - machine_type: [aws-g4dn-2xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -131,7 +131,7 @@ jobs: fail-fast: false matrix: folders: ${{ fromJson(needs.setup.outputs.matrix) }} - machine_type: [aws-g4dn-2xlarge-cache] + machine_type: [aws-g5-4xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -169,9 +169,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -244,7 +244,7 @@ jobs: fail-fast: false matrix: folders: ${{ fromJson(needs.setup.outputs.matrix) }} - machine_type: [aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -282,9 +282,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -357,7 +357,7 @@ jobs: strategy: fail-fast: false matrix: - machine_type: [aws-g4dn-2xlarge-cache] + machine_type: [aws-g5-4xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -395,9 +395,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -467,7 +467,7 @@ jobs: strategy: fail-fast: false matrix: - machine_type: [aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -505,9 +505,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} diff --git a/.github/workflows/self-scheduled.yml b/.github/workflows/self-scheduled.yml index 2ddf1071710..7a2b7470e15 100644 --- a/.github/workflows/self-scheduled.yml +++ b/.github/workflows/self-scheduled.yml @@ -50,7 +50,7 @@ jobs: name: Setup strategy: matrix: - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -128,7 +128,7 @@ jobs: strategy: fail-fast: false matrix: - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] slice_id: [0, 1] uses: ./.github/workflows/model_jobs.yml with: @@ -145,7 +145,7 @@ jobs: strategy: fail-fast: false matrix: - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -179,9 +179,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -213,7 +213,7 @@ jobs: strategy: fail-fast: false matrix: - machine_type: [aws-g4dn-4xlarge-cache] + machine_type: [aws-g5-4xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -247,9 +247,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -282,7 +282,7 @@ jobs: strategy: fail-fast: false matrix: - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -344,9 +344,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }} @@ -381,7 +381,7 @@ jobs: fail-fast: false matrix: folders: ${{ fromJson(needs.setup.outputs.quantization_matrix) }} - machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache] + machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache] runs-on: group: '${{ matrix.machine_type }}' container: @@ -424,9 +424,9 @@ jobs: run: | echo "${{ matrix.machine_type }}" - if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then + if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then machine_type=single-gpu - elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then + elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then machine_type=multi-gpu else machine_type=${{ matrix.machine_type }}