From 2db4da5b5223adc1de4cae117f63c9b725c86ced Mon Sep 17 00:00:00 2001 From: Huy Do Date: Mon, 16 Dec 2024 13:40:12 -0800 Subject: [PATCH] Switch userbenchmark-a100 and v3-bisection to linux.aws.a100 (#2560) Summary: Per atalman comment in https://github.com/pytorch/pytorch/issues/143215#issuecomment-2546253999 Pull Request resolved: https://github.com/pytorch/benchmark/pull/2560 Reviewed By: xuzhao9 Differential Revision: D67287082 Pulled By: huydhn fbshipit-source-id: cd0514d521f1c7405b6ca6e56c35657833716b1b --- .github/workflows/userbenchmark-a100-bisection.yml | 7 +------ .github/workflows/userbenchmark-a100-release.yml | 7 +------ .github/workflows/userbenchmark-a100.yml | 7 +------ .github/workflows/v3-bisection.yml | 7 +------ 4 files changed, 4 insertions(+), 24 deletions(-) diff --git a/.github/workflows/userbenchmark-a100-bisection.yml b/.github/workflows/userbenchmark-a100-bisection.yml index 8f25e3919f..e133f194c8 100644 --- a/.github/workflows/userbenchmark-a100-bisection.yml +++ b/.github/workflows/userbenchmark-a100-bisection.yml @@ -28,7 +28,7 @@ jobs: AWS_SECRET_ACCESS_KEY: ${{ secrets.AWS_SECRET_ACCESS_KEY }} HUGGING_FACE_HUB_TOKEN: ${{ secrets.HUGGING_FACE_HUB_TOKEN }} if: ${{ github.repository_owner == 'pytorch' }} - runs-on: [a100-runner] + runs-on: linux.aws.a100 timeout-minutes: 2880 # 48 hours steps: - name: Checkout @@ -53,11 +53,6 @@ jobs: repository: pytorch/audio path: srcs/audio fetch-depth: 0 - - name: Tune Nvidia GPU - run: | - sudo nvidia-smi -pm 1 - sudo nvidia-smi -ac 1215,1410 - nvidia-smi - name: Install devel packages run: | sudo apt-get update -y diff --git a/.github/workflows/userbenchmark-a100-release.yml b/.github/workflows/userbenchmark-a100-release.yml index 6523af9691..90333dddc6 100644 --- a/.github/workflows/userbenchmark-a100-release.yml +++ b/.github/workflows/userbenchmark-a100-release.yml @@ -6,7 +6,7 @@ on: jobs: run-userbenchmark: - runs-on: [a100-runner] + runs-on: linux.aws.a100 timeout-minutes: 1440 # 24 hours 
environment: docker-s3-upload env: @@ -20,11 +20,6 @@ jobs: with: path: benchmark ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }} - - name: Tune Nvidia GPU - run: | - sudo nvidia-smi -pm 1 - sudo nvidia-smi -ac 1215,1410 - nvidia-smi - name: Clone and setup conda env run: | CONDA_ENV=${BASE_CONDA_ENV} . "${SETUP_SCRIPT}" diff --git a/.github/workflows/userbenchmark-a100.yml b/.github/workflows/userbenchmark-a100.yml index 67d4003bdf..70f8235efe 100644 --- a/.github/workflows/userbenchmark-a100.yml +++ b/.github/workflows/userbenchmark-a100.yml @@ -11,7 +11,7 @@ on: jobs: run-userbenchmark: - runs-on: [a100-runner] + runs-on: linux.aws.a100 timeout-minutes: 1440 # 24 hours environment: docker-s3-upload env: @@ -27,11 +27,6 @@ jobs: uses: actions/checkout@v3 with: path: benchmark - - name: Tune Nvidia GPU - run: | - sudo nvidia-smi -pm 1 - sudo nvidia-smi -ac 1215,1410 - nvidia-smi - name: Clone and setup conda env run: | CONDA_ENV=${BASE_CONDA_ENV} . "${SETUP_SCRIPT}" diff --git a/.github/workflows/v3-bisection.yml b/.github/workflows/v3-bisection.yml index 3d95417911..e68cbee809 100644 --- a/.github/workflows/v3-bisection.yml +++ b/.github/workflows/v3-bisection.yml @@ -20,7 +20,7 @@ jobs: AWS_ACCESS_KEY_ID: ${{ secrets.AWS_ACCESS_KEY_ID }} AWS_SECRET_ACCESS_KEY: ${{ secrets.AWS_SECRET_ACCESS_KEY }} if: ${{ github.repository_owner == 'pytorch' }} - runs-on: [a100-runner] + runs-on: linux.aws.a100 timeout-minutes: 2880 # 48 hours steps: - name: Checkout @@ -51,11 +51,6 @@ jobs: repository: pytorch/audio path: srcs/audio fetch-depth: 0 - - name: Tune Nvidia GPU - run: | - sudo nvidia-smi -pm 1 - sudo nvidia-smi -ac 1215,1410 - nvidia-smi - name: Install Deps run: | sudo apt-get -y update && sudo apt -y update