Commit 482f9b0

Create upload_benchmark_results reusable workflow (#7269)
This is needed to unblock pytorch/helion#732. Unravelling the current upload_benchmark_results GHA, the new `.github/workflows/upload_benchmark_results.yml` reusable workflow takes 4 inputs:

1. The benchmark artifact itself, uploaded to GitHub via `actions/upload-artifact`.
2. The benchmark metadata, including the workflow ID, job ID, repo, and branch name. This is collected by the new `gather-benchmark-metadata` GHA.
3. The runner info, including the GPU or CPU type. This is collected by the new `gather-runners-info` GHA.
4. The list of dependencies. This is collected by the new `gather-dependencies` GHA.

Two examples of how to use the new reusable workflow are at:

* `.github/workflows/test_upload_benchmark_results.yml`
* Helion pytorch/helion#758

---------

Signed-off-by: Huy Do <[email protected]>
1 parent cf868af commit 482f9b0

File tree: 6 files changed, +315 −3 lines

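For a downstream repository, the end-to-end wiring looks roughly like the minimal sketch below, modelled on the test workflow added in this commit: one job runs the benchmark, uploads the results artifact, and gathers the metadata, runner info, and dependencies with the new GHAs; a second job forwards everything to the reusable workflow. The runner label, branch filter, benchmark command, and output directory are illustrative placeholders, not part of this change; only the artifact/metadata/runners/dependencies plumbing comes from this commit.

name: Run benchmarks and upload results (illustrative sketch)

on:
  push:
    branches: [main]

jobs:
  benchmark:
    # Placeholder runner label; use whatever runner executes your benchmark
    runs-on: linux.g5.4xlarge.nvidia.gpu
    outputs:
      benchmark-metadata: ${{ steps.gather-benchmark-metadata.outputs.benchmark-metadata }}
      runners-info: ${{ steps.gather-runners-info.outputs.runners-info }}
      dependencies: ${{ steps.gather-dependencies.outputs.dependencies }}
    steps:
      - uses: actions/checkout@v4

      # Placeholder benchmark step; it needs to write v3-format results into a directory
      - name: Run the benchmark
        run: python3 benchmarks/run.py --output benchmark-results/v3

      # 1. The benchmark artifact itself
      - name: Upload benchmark results artifact
        uses: actions/upload-artifact@v4
        with:
          name: benchmark-results
          path: benchmark-results/v3

      # 2. Workflow and job metadata
      - name: Gather benchmark metadata
        id: gather-benchmark-metadata
        uses: pytorch/test-infra/.github/actions/gather-benchmark-metadata@main
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}

      # 3. Runner (GPU or CPU) info
      - name: Gather runners info
        id: gather-runners-info
        uses: pytorch/test-infra/.github/actions/gather-runners-info@main

      # 4. Dependencies (currently a stub that returns {})
      - name: Gather dependencies
        id: gather-dependencies
        uses: pytorch/test-infra/.github/actions/gather-dependencies@main

  upload:
    needs: benchmark
    uses: pytorch/test-infra/.github/workflows/upload_benchmark_results.yml@main
    permissions:
      id-token: write
      contents: read
    with:
      benchmark-artifact: benchmark-results
      benchmark-metadata: ${{ needs.benchmark.outputs.benchmark-metadata }}
      runners-info: ${{ needs.benchmark.outputs.runners-info }}
      dependencies: ${{ needs.benchmark.outputs.dependencies }}
      schema-version: v3
      dry-run: true

Setting dry-run: false would perform the actual upload; the in-repo example in .github/workflows/test_upload_benchmark_results.yml below keeps it at true.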
.github/actions/gather-benchmark-metadata (new composite action)
Lines changed: 69 additions & 0 deletions

name: Gather benchmark metadata

description: Gather the metadata about the benchmark run

inputs:
  github-token:
    default: ''
  schema-version:
    default: 'v3'
  venv:
    description: 'Path to virtual environment to activate'
    required: false
    default: ''

outputs:
  benchmark-metadata:
    description: The benchmark metadata in JSON format
    value: ${{ steps.gather-metadata.outputs.metadata }}

runs:
  using: composite
  steps:
    - name: Check that GITHUB_TOKEN is defined
      env:
        GITHUB_TOKEN: ${{ inputs.github-token }}
      shell: bash
      run: |
        set -eux

        if [[ -z "${GITHUB_TOKEN}" ]]; then
          echo "Missing github-token input"
          exit 1
        fi

    - name: Get workflow job id
      if: ${{ inputs.github-token != '' }}
      id: get-job-id
      uses: pytorch/test-infra/.github/actions/get-workflow-job-id@main
      with:
        github-token: ${{ inputs.github-token }}

    - name: Gather the metadata
      id: gather-metadata
      shell: bash
      env:
        SCHEMA_VERSION: ${{ inputs.schema-version }}
        REPO: ${{ github.repository }}
        HEAD_BRANCH: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.ref || github.ref }}
        HEAD_SHA: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
        WORKFLOW_RUN_ID: ${{ github.run_id }}
        RUN_ATTEMPT: ${{ github.run_attempt }}
        JOB_ID: ${{ inputs.github-token != '' && steps.get-job-id.outputs.job-id || '0' }}
        JOB_NAME: ${{ inputs.github-token != '' && steps.get-job-id.outputs.job-name || '' }}
      run: |
        set -eux

        if [[ -n "${{ inputs.venv }}" ]]; then
          source "${{ inputs.venv }}"
        fi

        python3 "${GITHUB_ACTION_PATH}/../../scripts/benchmarks/gather_metadata.py" \
          --schema-version "${SCHEMA_VERSION}" \
          --repo "${REPO}" \
          --head-branch "${HEAD_BRANCH}" \
          --head-sha "${HEAD_SHA}" \
          --workflow-id "${WORKFLOW_RUN_ID}" \
          --run-attempt "${RUN_ATTEMPT}" \
          --job-id "${JOB_ID}" \
          --job-name "${JOB_NAME}"
.github/actions/gather-dependencies (new composite action)
Lines changed: 26 additions & 0 deletions

name: Gather dependencies

description: Gather the list of all dependencies

inputs:
  venv:
    description: 'Path to virtual environment to activate'
    required: false
    default: ''

outputs:
  dependencies:
    description: The list of all dependencies in JSON format
    value: ${{ steps.gather-dependencies.outputs.dependencies }}

runs:
  using: composite
  steps:
    - name: Gather the dependencies information
      id: gather-dependencies
      shell: bash
      run: |
        set -eux

        # TODO (huydhn): Implement this part
        echo "dependencies={}" >> "${GITHUB_OUTPUT}"
.github/actions/gather-runners-info (new composite action)
Lines changed: 61 additions & 0 deletions

name: Gather runners info

description: Gather the information about the runners

inputs:
  venv:
    description: 'Path to virtual environment to activate'
    required: false
    default: ''

outputs:
  runners-info:
    description: The runners info in JSON format
    value: ${{ steps.gather-runners-info.outputs.runners }}

runs:
  using: composite
  steps:
    - name: Get device name
      shell: bash
      run: |
        set -eux

        if command -v nvidia-smi; then
          DEVICE_NAME=cuda
          nvidia-smi
        elif command -v rocm-smi; then
          DEVICE_NAME=rocm
          rocm-smi
        else
          DEVICE_NAME=cpu
          lscpu
        fi
        echo "DEVICE_NAME=$DEVICE_NAME" >> $GITHUB_ENV

    - name: Get device type
      shell: bash
      run: |
        set -eux

        if [[ "${DEVICE_NAME}" == "cuda" ]]; then
          DEVICE_TYPE=$(nvidia-smi -i 0 --query-gpu=name --format=csv,noheader | awk '{print $2}')
        elif [[ "${DEVICE_NAME}" == "rocm" ]]; then
          DEVICE_TYPE=$(rocminfo | grep "Marketing Name" | tail -n1 | awk -F':' '{print $2}' | xargs)
        elif [[ "${DEVICE_NAME}" == "cpu" ]]; then
          DEVICE_TYPE=$(lscpu | grep 'Model name' | cut -f 2 -d ":" | awk '{$1=$1}1' | cut -f 2 -d " ")
        fi
        echo "DEVICE_TYPE=$DEVICE_TYPE" >> $GITHUB_ENV

    - name: Gather the runners information
      id: gather-runners-info
      shell: bash
      run: |
        set -eux

        if [[ -n "${{ inputs.venv }}" ]]; then
          source "${{ inputs.venv }}"
        fi

        python3 -mpip install psutil==7.0.0 nvidia-ml-py==13.580.82
        python3 "${GITHUB_ACTION_PATH}/../../scripts/benchmarks/gather_runners_info.py"
.github/workflows/test_gather_benchmark_info.yml (new workflow)
Lines changed: 41 additions & 0 deletions

name: Test all GHA to gather different benchmark info

on:
  workflow_call:
    outputs:
      benchmark-metadata:
        value: ${{ jobs.test-gather-benchmark-info.outputs.benchmark-metadata }}
      runners-info:
        value: ${{ jobs.test-gather-benchmark-info.outputs.runners-info }}
      dependencies:
        value: ${{ jobs.test-gather-benchmark-info.outputs.dependencies }}

jobs:
  test-gather-benchmark-info:
    runs-on: linux.2xlarge
    outputs:
      benchmark-metadata: ${{ steps.gather-benchmark-metadata.outputs.benchmark-metadata }}
      runners-info: ${{ steps.gather-runners-info.outputs.runners-info }}
      dependencies: ${{ steps.gather-dependencies.outputs.dependencies }}
    steps:
      - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2

      - name: Gather benchmark metadata
        id: gather-benchmark-metadata
        uses: ./.github/actions/gather-benchmark-metadata
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}

      - name: Gather runners info
        id: gather-runners-info
        uses: ./.github/actions/gather-runners-info

      - name: Gather dependencies
        id: gather-dependencies
        uses: ./.github/actions/gather-dependencies

      - name: Upload the mock benchmark results
        uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4.6.2
        with:
          name: benchmark-results
          path: .github/scripts/benchmark-results-dir-for-testing/v3

.github/workflows/test_upload_benchmark_results.yml

Lines changed: 32 additions & 3 deletions

@@ -3,20 +3,49 @@ name: Test upload-benchmark-results
 on:
   pull_request:
     paths:
+      # GHA route
+      - .github/scripts/benchmarks/*
       - .github/scripts/upload_benchmark_results.py
-      - .github/workflows/test_upload_benchmark_results.ym
       - .github/actions/upload-benchmark-results/*
+      # Reusable workflow route
+      - .github/actions/gather-benchmark-metadata/*
+      - .github/actions/gather-runners-info/*
+      - .github/actions/gather-dependencies/*
+      - .github/workflows/upload_benchmark_results.yml
+      # The test workflow itself
+      - .github/workflows/test_upload_benchmark_results.yml
+
+permissions:
+  id-token: write
+  contents: read

 jobs:
-  test:
+  test-upload-benchmark-results-gha:
     runs-on: linux.2xlarge
     steps:
       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2

-      - name: Test upload the benchmark results (v3)
+      - name: Test upload the benchmark results
         uses: ./.github/actions/upload-benchmark-results
         with:
           benchmark-results-dir: .github/scripts/benchmark-results-dir-for-testing/v3
           schema-version: v3
           dry-run: true
           github-token: ${{ secrets.GITHUB_TOKEN }}
+
+  test-gather-benchmark-info:
+    uses: ./.github/workflows/test_gather_benchmark_info.yml
+
+  test-upload-benchmark-results-reusable-workflow:
+    needs: test-gather-benchmark-info
+    uses: ./.github/workflows/upload_benchmark_results.yml
+    permissions:
+      id-token: write
+      contents: read
+    with:
+      benchmark-artifact: benchmark-results
+      benchmark-metadata: ${{ needs.test-gather-benchmark-info.outputs.benchmark-metadata }}
+      runners-info: ${{ needs.test-gather-benchmark-info.outputs.runners-info }}
+      dependencies: ${{ needs.test-gather-benchmark-info.outputs.dependencies }}
+      schema-version: v3
+      dry-run: true
.github/workflows/upload_benchmark_results.yml (new reusable workflow)
Lines changed: 86 additions & 0 deletions

name: Upload benchmark results

on:
  workflow_call:
    inputs:
      benchmark-artifact:
        description: The name of the benchmark artifact to upload
        required: true
        type: string
      benchmark-metadata:
        description: The benchmark metadata provided by gather-benchmark-metadata GHA
        required: true
        type: string
      runners-info:
        description: The runners info gathered by gather-runners-info GHA
        required: true
        type: string
      dependencies:
        description: The list of dependencies (not yet implemented)
        required: false
        type: string
        default: '{}'
      schema-version:
        default: 'v3'
        type: string
      dry-run:
        default: true
        type: boolean

jobs:
  job:
    name: Uploading ${{ inputs.benchmark-artifact }}
    runs-on: linux.2xlarge
    # Keep this in case we need to use OIDC later on, so the permission is there
    permissions:
      id-token: write
      contents: read
    steps:
      - name: Checkout test-infra
        uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
        with:
          repository: pytorch/test-infra
          ref: main
          path: test-infra

      - name: Download benchmark artifacts
        uses: actions/download-artifact@65a9edc5881444af0b9093a5e628f2fe47ea3b2e # v4.1.7
        with:
          name: ${{ inputs.benchmark-artifact }}
          path: ${{ runner.temp }}/benchmark-artifact

      - name: Upload benchmark results
        shell: bash
        working-directory: test-infra
        env:
          BENCHMARK_RESULTS_DIR: ${{ runner.temp }}/benchmark-artifact
          DRY_RUN: ${{ inputs.dry-run }}
          # Additional information about the benchmarks
          BENCHMARK_METADATA: ${{ inputs.benchmark-metadata }}
          RUNNERS_INFO: ${{ inputs.runners-info }}
          DEPENDENCIES: ${{ inputs.dependencies }}
        run: |
          set -eux

          if [[ ! -d "${BENCHMARK_RESULTS_DIR}" ]]; then
            echo "${BENCHMARK_RESULTS_DIR} does not exist, skipping"
            # We don't want the job to fail if the directory doesn't exist
            exit 0
          fi

          python3 -mpip install boto3==1.35.33

          if [[ "${DRY_RUN}" == "true" ]]; then
            python3 ".github/scripts/upload_benchmark_results.py" \
              --benchmark-results-dir "${BENCHMARK_RESULTS_DIR}" \
              --metadata "${BENCHMARK_METADATA}" \
              --runners "${RUNNERS_INFO}" \
              --dependencies "${DEPENDENCIES}" \
              --dry-run
          else
            python3 ".github/scripts/upload_benchmark_results.py" \
              --benchmark-results-dir "${BENCHMARK_RESULTS_DIR}" \
              --metadata "${BENCHMARK_METADATA}" \
              --runners "${RUNNERS_INFO}" \
              --dependencies "${DEPENDENCIES}"
          fi
