# Runs a short MLPerf inference BERT-99 submission test through the MLC
# automation CLI (`mlcr`) on every pull request targeting main or dev.
name: MLPerf inference bert (deepsparse, tf, onnxruntime, pytorch)

on:
  pull_request:
    branches: [ "main", "dev" ]
    paths:
      # '**' already matches this workflow file; the explicit entry is kept
      # for readability. Markdown-only changes do not trigger the workflow.
      - '.github/workflows/test-mlperf-inference-bert-deepsparse-tf-onnxruntime-pytorch.yml'
      - '**'
      - '!**.md'

jobs:
  build:
    runs-on: ${{ matrix.os }}
    strategy:
      # Let the remaining matrix jobs finish even if one of them fails.
      fail-fast: false
      matrix:
        # 3.12 did not work as of 2024-03-05 - needs to be re-checked
        python-version: [ "3.11" ]
        backend: [ "deepsparse", "tf", "onnxruntime", "pytorch" ]
        precision: [ "int8", "fp32" ]
        os: [ubuntu-latest, windows-latest, macos-latest]
        # Each exclude entry removes every combination that matches it, so
        # the effective matrix is deepsparse + int8 on ubuntu-latest and
        # macos-latest only. Delete an entry to re-enable that dimension.
        exclude:
          - backend: tf
          - backend: pytorch
          - backend: onnxruntime
          - precision: fp32
          - os: windows-latest

    steps:
      # v3 of these actions targets the deprecated Node 16 runtime; v4/v5
      # accept the same inputs used here.
      - uses: actions/checkout@v4
      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v5
        with:
          python-version: ${{ matrix.python-version }}
      - name: Install mlcflow
        # Installs the package from the checked-out repository, then pulls
        # the dev branch of the automation repo that provides the scripts.
        run: |
          python -m pip install --upgrade pip
          python -m pip install --ignore-installed --verbose pip setuptools
          python -m pip install .
          mlc pull repo mlcommons@mlperf-automations --branch=dev
      # Windows variant: additionally requests loadgen from pip
      # (--adr.loadgen.tags=_from-pip --pip_loadgen=yes) and uses an hw_name
      # without the _x86 suffix.
      # NOTE(review): this step never runs at the moment because
      # windows-latest is excluded from the matrix above; presumably kept so
      # Windows can be re-enabled by removing that exclude entry - confirm.
      - name: Test MLPerf Inference Bert ${{ matrix.backend }} on ${{ matrix.os }}
        if: matrix.os == 'windows-latest'
        run: |
          mlcr --tags=run,mlperf,inference,generate-run-cmds,_submission,_short --submitter="MLCommons" --hw_name=gh_${{ matrix.os }} --model=bert-99 --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=5 --adr.loadgen.tags=_from-pip --pip_loadgen=yes --precision=${{ matrix.precision }} --target_qps=1 -v --quiet
      # Linux/macOS variant.
      # NOTE(review): the _x86 suffix in hw_name is also applied on
      # macos-latest, which may be an arm64 runner - confirm the name is
      # still the intended one there.
      - name: Test MLPerf Inference Bert ${{ matrix.backend }} on ${{ matrix.os }}
        if: matrix.os != 'windows-latest'
        run: |
          mlcr --tags=run,mlperf,inference,generate-run-cmds,_submission,_short --submitter="MLCommons" --hw_name=gh_${{ matrix.os }}_x86 --model=bert-99 --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=5 --precision=${{ matrix.precision }} --target_qps=1 -v --quiet