Skip to content

Commit 7bf5997

Browse files
authored
Docs update, fix download links for llama models (#2055)
* add docs for llama3 + inference
* Update llama2-70b README.md
* Update main.py
1 parent fa5d4f7 commit 7bf5997

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

48 files changed

+374
-205
lines changed

.github/workflows/build_wheels.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,7 @@ on:
1111
paths:
1212
- loadgen/**
1313

14+
1415
jobs:
1516
update_version:
1617
name: Update version only on ubuntu but used by windows and macos
@@ -133,6 +134,7 @@ jobs:
133134
with:
134135
name: wheels-windows-latest
135136
path: wheels
137+
# Publish
136138
- name: Publish
137139
uses: pypa/gh-action-pypi-publish@release/v1
138140
with:

.github/workflows/publish.yaml

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,6 @@
22

33
name: Publish site
44

5-
65
on:
76
release:
87
types: [published]

.github/workflows/test-bert.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
22
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
33

4-
name: Test for MLPerf inference bert submission generation using CM script automation
4+
name: Test for MLPerf inference bert submission generation using MLC script automation
55

66
on:
77
pull_request:
@@ -33,7 +33,7 @@ jobs:
3333
python-version: ${{ matrix.python-version }}
3434
- name: Install dependencies
3535
run: |
36-
python3 -m pip install cm4mlops
36+
python3 -m pip install mlc-scripts
3737
- name: Test BERT and end to end submission generation
3838
run: |
39-
cm run script --tags=run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --hw_name=default --model=bert-99 --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --adr.compiler.tags=gcc --adr.inference-src.version=custom --adr.inference-src.tags=_repo.${{ github.event.pull_request.head.repo.html_url }},_branch.$PR_HEAD_REF --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom
39+
mlcr run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --hw_name=default --model=bert-99 --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --adr.compiler.tags=gcc --adr.inference-src.version=custom --adr.inference-src.tags=_repo.${{ github.event.pull_request.head.repo.html_url }},_branch.$PR_HEAD_REF --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom

.github/workflows/test-calibration-downloads.yml

Lines changed: 94 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,94 @@
1+
name: Test for the downloads of calibration datasets
2+
on:
3+
pull_request:
4+
branches: [ "master", "dev" ]
5+
paths:
6+
- vision/classification_and_detection/**
7+
- language/**
8+
- recommendation/**
9+
- .github/workflows/test-calibration-downloads.yml
10+
- '!**.md'
11+
12+
env:
13+
PR_HEAD_REF: ${{ github.event.pull_request.head.ref }}
14+
15+
jobs:
16+
download-imagenet:
17+
runs-on: ubuntu-latest
18+
strategy:
19+
fail-fast: false
20+
matrix:
21+
python-version: [ "3.9" ]
22+
23+
steps:
24+
- uses: actions/checkout@v4
25+
- name: Set up Python ${{ matrix.python-version }}
26+
uses: actions/setup-python@v3
27+
with:
28+
python-version: ${{ matrix.python-version }}
29+
- name: Install dependencies
30+
run: |
31+
python3 -m pip install mlc-scripts
32+
- name: Download Imagenet Calibration
33+
run: |
34+
mlcr get,dataset,imagenet,_calibration --outdirname=. --quiet
35+
36+
download-openimages:
37+
runs-on: ubuntu-latest
38+
strategy:
39+
fail-fast: false
40+
matrix:
41+
python-version: [ "3.9" ]
42+
43+
steps:
44+
- uses: actions/checkout@v4
45+
- name: Set up Python ${{ matrix.python-version }}
46+
uses: actions/setup-python@v3
47+
with:
48+
python-version: ${{ matrix.python-version }}
49+
- name: Install dependencies
50+
run: |
51+
python3 -m pip install mlc-scripts
52+
- name: Download Openimages Calibration
53+
run: |
54+
mlcr get,dataset,openimages,_calibration --outdirname=. --quiet
55+
56+
download-igbh:
57+
runs-on: ubuntu-latest
58+
strategy:
59+
fail-fast: false
60+
matrix:
61+
python-version: [ "3.9" ]
62+
63+
steps:
64+
- uses: actions/checkout@v4
65+
- name: Set up Python ${{ matrix.python-version }}
66+
uses: actions/setup-python@v3
67+
with:
68+
python-version: ${{ matrix.python-version }}
69+
- name: Install dependencies
70+
run: |
71+
python3 -m pip install mlc-scripts
72+
# - name: Download IGBH Calibration
73+
# run: |
74+
# mlcr get,dataset,igbh,_calibration --outdirname=. --quiet
75+
76+
download-squad:
77+
runs-on: ubuntu-latest
78+
strategy:
79+
fail-fast: false
80+
matrix:
81+
python-version: [ "3.9" ]
82+
83+
steps:
84+
- uses: actions/checkout@v4
85+
- name: Set up Python ${{ matrix.python-version }}
86+
uses: actions/setup-python@v3
87+
with:
88+
python-version: ${{ matrix.python-version }}
89+
- name: Install dependencies
90+
run: |
91+
python3 -m pip install mlc-scripts
92+
- name: Download SQUAD Calibration
93+
run: |
94+
mlcr get,dataset,squad,_calib1 --outdirname=. --quiet

.github/workflows/test-loadgen.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
22
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
33

4-
name: Test for MLPerf inference loadgen using CM script automation
4+
name: Test for MLPerf inference loadgen using MLC script automation
55

66
on:
77
pull_request:
@@ -31,7 +31,7 @@ jobs:
3131
python-version: ${{ matrix.python-version }}
3232
- name: Install dependencies
3333
run: |
34-
python3 -m pip install cm4mlops
34+
python3 -m pip install mlc-scripts
3535
- name: Test Loadgen
3636
run: |
37-
cm run script --tags=get,mlperf,inference,loadgen --quiet --version=custom --adr.inference-src.tags=_repo.${{ github.event.pull_request.head.repo.html_url }},_branch.$PR_HEAD_REF --adr.loadgen.tags=_no-compilation-warnings
37+
mlcr get,mlperf,inference,loadgen --quiet --version=custom --adr.inference-src.tags=_repo.${{ github.event.pull_request.head.repo.html_url }},_branch.$PR_HEAD_REF --adr.loadgen.tags=_no-compilation-warnings

.github/workflows/test-resnet50.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
22
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
33

4-
name: Test for MLPerf inference resnet50 submission generation using CM script automation
4+
name: Test for MLPerf inference resnet50 submission generation using MLC script automation
55

66
on:
77
pull_request:
@@ -35,7 +35,7 @@ jobs:
3535
python-version: ${{ matrix.python-version }}
3636
- name: Install dependencies
3737
run: |
38-
python3 -m pip install cm4mlops
38+
python3 -m pip install mlc-scripts
3939
- name: Test Resnet50 and end to end submission generation
4040
run: |
41-
cm run script --tags=run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --hw_name=default --model=resnet50 --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=500 --adr.compiler.tags=gcc --adr.inference-src.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src.version=custom --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom ${{ matrix.loadgen-flag }}
41+
mlcr run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --hw_name=default --model=resnet50 --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=500 --adr.compiler.tags=gcc --adr.inference-src.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src.version=custom --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom ${{ matrix.loadgen-flag }}

.github/workflows/test-retinanet.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
22
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
33

4-
name: Test for MLPerf inference retinanet submission generation using CM script automation
4+
name: Test for MLPerf inference retinanet submission generation using MLC script automation
55

66
on:
77
pull_request:
@@ -33,7 +33,7 @@ jobs:
3333
python-version: ${{ matrix.python-version }}
3434
- name: Install dependencies
3535
run: |
36-
python3 -m pip install cm4mlops
36+
python3 -m pip install mlc-scripts
3737
- name: Test Retinanet and end to end submission generation
3838
run: |
39-
cm run script --tags=run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --hw_name=default --model=retinanet --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=10 --adr.compiler.tags=gcc --adr.inference-src.version=custom --adr.inference-src.tags=_repo.${{ github.event.pull_request.head.repo.html_url }},_branch.$PR_HEAD_REF --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom
39+
mlcr run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --hw_name=default --model=retinanet --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=10 --adr.compiler.tags=gcc --adr.inference-src.version=custom --adr.inference-src.tags=_repo.${{ github.event.pull_request.head.repo.html_url }},_branch.$PR_HEAD_REF --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom

.github/workflows/test-rgat.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
name: Test for MLPerf inference rgat submission generation using CM script automation
1+
name: Test for MLPerf inference rgat submission generation using MLC script automation
22

33
on:
44
pull_request:
@@ -32,7 +32,7 @@ jobs:
3232
python-version: ${{ matrix.python-version }}
3333
- name: Install dependencies
3434
run: |
35-
python3 -m pip install cm4mlops
35+
python3 -m pip install mlc-scripts
3636
- name: Test R-GAT and end to end submission generation
3737
run: |
38-
cm run script --tags=run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --category=datacenter --hw_name=default --model=rgat --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=500 --adr.compiler.tags=gcc --adr.inference-src.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom ${{ matrix.loadgen-flag }}
38+
mlcr run,mlperf,inference,generate-run-cmds,_submission,_short --quiet --submitter="MLCommons" --category=datacenter --hw_name=default --model=rgat --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --test_query_count=500 --adr.compiler.tags=gcc --adr.inference-src.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.tags=_branch.$PR_HEAD_REF,_repo.${{ github.event.pull_request.head.repo.html_url }} --adr.inference-src-loadgen.version=custom --adr.loadgen.version=custom ${{ matrix.loadgen-flag }}

.github/workflows/test-rnnt.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
22
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
33

4-
name: Test for MLPerf inference rnnt submission generation using CM script automation
4+
name: Test for MLPerf inference rnnt submission generation using MLC script automation
55

66
on:
77
pull_request:
@@ -39,4 +39,4 @@ jobs:
3939
cm run script --quiet --tags=get,sys-utils-cm
4040
- name: Test RNNT and end to end submission generation
4141
run: |
42-
cm run script --tags=run,mlperf,inference,generate-run-cmds,_performance-only --quiet --submitter="MLCommons" --hw_name=default --model=rnnt --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --precision=${{ matrix.precision }} --adr.compiler.tags=gcc --adr.inference-src.version=custom --adr.inference-src.env.CM_GIT_CHECKOUT=$PR_HEAD_REF --adr.inference-src.env.CM_GIT_URL=${{ github.event.pull_request.head.repo.html_url }} --adr.ml-engine-pytorch.version=1.13.0 --adr.ml-engine-torchvision.version=0.14.1 --adr.librosa.version_max=0.9.1
42+
mlcr run,mlperf,inference,generate-run-cmds,_performance-only --quiet --submitter="MLCommons" --hw_name=default --model=rnnt --implementation=reference --backend=${{ matrix.backend }} --device=cpu --scenario=Offline --precision=${{ matrix.precision }} --adr.compiler.tags=gcc --adr.inference-src.version=custom --adr.inference-src.env.CM_GIT_CHECKOUT=$PR_HEAD_REF --adr.inference-src.env.CM_GIT_URL=${{ github.event.pull_request.head.repo.html_url }} --adr.ml-engine-pytorch.version=1.13.0 --adr.ml-engine-torchvision.version=0.14.1 --adr.librosa.version_max=0.9.1

.github/workflows/test-submission-checker.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
22
# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions
33

4-
name: Test for MLPerf inference submission checker using CM script automation
4+
name: Test for MLPerf inference submission checker using MLC script automation
55

66
on:
77
pull_request:

0 commit comments

Comments
 (0)