Skip to content

Commit 3a14f23

Browse files
committed
chore: rebase and minor changes
Signed-off-by: Dheeraj Peri <[email protected]>
1 parent bfae556 commit 3a14f23

File tree

2 files changed

+14
-5
lines changed

2 files changed

+14
-5
lines changed

tools/perf/README.md

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -127,3 +127,12 @@ Eg:
127127
--backends torch,torch_tensorrt,tensorrt \
128128
--report "vgg_perf_bs1.txt"
129129
```
130+
131+
### Example models
132+
133+
This tool benchmarks any PyTorch model or TorchScript module. As examples, we provide VGG16, ResNet50, EfficientNet-B0, ViT, and Hugging Face BERT models in `hub.py`, which we test internally for performance.
134+
The TorchScript modules for these models can be generated by running:
135+
```
136+
python hub.py
137+
```
138+
Refer to `benchmark.sh` to see how we run and benchmark these models.

tools/perf/benchmark.sh

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@ batch_sizes=(1 2 4 8 16 32 64 128 256)
99

1010
#Benchmark VGG16 model
1111
echo "Benchmarking VGG16 model"
12-
for bs in batch_sizes
12+
for bs in ${batch_sizes[@]}
1313
do
1414
python perf_run.py --model ${MODELS_DIR}/vgg16_scripted.jit.pt \
1515
--precision fp32,fp16 --inputs="(${bs}, 3, 224, 224)" \
@@ -20,7 +20,7 @@ done
2020

2121
# Benchmark Resnet50 model
2222
echo "Benchmarking Resnet50 model"
23-
for bs in batch_sizes
23+
for bs in ${batch_sizes[@]}
2424
do
2525
python perf_run.py --model ${MODELS_DIR}/resnet50_scripted.jit.pt \
2626
--precision fp32,fp16 --inputs="(${bs}, 3, 224, 224)" \
@@ -31,7 +31,7 @@ done
3131

3232
# Benchmark VIT model
3333
echo "Benchmarking VIT model"
34-
for bs in batch_sizes
34+
for bs in ${batch_sizes[@]}
3535
do
3636
python perf_run.py --model ${MODELS_DIR}/vit_scripted.jit.pt \
3737
--precision fp32,fp16 --inputs="(${bs}, 3, 224, 224)" \
@@ -42,7 +42,7 @@ done
4242

4343
# Benchmark EfficientNet-B0 model
4444
echo "Benchmarking EfficientNet-B0 model"
45-
for bs in batch_sizes
45+
for bs in ${batch_sizes[@]}
4646
do
4747
python perf_run.py --model ${MODELS_DIR}/efficientnet_b0_scripted.jit.pt \
4848
--precision fp32,fp16 --inputs="(${bs}, 3, 224, 224)" \
@@ -53,7 +53,7 @@ done
5353

5454
# Benchmark BERT model
5555
echo "Benchmarking Huggingface BERT base model"
56-
for bs in batch_sizes
56+
for bs in ${batch_sizes[@]}
5757
do
5858
python perf_run.py --model ${MODELS_DIR}/bert_base_uncased_traced.jit.pt \
5959
--precision fp32 --inputs="(${bs}, 128)@int32;(${bs}, 128)@int32" \

0 commit comments

Comments
 (0)