Commit 8e893eb

yuwenzho and jcwchen authored

add alexnet, caffenet and squeezenet qdq models (#571)

Signed-off-by: yuwenzho <[email protected]>
Co-authored-by: Chun-Wei Chen <[email protected]>

1 parent 376af18 commit 8e893eb

File tree

10 files changed: +155 −3 lines changed

ONNX_HUB_MANIFEST.json

Lines changed: 128 additions & 0 deletions

@@ -1131,6 +1131,48 @@
             "model_with_data_bytes": 40683138
         }
     },
+    {
+        "model": "AlexNet-qdq",
+        "model_path": "vision/classification/alexnet/model/bvlcalexnet-12-qdq.onnx",
+        "onnx_version": "1.9",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "c103c0f7b8f9d8d64b400e0899d5934d2a13d1f08368ba1907285aa0691f4cbb",
+            "model_bytes": 61009072,
+            "tags": [
+                "vision",
+                "classification",
+                "alexnet"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "data_0",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "prob_1",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/alexnet/model/bvlcalexnet-12-qdq.tar.gz",
+            "model_with_data_sha": "930eeb3f4d25a20e59fa21919f95edbb7a4b3f31b51a83f62c9b6627906156b9",
+            "model_with_data_bytes": 45565042
+        }
+    },
     {
         "model": "AlexNet",
         "model_path": "vision/classification/alexnet/model/bvlcalexnet-12.onnx",
@@ -1421,6 +1463,48 @@
             "model_with_data_bytes": 40718510
         }
     },
+    {
+        "model": "CaffeNet-qdq",
+        "model_path": "vision/classification/caffenet/model/caffenet-12-qdq.onnx",
+        "onnx_version": "1.9",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "ff1170e8123aa7b8d652bc43a9e9864ee6ba050653470f34dada9b6ad0731b40",
+            "model_bytes": 61009797,
+            "tags": [
+                "vision",
+                "classification",
+                "caffenet"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "data_0",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "prob_1",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/caffenet/model/caffenet-12-qdq.tar.gz",
+            "model_with_data_sha": "7d78cb5357b90e71f38c133715e67237c5156e21be0aa6e397c9654557364a6d",
+            "model_with_data_bytes": 45685092
+        }
+    },
     {
         "model": "CaffeNet",
         "model_path": "vision/classification/caffenet/model/caffenet-12.onnx",
@@ -5102,6 +5186,50 @@
             "model_with_data_bytes": 5151210
         }
     },
+    {
+        "model": "SqueezeNet 1.0-qdq",
+        "model_path": "vision/classification/squeezenet/model/squeezenet1.0-13-qdq.onnx",
+        "onnx_version": "1.9",
+        "opset_version": 13,
+        "metadata": {
+            "model_sha": "4a567dd7542ef440890d57268fabf47211174c593d7a1837bd7f16a1067169e7",
+            "model_bytes": 1345213,
+            "tags": [
+                "vision",
+                "classification",
+                "squeezenet"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "data_0",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "softmaxout_1",
+                        "shape": [
+                            1,
+                            1000,
+                            1,
+                            1
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/squeezenet/model/squeezenet1.0-13-qdq.tar.gz",
+            "model_with_data_sha": "d3a84101535d52ecf31503ff1645f170c7b156b6bc53f1492caec485b7c023a7",
+            "model_with_data_bytes": 1565787
+        }
+    },
     {
         "model": "SqueezeNet 1.0",
         "model_path": "vision/classification/squeezenet/model/squeezenet1.0-3.onnx",
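The three entries above all register QDQ-format models, which store quantization as explicit QuantizeLinear/DequantizeLinear node pairs in the graph rather than pre-quantized operator kernels. A minimal sketch of the per-tensor affine quantization those node pairs perform (the `scale` and `zero_point` values here are illustrative, not taken from the released models):

```python
import numpy as np

def quantize_linear(x, scale, zero_point):
    # QuantizeLinear: q = saturate(round(x / scale) + zero_point), uint8 range
    q = np.round(x / scale) + zero_point
    return np.clip(q, 0, 255).astype(np.uint8)

def dequantize_linear(q, scale, zero_point):
    # DequantizeLinear: x ≈ (q - zero_point) * scale
    return (q.astype(np.int32) - zero_point) * scale

# Illustrative parameters; real models carry per-tensor values chosen by calibration
scale, zero_point = 0.02, 128
x = np.array([-1.234, 0.0, 0.567, 0.999], dtype=np.float32)
q = quantize_linear(x, scale, zero_point)
x_hat = dequantize_linear(q, scale, zero_point)
# For in-range inputs the round-trip error is bounded by scale / 2
print(np.max(np.abs(x - x_hat)))
```

A runtime that recognizes the Q→DQ pattern can fuse it into true integer kernels; one that does not can still execute the graph in float, which is why QDQ models stay broadly compatible.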

vision/classification/alexnet/README.md

Lines changed: 3 additions & 1 deletion

@@ -11,6 +11,7 @@
 |AlexNet| [238 MB](model/bvlcalexnet-9.onnx) | [226 MB](model/bvlcalexnet-9.tar.gz) | 1.4 | 9| | |
 |AlexNet| [233 MB](model/bvlcalexnet-12.onnx) | [216 MB](model/bvlcalexnet-12.tar.gz) | 1.9 | 12|54.80|78.23|
 |AlexNet-int8| [58 MB](model/bvlcalexnet-12-int8.onnx) | [39 MB](model/bvlcalexnet-12-int8.tar.gz) | 1.9 | 12|54.68|78.23|
+|AlexNet-qdq| [59 MB](model/bvlcalexnet-12-qdq.onnx) | [44 MB](model/bvlcalexnet-12-qdq.tar.gz) | 1.9 | 12|54.71|78.22|
 > Compared with the fp32 AlextNet, int8 AlextNet's Top-1 accuracy drop ratio is 0.22%, Top-5 accuracy drop ratio is 0.05% and performance improvement is 2.26x.
 >
 > **Note**

@@ -63,7 +64,7 @@ This model obtains a top-1 accuracy 57.1% and a top-5 accuracy
 should obtain a bit higher accuracy.)
 
 ## Quantization
-AlexNet-int8 is obtained by quantizing fp32 AlexNet model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/alexnet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+AlexNet-int8 and AlexNet-qdq are obtained by quantizing fp32 AlexNet model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/alexnet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0

@@ -91,6 +92,7 @@ bash run_tuning.sh --input_model=path/to/model \ # model path as *.onnx
 
 ## Contributors
 * [mengniwang95](https://github.com/mengniwang95) (Intel)
+* [yuwenzho](https://github.com/yuwenzho) (Intel)
 * [airMeng](https://github.com/airMeng) (Intel)
 * [ftian1](https://github.com/ftian1) (Intel)
 * [hshen14](https://github.com/hshen14) (Intel)
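The README's 0.22% figure is the relative Top-1 drop computed from the table's fp32 and int8 rows; the same arithmetic applies to the new qdq row. A quick check of that calculation:

```python
def top1_drop_ratio(fp32_acc, quant_acc):
    # Relative accuracy drop, in percent, of a quantized model vs. its fp32 baseline
    return (fp32_acc - quant_acc) / fp32_acc * 100

int8_drop = top1_drop_ratio(54.80, 54.68)  # AlexNet-int8 row from the table
qdq_drop = top1_drop_ratio(54.80, 54.71)   # AlexNet-qdq row from the table
print(round(int8_drop, 2), round(qdq_drop, 2))  # → 0.22 0.16
```

So by the table's own numbers the qdq variant loses slightly less Top-1 accuracy than the int8 variant relative to the fp32 baseline.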
Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c103c0f7b8f9d8d64b400e0899d5934d2a13d1f08368ba1907285aa0691f4cbb
+size 61009072

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:930eeb3f4d25a20e59fa21919f95edbb7a4b3f31b51a83f62c9b6627906156b9
+size 45565042
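The three-line files above are Git LFS pointer files: the repository stores only an oid (a sha256 digest) and a byte size, and the actual model binaries live in LFS storage. A small sketch (the helper names are mine) of parsing a pointer and checking a downloaded blob against it:

```python
import hashlib

def parse_lfs_pointer(text):
    # Pointer files are "key value" lines: version, oid sha256:<hex>, size <bytes>
    fields = dict(line.split(" ", 1) for line in text.strip().splitlines())
    return fields["oid"].removeprefix("sha256:"), int(fields["size"])

def matches_pointer(blob, pointer_text):
    # A blob matches when both its length and its sha256 agree with the pointer
    oid, size = parse_lfs_pointer(pointer_text)
    return len(blob) == size and hashlib.sha256(blob).hexdigest() == oid

# Synthetic example: a tiny blob and a pointer built for it
blob = b"not a real onnx model"
pointer = (
    "version https://git-lfs.github.com/spec/v1\n"
    f"oid sha256:{hashlib.sha256(blob).hexdigest()}\n"
    f"size {len(blob)}\n"
)
print(matches_pointer(blob, pointer))  # True
```

The oid and size in each pointer match the `model_sha`/`model_bytes` (and `model_with_data_sha`/`model_with_data_bytes`) fields in the manifest entries above, so the same check can validate a download against ONNX_HUB_MANIFEST.json.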

vision/classification/caffenet/README.md

Lines changed: 3 additions & 1 deletion

@@ -11,6 +11,7 @@
 |CaffeNet| [238 MB](model/caffenet-9.onnx) | [244 MB](model/caffenet-9.tar.gz) | 1.4 | 9| | |
 |CaffeNet| [233 MB](model/caffenet-12.onnx) | [216 MB](model/caffenet-12.tar.gz) | 1.9 | 12|56.27 |79.52 |
 |CaffeNet-int8| [58 MB](model/caffenet-12-int8.onnx) | [39 MB](model/caffenet-12-int8.tar.gz) | 1.9 | 12| 56.22|79.52 |
+|CaffeNet-qdq| [59 MB](model/caffenet-12-qdq.onnx) | [44 MB](model/caffenet-12-qdq.tar.gz) | 1.9 | 12| 56.25|79.45 |
 > Compared with the fp32 CaffeNet, int8 CaffeNet's Top-1 accuracy drop ratio is 0.09%, Top-5 accuracy drop ratio is 0.13% and performance improvement is 3.08x.
 >
 > **Note**

@@ -64,7 +65,7 @@ This model obtains a top-1 accuracy 57.4% and a top-5 accuracy
 should obtain a bit higher accuracy still.)
 
 ## Quantization
-CaffeNet-int8 is obtained by quantizing fp32 CaffeNet model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/caffenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+CaffeNet-int8 and CaffeNet-qdq are obtained by quantizing fp32 CaffeNet model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/caffenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0

@@ -92,6 +93,7 @@ bash run_tuning.sh --input_model=path/to/model \ # model path as *.onnx
 
 ## Contributors
 * [mengniwang95](https://github.com/mengniwang95) (Intel)
+* [yuwenzho](https://github.com/yuwenzho) (Intel)
 * [airMeng](https://github.com/airMeng) (Intel)
 * [ftian1](https://github.com/ftian1) (Intel)
 * [hshen14](https://github.com/hshen14) (Intel)
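Per the manifest entries above, both quantized CaffeNet variants keep the fp32 model's input signature: a single `data_0` tensor of shape [1, 3, 224, 224]. A sketch of typical Caffe-style preprocessing to produce such a tensor (the BGR channel order and per-channel means are assumptions about the original Caffe training recipe, not taken from this commit):

```python
import numpy as np

# Assumed ImageNet BGR channel means from the classic Caffe recipe
BGR_MEANS = np.array([104.0, 117.0, 123.0], dtype=np.float32)

def to_data_0(image_hwc_rgb):
    """Turn a 224x224x3 uint8 RGB image into a [1, 3, 224, 224] float32 tensor."""
    img = image_hwc_rgb.astype(np.float32)[..., ::-1]  # RGB -> BGR
    img -= BGR_MEANS                                   # per-channel mean subtraction
    chw = np.transpose(img, (2, 0, 1))                 # HWC -> CHW
    return chw[np.newaxis, ...]                        # add batch dimension

# A dummy all-zero image stands in for a real decoded, resized JPEG
dummy = np.zeros((224, 224, 3), dtype=np.uint8)
tensor = to_data_0(dummy)
print(tensor.shape, tensor.dtype)  # (1, 3, 224, 224) float32
```

The resulting array could then be fed to an onnxruntime session as the `data_0` input; resizing/cropping to 224x224 is assumed to have happened beforehand.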
Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff1170e8123aa7b8d652bc43a9e9864ee6ba050653470f34dada9b6ad0731b40
+size 61009797

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d78cb5357b90e71f38c133715e67237c5156e21be0aa6e397c9654557364a6d
+size 45685092

vision/classification/squeezenet/README.md

Lines changed: 3 additions & 1 deletion

@@ -22,6 +22,7 @@ SqueezeNet 1.1 has 2.4x less computation and slightly fewer parameters than Sque
 |SqueezeNet 1.0| [5 MB](model/squeezenet1.0-9.onnx) | [11 MB](model/squeezenet1.0-9.tar.gz) | 1.4 | 9|
 |SqueezeNet 1.0| [5 MB](model/squeezenet1.0-12.onnx) | [5 MB](model/squeezenet1.0-12.tar.gz) | 1.9 | 12|56.85|79.87|
 |SqueezeNet 1.0-int8| [2 MB](model/squeezenet1.0-12-int8.onnx) | [2 MB](model/squeezenet1.0-12-int8.tar.gz) | 1.9 | 12|56.48|79.76|
+|SqueezeNet 1.0-qdq| [2 MB](model/squeezenet1.0-13-qdq.onnx) | [2 MB](model/squeezenet1.0-13-qdq.tar.gz) | 1.9 | 13|56.54|79.76|
 > Compared with the fp32 SqueezeNet 1.0, int8 SqueezeNet 1.0's Top-1 accuracy drop ratio is 0.65%, Top-5 accuracy drop ratio is 0.14% and performance improvement is 1.31x.
 >
 > **Note**

@@ -64,7 +65,7 @@ We used MXNet as framework with gluon APIs to perform training. View the [traini
 We used MXNet as framework with gluon APIs to perform validation. Use the notebook [imagenet_validation](../imagenet_validation.ipynb) to verify the accuracy of the model on the validation set. Make sure to specify the appropriate model name in the notebook.
 
 ## Quantization
-SqueezeNet 1.0-int8 is obtained by quantizing fp32 SqueezeNet 1.0 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/squeezenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+SqueezeNet 1.0-int8 and SqueezeNet 1.0-qdq are obtained by quantizing fp32 SqueezeNet 1.0 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/squeezenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0

@@ -97,6 +98,7 @@ SqueezeNet1.1 presented in the [Official SqueezeNet repo](https://github.com/Dee
 * [abhinavs95](https://github.com/abhinavs95) (Amazon AI)
 * [ankkhedia](https://github.com/ankkhedia) (Amazon AI)
 * [mengniwang95](https://github.com/mengniwang95) (Intel)
+* [yuwenzho](https://github.com/yuwenzho) (Intel)
 * [airMeng](https://github.com/airMeng) (Intel)
 * [ftian1](https://github.com/ftian1) (Intel)
 * [hshen14](https://github.com/hshen14) (Intel)
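Unlike the AlexNet and CaffeNet entries, whose `prob_1` output is [1, 1000], the SqueezeNet manifest entry declares a `softmaxout_1` output of shape [1, 1000, 1, 1], keeping the trailing spatial dimensions. A sketch (helper name is mine) of turning that tensor into top-5 class indices:

```python
import numpy as np

def top5_from_softmaxout(softmaxout):
    # softmaxout_1 arrives as [1, 1000, 1, 1]; drop batch and spatial dims first
    probs = np.squeeze(softmaxout)      # -> shape (1000,)
    top5 = np.argsort(probs)[::-1][:5]  # indices of the 5 largest scores
    return top5.tolist()

# Fake network output with a known winner at class 42 and runner-up at class 7
fake = np.zeros((1, 1000, 1, 1), dtype=np.float32)
fake[0, 42, 0, 0] = 0.9
fake[0, 7, 0, 0] = 0.1
print(top5_from_softmaxout(fake)[:2])  # [42, 7]
```

The extra `np.squeeze` is the only post-processing difference from the [1, 1000] models; the index-to-label mapping is the usual ImageNet class list.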
Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4a567dd7542ef440890d57268fabf47211174c593d7a1837bd7f16a1067169e7
+size 1345213

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3a84101535d52ecf31503ff1645f170c7b156b6bc53f1492caec485b7c023a7
+size 1565787
