Commit 376af18

add googlenet, inception_v1 and shufflenet-v2 qdq models (#570)
* add googlenet, inception_v1 and shufflenet-v2 qdq models
* update test data
* update json

Signed-off-by: mengniwa <[email protected]>
Co-authored-by: Chun-Wei Chen <[email protected]>
1 parent ba62990 commit 376af18

File tree

10 files changed: +152, -3 lines

ONNX_HUB_MANIFEST.json

Lines changed: 128 additions & 0 deletions

@@ -2185,6 +2185,49 @@
             "model_with_data_bytes": 5724344
         }
     },
+    {
+        "model": "GoogleNet-qdq",
+        "model_path": "vision/classification/inception_and_googlenet/googlenet/model/googlenet-12-qdq.onnx",
+        "onnx_version": "1.12",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "f764ae1ed52e5fca319a43a19e9526d2f028e7f10b9d17a8eefcb098cd90d36d",
+            "model_bytes": 7135204,
+            "tags": [
+                "vision",
+                "classification",
+                "inception and googlenet",
+                "googlenet"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "data_0",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "prob_1",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/inception_and_googlenet/googlenet/model/googlenet-12-qdq.tar.gz",
+            "model_with_data_sha": "5587255e94438edd7c0017f5355178546b150deea05ed5e59109a4d4ae9aa4b3",
+            "model_with_data_bytes": 5562451
+        }
+    },
     {
         "model": "GoogleNet",
         "model_path": "vision/classification/inception_and_googlenet/googlenet/model/googlenet-12.onnx",
@@ -2564,6 +2607,49 @@
             "model_with_data_bytes": 9474526
         }
     },
+    {
+        "model": "Inception-1-qdq",
+        "model_path": "vision/classification/inception_and_googlenet/inception_v1/model/inception-v1-12-qdq.onnx",
+        "onnx_version": "1.12",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "c6a8e07c53ea417a0001ebba885a3a623f1c3c51fac105485aca638e2f3de25d",
+            "model_bytes": 7135424,
+            "tags": [
+                "vision",
+                "classification",
+                "inception and googlenet",
+                "inception v1"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "data_0",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "prob_1",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/inception_and_googlenet/inception_v1/model/inception-v1-12-qdq.tar.gz",
+            "model_with_data_sha": "c981fd944a125d3626cb79720c7f0a57309da5a24994c0378e2657fdca87a869",
+            "model_with_data_bytes": 5559367
+        }
+    },
     {
         "model": "Inception-1",
         "model_path": "vision/classification/inception_and_googlenet/inception_v1/model/inception-v1-12.onnx",
@@ -4820,6 +4906,48 @@
             "model_with_data_bytes": 2488137
         }
     },
+    {
+        "model": "ShuffleNet-v2-qdq",
+        "model_path": "vision/classification/shufflenet/model/shufflenet-v2-12-qdq.onnx",
+        "onnx_version": "1.12",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "7c536d02e2f6af9569e5f3c7a4d8282060072119524c93c8da71e63876b4722b",
+            "model_bytes": 2415805,
+            "tags": [
+                "vision",
+                "classification",
+                "shufflenet"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "input",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "output",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/shufflenet/model/shufflenet-v2-12-qdq.tar.gz",
+            "model_with_data_sha": "071594e233cedf5688501c9b67cad30c4babb1b46771fb87afe7fd1beb1cc008",
+            "model_with_data_bytes": 2245304
+        }
+    },
     {
         "model": "ShuffleNet-v2-fp32",
         "model_path": "vision/classification/shufflenet/model/shufflenet-v2-12.onnx",

vision/classification/inception_and_googlenet/googlenet/README.md

Lines changed: 2 additions & 1 deletion

@@ -11,6 +11,7 @@
 |GoogleNet| [28 MB](model/googlenet-9.onnx) | [31 MB](model/googlenet-9.tar.gz) | 1.4 | 9| | |
 |GoogleNet| [27 MB](model/googlenet-12.onnx) | [25 MB](model/googlenet-12.tar.gz) | 1.9 | 12|67.78|88.34|
 |GoogleNet-int8| [7 MB](model/googlenet-12-int8.onnx) | [5 MB](model/googlenet-12-int8.tar.gz) | 1.9 | 12|67.73|88.32|
+|GoogleNet-qdq| [7 MB](model/googlenet-12-qdq.onnx) | [5 MB](model/googlenet-12-qdq.tar.gz) | 1.12 | 12 | 67.73 | 88.31 |
 > Compared with the fp32 GoogleNet, int8 GoogleNet's Top-1 accuracy drop ratio is 0.07%, Top-5 accuracy drop ratio is 0.02% and performance improvement is 1.27x.
 >
 > **Note**
@@ -103,7 +104,7 @@ just the center crop. (Using the average of 10 crops,
 (4 + 1 center) * 2 mirror, should obtain a bit higher accuracy.)
 
 ## Quantization
-GoogleNet-int8 is obtained by quantizing fp32 GoogleNet model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/googlenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+GoogleNet-int8 and GoogleNet-qdq are obtained by quantizing the fp32 GoogleNet model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with the onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/googlenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0
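
For a quick sanity check of the new QDQ file outside the zoo's test harness, the manifest's io_ports (input "data_0", output "prob_1") are enough to drive onnxruntime. A hedged sketch, with random data standing in for the real preprocessed ImageNet crops this README describes, so only shapes are exercised, not accuracy:

```python
# Smoke test of googlenet-12-qdq.onnx with onnxruntime on CPU.
import numpy as np
import onnxruntime as ort

sess = ort.InferenceSession("googlenet-12-qdq.onnx",
                            providers=["CPUExecutionProvider"])
x = np.random.rand(1, 3, 224, 224).astype(np.float32)  # input "data_0"
(prob,) = sess.run(["prob_1"], {"data_0": x})
print(prob.shape)  # expect (1, 1000): one probability per ImageNet class
```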

vision/classification/inception_and_googlenet/googlenet/model/googlenet-12-qdq.onnx

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f764ae1ed52e5fca319a43a19e9526d2f028e7f10b9d17a8eefcb098cd90d36d
+size 7135204
vision/classification/inception_and_googlenet/googlenet/model/googlenet-12-qdq.tar.gz

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5587255e94438edd7c0017f5355178546b150deea05ed5e59109a4d4ae9aa4b3
+size 5562451

vision/classification/inception_and_googlenet/inception_v1/README.md

Lines changed: 2 additions & 1 deletion

@@ -11,6 +11,7 @@
 |Inception-1| [28 MB](model/inception-v1-9.onnx) | [29 MB](model/inception-v1-9.tar.gz) | 1.4 | 9| |
 |Inception-1| [27 MB](model/inception-v1-12.onnx) | [25 MB](model/inception-v1-12.tar.gz) | 1.9 | 12| 67.23|
 |Inception-1-int8| [10 MB](model/inception-v1-12-int8.onnx) | [9 MB](model/inception-v1-12-int8.tar.gz) | 1.9 | 12| 67.24|
+|Inception-1-qdq| [7 MB](model/inception-v1-12-qdq.onnx) | [5 MB](model/inception-v1-12-qdq.tar.gz) | 1.12 | 12 | 67.21 |
 > Compared with the fp32 Inception-1, int8 Inception-1's Top-1 accuracy drop ratio is -0.01% and performance improvement is 1.26x.
 >
 > **Note**
@@ -51,7 +52,7 @@ random generated sampe test data:
 ## Results/accuracy on test set
 
 ## Quantization
-Inception-1-int8 is obtained by quantizing fp32 Inception-1 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/inception/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+Inception-1-int8 and Inception-1-qdq are obtained by quantizing the fp32 Inception-1 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with the onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/inception/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0
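
The zoo's QDQ models were produced with Intel® Neural Compressor per the instructions linked above; as a rough illustration of what the QDQ format itself is, onnxruntime's built-in static quantizer can emit the same QuantizeLinear/DequantizeLinear pattern. A sketch only, not the recipe used here: the paths are placeholders and the dummy calibration reader should be replaced by real ImageNet batches.

```python
# Illustrative QDQ quantization with onnxruntime (not the Intel Neural
# Compressor flow used by the zoo). Paths below are placeholders.
import numpy as np
from onnxruntime.quantization import (CalibrationDataReader, QuantFormat,
                                      quantize_static)

class RandomCalibration(CalibrationDataReader):
    """Feeds a few random batches; real calibration needs ImageNet data."""
    def __init__(self, n=8):
        self.batches = iter(
            {"data_0": np.random.rand(1, 3, 224, 224).astype(np.float32)}
            for _ in range(n))
    def get_next(self):
        return next(self.batches, None)

quantize_static(
    "inception-v1-12.onnx",        # fp32 input model (placeholder path)
    "inception-v1-12-qdq.onnx",    # quantized output
    RandomCalibration(),
    quant_format=QuantFormat.QDQ,  # insert QuantizeLinear/DequantizeLinear pairs
)
```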

vision/classification/inception_and_googlenet/inception_v1/model/inception-v1-12-qdq.onnx

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6a8e07c53ea417a0001ebba885a3a623f1c3c51fac105485aca638e2f3de25d
+size 7135424
vision/classification/inception_and_googlenet/inception_v1/model/inception-v1-12-qdq.tar.gz

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c981fd944a125d3626cb79720c7f0a57309da5a24994c0378e2657fdca87a869
+size 5559367

vision/classification/shufflenet/README.md

Lines changed: 2 additions & 1 deletion

@@ -31,6 +31,7 @@ ONNX ShuffleNet-v2 ==> Quantized ONNX ShuffleNet-v2
 |ShuffleNet-v2 |[9.2MB](model/shufflenet-v2-10.onnx) | [8.7MB](model/shufflenet-v2-10.tar.gz) | 1.6 | 10 | 30.64 | 11.68|
 |ShuffleNet-v2-fp32 |[8.79MB](model/shufflenet-v2-12.onnx) |[8.69MB](model/shufflenet-v2-12.tar.gz) |1.9 |12 |33.65 |13.43|
 |ShuffleNet-v2-int8 |[2.28MB](model/shufflenet-v2-12-int8.onnx) |[2.37MB](model/shufflenet-v2-12-int8.tar.gz) |1.9 |12 |33.85 |13.66 |
+|ShuffleNet-v2-qdq |[2.30MB](model/shufflenet-v2-12-qdq.onnx) |[2.68MB](model/shufflenet-v2-12-qdq.tar.gz) |1.12 |12 |33.88 |19.94 |
 > Compared with the fp32 ShuffleNet-v2, int8 ShuffleNet-v2's Top-1 error rising ratio is 0.59%, Top-5 error rising ratio is 1.71% and performance improvement is 1.62x.
 >
 > Note the performance depends on the test hardware.
@@ -79,7 +80,7 @@ Details of performance on COCO object detection are provided in [this paper](htt
 <hr>
 
 ## Quantization
-ShuffleNet-v2-int8 is obtained by quantizing ShuffleNet-v2-fp32 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/shufflenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+ShuffleNet-v2-int8 and ShuffleNet-v2-qdq are obtained by quantizing the ShuffleNet-v2-fp32 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with the onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/shufflenet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0
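
The "error rising ratio" quoted in this README is a relative change in error rate; the figures check out against the table's fp32 and int8 columns. A sketch of the arithmetic:

```python
# Relative error increase of int8 vs. fp32 ShuffleNet-v2, using the
# Top-1/Top-5 error rates from the table above.
fp32_top1, int8_top1 = 33.65, 33.85
fp32_top5, int8_top5 = 13.43, 13.66
print(f"Top-1: {(int8_top1 - fp32_top1) / fp32_top1:.2%}")  # -> 0.59%
print(f"Top-5: {(int8_top5 - fp32_top5) / fp32_top5:.2%}")  # -> 1.71%
```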

vision/classification/shufflenet/model/shufflenet-v2-12-qdq.onnx

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c536d02e2f6af9569e5f3c7a4d8282060072119524c93c8da71e63876b4722b
+size 2415805
vision/classification/shufflenet/model/shufflenet-v2-12-qdq.tar.gz

Lines changed: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:071594e233cedf5688501c9b67cad30c4babb1b46771fb87afe7fd1beb1cc008
+size 2245304
