
Commit 3d125fa

yuwenzho and jcwchen authored
add vgg16, zfnet512 and fcn qdq models (#586)
* add vgg16, zfnet512 and fcn qdq models

  Signed-off-by: yuwenzho <[email protected]>

* reupload tar.gz file

  Signed-off-by: yuwenzho <[email protected]>

---------

Signed-off-by: yuwenzho <[email protected]>
Co-authored-by: Chun-Wei Chen <[email protected]>
1 parent da635bc commit 3d125fa

File tree (10 files changed: +165, -3 lines)

ONNX_HUB_MANIFEST.json
vision/classification/vgg/README.md
vision/classification/vgg/model/vgg16-12-qdq.onnx
vision/classification/vgg/model/vgg16-12-qdq.tar.gz
vision/classification/zfnet-512/README.md
vision/classification/zfnet-512/model/zfnet512-12-qdq.onnx
vision/classification/zfnet-512/model/zfnet512-12-qdq.tar.gz
vision/object_detection_segmentation/fcn/README.md
vision/object_detection_segmentation/fcn/model/fcn-resnet50-12-qdq.onnx
vision/object_detection_segmentation/fcn/model/fcn-resnet50-12-qdq.tar.gz


ONNX_HUB_MANIFEST.json

Lines changed: 138 additions & 0 deletions
@@ -5624,6 +5624,48 @@
             "model_with_data_bytes": 106112057
         }
     },
+    {
+        "model": "VGG 16-qdq",
+        "model_path": "vision/classification/vgg/model/vgg16-12-qdq.onnx",
+        "onnx_version": "1.9.0",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "74ae0fa7e9e5b16782581bf17b5582080d1c06b69ed59410c7b1f190d9328bb1",
+            "model_bytes": 138424439,
+            "tags": [
+                "vision",
+                "classification",
+                "vgg"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "data",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "vgg0_dense2_fwd",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/vgg/model/vgg16-12-qdq.tar.gz",
+            "model_with_data_sha": "ba8f1a789554deab15d28a3c4e6a1508595c326d36e5d744e8d5acf2729f7621",
+            "model_with_data_bytes": 103626016
+        }
+    },
     {
         "model": "VGG 16-fp32",
         "model_path": "vision/classification/vgg/model/vgg16-12.onnx",
@@ -6115,6 +6157,48 @@
             "model_with_data_bytes": 50270897
         }
     },
+    {
+        "model": "ZFNet-512-qdq",
+        "model_path": "vision/classification/zfnet-512/model/zfnet512-12-qdq.onnx",
+        "onnx_version": "1.9",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "d29f9fe228a3b1ea4333e69f156faee1075e610721b46730c7ebeeb9ede36727",
+            "model_bytes": 87288258,
+            "tags": [
+                "vision",
+                "classification",
+                "zfnet-512"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "gpu_0/data_0",
+                        "shape": [
+                            1,
+                            3,
+                            224,
+                            224
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "gpu_0/softmax_1",
+                        "shape": [
+                            1,
+                            1000
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/classification/zfnet-512/model/zfnet512-12-qdq.tar.gz",
+            "model_with_data_sha": "b65d9e14088acabfd11efccc7601cad1697b5ab48fe6074c41f15c9f7b5fed8c",
+            "model_with_data_bytes": 58038148
+        }
+    },
     {
         "model": "ZFNet-512",
         "model_path": "vision/classification/zfnet-512/model/zfnet512-12.onnx",
@@ -6874,6 +6958,60 @@
             "model_with_data_bytes": 30117697
         }
     },
+    {
+        "model": "FCN ResNet-50-qdq",
+        "model_path": "vision/object_detection_segmentation/fcn/model/fcn-resnet50-12-qdq.onnx",
+        "onnx_version": "1.8.0",
+        "opset_version": 12,
+        "metadata": {
+            "model_sha": "0a6aef19ef5401364aacb6883303401b4b7ccd3e3cd5eb60180b467dae88dcf5",
+            "model_bytes": 35440011,
+            "tags": [
+                "vision",
+                "object detection segmentation",
+                "fcn"
+            ],
+            "io_ports": {
+                "inputs": [
+                    {
+                        "name": "input",
+                        "shape": [
+                            "batch",
+                            3,
+                            "height",
+                            "width"
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ],
+                "outputs": [
+                    {
+                        "name": "out",
+                        "shape": [
+                            "batch",
+                            21,
+                            "height",
+                            "width"
+                        ],
+                        "type": "tensor(float)"
+                    },
+                    {
+                        "name": "aux",
+                        "shape": [
+                            "batch",
+                            21,
+                            "height",
+                            "width"
+                        ],
+                        "type": "tensor(float)"
+                    }
+                ]
+            },
+            "model_with_data_path": "vision/object_detection_segmentation/fcn/model/fcn-resnet50-12-qdq.tar.gz",
+            "model_with_data_sha": "0feb90c5e17f1fac9c21e17bd536e43aeb56c04adcf87d5eb66acc1ef57fbafe",
+            "model_with_data_bytes": 21876642
+        }
+    },
     {
         "model": "FCN ResNet-50",
         "model_path": "vision/object_detection_segmentation/fcn/model/fcn-resnet50-12.onnx",

vision/classification/vgg/README.md

Lines changed: 3 additions & 1 deletion
@@ -27,6 +27,7 @@ The models below are variant of same network with different number of layers and
 |VGG 19-bn| [548.1 MB](model/vgg19-bn-7.onnx) |[508.6 MB](model/vgg19-bn-7.tar.gz) | 1.2.1 |7 | 73.83 | 91.79 |
 |VGG 16-fp32| [527.8 MB](model/vgg16-12.onnx) |[488.2 MB](model/vgg16-12.tar.gz)| 1.9.0 | 12 | 72.38 | 91.00 |
 |VGG 16-int8| [132.0 MB](model/vgg16-12-int8.onnx) |[101.1 MB](model/vgg16-12-int8.tar.gz)| 1.9.0 | 12 | 72.32 | 90.97 |
+|VGG 16-qdq| [133.0 MB](model/vgg16-12-qdq.onnx) |[99 MB](model/vgg16-12-qdq.tar.gz)| 1.9.0 | 12 | 72.35 | 91.02 |
 > Compared with the fp32 VGG 16, int8 VGG 16's Top-1 accuracy drop ratio is 0.06%, Top-5 accuracy drop ratio is 0.03% and performance improvement is 2.31x.
 >
 > Note the performance depends on the test hardware.
@@ -81,7 +82,7 @@ We used MXNet as framework with gluon APIs to perform training. View the [traini
 We used MXNet as framework with gluon APIs to perform validation. Use the notebook [imagenet_validation](../imagenet_validation.ipynb) to verify the accuracy of the model on the validation set. Make sure to specify the appropriate model name in the notebook.
 
 ## Quantization
-VGG 16-int8 is obtained by quantizing VGG 16-fp32 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/vgg16/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+VGG 16-int8 and VGG 16-qdq are obtained by quantizing VGG 16-fp32 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/vgg16/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0
@@ -116,6 +117,7 @@ We use onnxruntime to perform VGG 16-fp32 and VGG 16-int8 inference. View the no
 * [abhinavs95](https://github.com/abhinavs95) (Amazon AI)
 * [ankkhedia](https://github.com/ankkhedia) (Amazon AI)
 * [mengniwang95](https://github.com/mengniwang95) (Intel)
+* [yuwenzho](https://github.com/yuwenzho) (Intel)
 * [airMeng](https://github.com/airMeng) (Intel)
 * [ftian1](https://github.com/ftian1) (Intel)
 * [hshen14](https://github.com/hshen14) (Intel)
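
The quantization paragraph in this README defers to Intel Neural Compressor for the actual recipe. As a rough, non-authoritative sketch of what producing a QDQ-format model involves, here is the equivalent flow using onnxruntime's own static quantization API; the file paths and the random calibration reader are placeholders, not what this PR used (real calibration needs representative images):

```python
# A minimal sketch of producing a QDQ-format model (explicit QuantizeLinear/
# DequantizeLinear pairs) with onnxruntime's static quantization API. The
# models in this PR were produced with Intel Neural Compressor instead.
import numpy as np
from onnxruntime.quantization import (
    CalibrationDataReader, QuantFormat, QuantType, quantize_static)

class RandomCalibrationReader(CalibrationDataReader):
    """Feeds a few batches shaped like the VGG input (1, 3, 224, 224)."""
    def __init__(self, n=8):
        self.batches = iter(
            {"data": np.random.rand(1, 3, 224, 224).astype(np.float32)}
            for _ in range(n))

    def get_next(self):
        return next(self.batches, None)

quantize_static(
    "vgg16-12.onnx",        # fp32 input model (placeholder path)
    "vgg16-12-qdq.onnx",    # QDQ output model (placeholder path)
    RandomCalibrationReader(),
    quant_format=QuantFormat.QDQ,
    activation_type=QuantType.QUInt8,
    weight_type=QuantType.QInt8)
```
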
vision/classification/vgg/model/vgg16-12-qdq.onnx

Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74ae0fa7e9e5b16782581bf17b5582080d1c06b69ed59410c7b1f190d9328bb1
+size 138424439

vision/classification/vgg/model/vgg16-12-qdq.tar.gz

Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ba8f1a789554deab15d28a3c4e6a1508595c326d36e5d744e8d5acf2729f7621
+size 103626016
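
The git-lfs pointers above carry the same sha256 digests and byte sizes as the manifest entry (model_sha/model_bytes and model_with_data_sha/model_with_data_bytes), so a download can be checked against either. A small stdlib sketch, not part of the PR, for doing that check:

```python
# Verify a downloaded model file against the sha256 digest recorded in the
# git-lfs pointer / ONNX hub manifest above.
import hashlib

def sha256_of(path: str, chunk: int = 1 << 20) -> str:
    h = hashlib.sha256()
    with open(path, "rb") as f:
        while block := f.read(chunk):   # stream to avoid loading 138 MB at once
            h.update(block)
    return h.hexdigest()

expected = "74ae0fa7e9e5b16782581bf17b5582080d1c06b69ed59410c7b1f190d9328bb1"
assert sha256_of("vgg16-12-qdq.onnx") == expected
```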

vision/classification/zfnet-512/README.md

Lines changed: 3 additions & 1 deletion
@@ -11,6 +11,7 @@
 |ZFNet-512| [341 MB](model/zfnet512-9.onnx) | [318 MB](model/zfnet512-9.tar.gz) | 1.4 | 9| | |
 |ZFNet-512| [333 MB](model/zfnet512-12.onnx) | [309 MB](model/zfnet512-12.tar.gz) | 1.9 | 12|55.97|79.41|
 |ZFNet-512-int8| [83 MB](model/zfnet512-12-int8.onnx) | [48 MB](model/zfnet512-12-int8.tar.gz) | 1.9 | 12|55.84|79.33|
+|ZFNet-512-qdq| [84 MB](model/zfnet512-12-qdq.onnx) | [56 MB](model/zfnet512-12-qdq.tar.gz) | 1.9 | 12|55.83|79.42|
 > Compared with the fp32 ZFNet-512, int8 ZFNet-512's Top-1 accuracy drop ratio is 0.23%, Top-5 accuracy drop ratio is 0.10% and performance improvement is 1.78x.
 >
 > **Note**
@@ -52,7 +53,7 @@ random generated sampe test data:
 ## Results/accuracy on test set
 
 ## Quantization
-ZFNet-512-int8 is obtained by quantizing fp32 ZFNet-512 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/zfnet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+ZFNet-512-int8 and ZFNet-512-qdq are obtained by quantizing fp32 ZFNet-512 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/zfnet/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0
@@ -80,6 +81,7 @@ bash run_tuning.sh --input_model=path/to/model \ # model path as *.onnx
 
 ## Contributors
 * [mengniwang95](https://github.com/mengniwang95) (Intel)
+* [yuwenzho](https://github.com/yuwenzho) (Intel)
 * [airMeng](https://github.com/airMeng) (Intel)
 * [ftian1](https://github.com/ftian1) (Intel)
 * [hshen14](https://github.com/hshen14) (Intel)
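
Running the new QDQ model follows the same onnxruntime flow as the int8 one. A minimal sketch using the input/output names recorded in the manifest entry above ("gpu_0/data_0" in, "gpu_0/softmax_1" out), with a random tensor standing in for a preprocessed image:

```python
# Sketch of ZFNet-512-qdq inference with onnxruntime; the random input is a
# placeholder for a properly preprocessed 224x224 image.
import numpy as np
import onnxruntime as ort

sess = ort.InferenceSession("zfnet512-12-qdq.onnx")
x = np.random.rand(1, 3, 224, 224).astype(np.float32)
(probs,) = sess.run(None, {"gpu_0/data_0": x})   # output "gpu_0/softmax_1"
print(probs.shape, int(probs.argmax()))          # (1, 1000), top-1 class id
```
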
vision/classification/zfnet-512/model/zfnet512-12-qdq.onnx

Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d29f9fe228a3b1ea4333e69f156faee1075e610721b46730c7ebeeb9ede36727
+size 87288258

vision/classification/zfnet-512/model/zfnet512-12-qdq.tar.gz

Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b65d9e14088acabfd11efccc7601cad1697b5ab48fe6074c41f15c9f7b5fed8c
+size 58038148

vision/object_detection_segmentation/fcn/README.md

Lines changed: 3 additions & 1 deletion
@@ -15,6 +15,7 @@ This specific model detects 20 different [classes](dependencies/voc_classes.txt)
 | FCN ResNet-101 | [207 MB](model/fcn-resnet101-11.onnx) | [281 MB](model/fcn-resnet101-11.tar.gz) | 1.8.0 | 11 | 63.7% |
 | FCN ResNet-50 | [134 MB](model/fcn-resnet50-12.onnx) | [125 MB](model/fcn-resnet50-12.tar.gz) | 1.8.0 | 12 | 65.0% |
 | FCN ResNet-50-int8 | [34 MB](model/fcn-resnet50-12-int8.onnx) | [29 MB](model/fcn-resnet50-12-int8.tar.gz) | 1.8.0 | 12 | 64.7% |
+| FCN ResNet-50-qdq | [34 MB](model/fcn-resnet50-12-qdq.onnx) | [21 MB](model/fcn-resnet50-12-qdq.tar.gz) | 1.8.0 | 12 | 64.4% |
 
 ### Source
 
@@ -145,7 +146,7 @@ The more conservative of the two estimates is used in the model files table.
 <hr>
 
 ## Quantization
-FCN ResNet 50-int8 is obtained by quantizing fp32 FCN ResNet 50 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/fcn/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
+FCN ResNet 50-int8 and FCN ResNet-50-qdq are obtained by quantizing fp32 FCN ResNet 50 model. We use [Intel® Neural Compressor](https://github.com/intel/neural-compressor) with onnxruntime backend to perform quantization. View the [instructions](https://github.com/intel/neural-compressor/blob/master/examples/onnxrt/image_recognition/onnx_model_zoo/fcn/quantization/ptq/README.md) to understand how to use Intel® Neural Compressor for quantization.
 
 ### Environment
 onnx: 1.9.0
@@ -176,6 +177,7 @@ bash run_tuning.sh --input_model=path/to/model \ # model path as *.onnx
 ## Contributors
 * [Jack Duvall](https://github.com/duvallj)
 * [mengniwang95](https://github.com/mengniwang95) (Intel)
+* [yuwenzho](https://github.com/yuwenzho) (Intel)
 * [airMeng](https://github.com/airMeng) (Intel)
 * [ftian1](https://github.com/ftian1) (Intel)
 * [hshen14](https://github.com/hshen14) (Intel)
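
Unlike the classifiers, the FCN manifest entry declares symbolic "batch"/"height"/"width" dimensions, so any input resolution works, and "out" holds 21 per-pixel score maps (the 20 VOC classes plus background). A hedged sketch of consuming the two outputs, with placeholder preprocessing rather than the model's documented pipeline:

```python
# Sketch of FCN ResNet-50-qdq inference: run both outputs and reduce "out"
# to a per-pixel label map. Input shape is dynamic per the manifest.
import numpy as np
import onnxruntime as ort

sess = ort.InferenceSession("fcn-resnet50-12-qdq.onnx")
img = np.random.rand(1, 3, 520, 520).astype(np.float32)   # any height/width
out, aux = sess.run(["out", "aux"], {"input": img})        # both (1, 21, H, W)
labels = out.argmax(axis=1)                                # (1, H, W) class ids
print(labels.shape, np.unique(labels))
```
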
vision/object_detection_segmentation/fcn/model/fcn-resnet50-12-qdq.onnx

Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a6aef19ef5401364aacb6883303401b4b7ccd3e3cd5eb60180b467dae88dcf5
+size 35440011

vision/object_detection_segmentation/fcn/model/fcn-resnet50-12-qdq.tar.gz

Lines changed: 3 additions & 0 deletions
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0feb90c5e17f1fac9c21e17bd536e43aeb56c04adcf87d5eb66acc1ef57fbafe
+size 21876642
