convert superglue to onnx format

xmba15 · xmba15 · commit 89cf7745c091 · 2022-08-14T00:40:13.000+09:00
diff --git a/.gitmodules b/.gitmodules
@@ -1,3 +1,6 @@
 [submodule "scripts/superpoint/SuperPointPretrainedNetwork"]
 	path = scripts/superpoint/SuperPointPretrainedNetwork
 	url = https://github.com/magicleap/SuperPointPretrainedNetwork
+[submodule "scripts/superglue/SuperGluePretrainedNetwork"]
+	path = scripts/superglue/SuperGluePretrainedNetwork
+	url = https://github.com/magicleap/SuperGluePretrainedNetwork.git
diff --git a/scripts/superglue/README.md b/scripts/superglue/README.md
@@ -0,0 +1,28 @@
+# convert pre-trained superglue pytorch weights to onnx format
+
+---
+
+## dependencies
+
+---
+
+- python: 3.x
+
+- fetch the SuperGlue submodule and install its python requirements:
+
+```bash
+git submodule update --init --recursive
+
+python3 -m pip install -r SuperGluePretrainedNetwork/requirements.txt
+```
+
+## :running: how to run
+
+---
+
+
+- export onnx weights
+
+```bash
+python3 convert_to_onnx.py
+```
diff --git a/scripts/superglue/SuperGluePretrainedNetwork b/scripts/superglue/SuperGluePretrainedNetwork
@@ -0,0 +1 @@
+Subproject commit ddcf11f42e7e0732a0c4607648f9448ea8d73590
diff --git a/scripts/superglue/convert_to_onnx.py b/scripts/superglue/convert_to_onnx.py
@@ -0,0 +1,59 @@
+#!/usr/bin/env python
+import os
+
+import torch
+
+from superglue_wrapper import SuperGlueWrapper as SuperGlue
+
+
+def main():
+    """Trace the pre-trained SuperGlue wrapper and export it as super_glue.onnx."""
+    config = {
+        "descriptor_dim": 256,
+        "weights": "indoor",
+        "keypoint_encoder": [32, 64, 128, 256],
+        "GNN_layers": ["self", "cross"] * 9,
+        "sinkhorn_iterations": 100,
+        "match_threshold": 0.2,
+    }
+
+    model = SuperGlue(config=config)
+    model.eval()
+
+    batch_size, height, width, num_keypoints = 1, 480, 640, 382
+    desc_dim = config["descriptor_dim"]  # keep dummy descriptors in sync with config
+    # Insertion order matters: the values are passed to forward() positionally.
+    data = {}
+    for i in range(2):
+        data[f"image{i}_shape"] = torch.tensor([batch_size, 1, height, width])
+        data[f"scores{i}"] = torch.randn(batch_size, num_keypoints)
+        data[f"keypoints{i}"] = torch.randn(batch_size, num_keypoints, 2)
+        data[f"descriptors{i}"] = torch.randn(batch_size, desc_dim, num_keypoints)
+
+    torch.onnx.export(
+        model,
+        tuple(data.values()),  # tuple of positional inputs, the documented form
+        "super_glue.onnx",
+        export_params=True,
+        opset_version=12,
+        do_constant_folding=True,
+        input_names=list(data.keys()),
+        output_names=["matches0", "matches1", "matching_scores0", "matching_scores1"],
+        dynamic_axes={
+            "keypoints0": {0: "batch_size", 1: "num_keypoints0"},
+            "scores0": {0: "batch_size", 1: "num_keypoints0"},
+            "descriptors0": {0: "batch_size", 2: "num_keypoints0"},
+            "keypoints1": {0: "batch_size", 1: "num_keypoints1"},
+            "scores1": {0: "batch_size", 1: "num_keypoints1"},
+            "descriptors1": {0: "batch_size", 2: "num_keypoints1"},
+            "matches0": {0: "batch_size", 1: "num_keypoints0"},
+            "matches1": {0: "batch_size", 1: "num_keypoints1"},
+            "matching_scores0": {0: "batch_size", 1: "num_keypoints0"},
+            "matching_scores1": {0: "batch_size", 1: "num_keypoints1"},
+        },
+    )
+    print(f"\nonnx model is saved to: {os.getcwd()}/super_glue.onnx")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/scripts/superglue/superglue_wrapper.py b/scripts/superglue/superglue_wrapper.py
@@ -0,0 +1,91 @@
+import torch
+
+from SuperGluePretrainedNetwork.models.superglue import (
+    SuperGlue,
+    arange_like,
+    log_optimal_transport,
+    normalize_keypoints,
+)
+
+
+class SuperGlueWrapper(SuperGlue):
+    """SuperGlue with a flat, tensor-only ``forward`` for ONNX export."""
+
+    default_config = {
+        "descriptor_dim": 256,
+        "weights": "outdoor",
+        "keypoint_encoder": [32, 64, 128, 256],
+        "GNN_layers": ["self", "cross"] * 9,
+        "sinkhorn_iterations": 100,
+        "match_threshold": 0.2,
+    }
+
+    def __init__(self, config):
+        """Delegate construction to the upstream ``SuperGlue`` with ``config``."""
+        super().__init__(config)
+
+    def forward(
+        self,
+        image0_shape,
+        scores0,
+        keypoints0,
+        descriptors0,
+        image1_shape,
+        scores1,
+        keypoints1,
+        descriptors1,
+    ):
+        """Run SuperGlue on a pair of keypoints and descriptors.
+
+        ``image*_shape`` is handed to ``normalize_keypoints``; the export script
+        supplies a 4-element ``[batch, 1, height, width]`` tensor. Its dummy
+        inputs use keypoints ``(batch, N, 2)``, scores ``(batch, N)`` and
+        descriptors ``(batch, descriptor_dim, N)``.
+
+        Returns a dict with ``matches0``/``matches1`` (index of the matched
+        keypoint in the other image, -1 for an invalid match) and
+        ``matching_scores0``/``matching_scores1``.
+        """
+        # Keypoint normalization.
+        kpts0 = normalize_keypoints(keypoints0, image0_shape)
+        kpts1 = normalize_keypoints(keypoints1, image1_shape)
+
+        # Keypoint MLP encoder.
+        desc0 = descriptors0 + self.kenc(kpts0, scores0)
+        desc1 = descriptors1 + self.kenc(kpts1, scores1)
+
+        # Multi-layer Transformer network.
+        desc0, desc1 = self.gnn(desc0, desc1)
+
+        # Final MLP projection.
+        mdesc0, mdesc1 = self.final_proj(desc0), self.final_proj(desc1)
+
+        # Compute matching descriptor distance.
+        scores = torch.einsum("bdn,bdm->bnm", mdesc0, mdesc1)
+        scores = scores / self.config["descriptor_dim"] ** 0.5
+
+        # Run the optimal transport.
+        scores = log_optimal_transport(
+            scores, self.bin_score, iters=self.config["sinkhorn_iterations"]
+        )
+
+        # Get the matches with score above "match_threshold".
+        max0, max1 = scores[:, :-1, :-1].max(2), scores[:, :-1, :-1].max(1)
+        indices0, indices1 = max0.indices, max1.indices
+        # Keep a pair only when each keypoint is the other's best candidate.
+        mutual0 = arange_like(indices0, 1)[None] == indices1.gather(1, indices0)
+        mutual1 = arange_like(indices1, 1)[None] == indices0.gather(1, indices1)
+        zero = scores.new_tensor(0)
+        mscores0 = torch.where(mutual0, max0.values.exp(), zero)
+        mscores1 = torch.where(mutual1, mscores0.gather(1, indices1), zero)
+        valid0 = mutual0 & (mscores0 > self.config["match_threshold"])
+        valid1 = mutual1 & valid0.gather(1, indices1)
+        indices0 = torch.where(valid0, indices0, indices0.new_tensor(-1))
+        indices1 = torch.where(valid1, indices1, indices1.new_tensor(-1))
+
+        return {
+            "matches0": indices0,  # use -1 for invalid match
+            "matches1": indices1,  # use -1 for invalid match
+            "matching_scores0": mscores0,
+            "matching_scores1": mscores1,
+        }