feat:func Build Lightglue torch demo #46

Open · wants to merge 4 commits into base: main
10 changes: 9 additions & 1 deletion .gitignore
@@ -7,4 +7,12 @@ __pycache__
/lightglue/weights/
lightglue/_flash/
*-checkpoint.ipynb
*.pth
*.pth

# weights
weights/
*.pth
*.onnx

# data
data/
61 changes: 46 additions & 15 deletions demo.ipynb

Large diffs are not rendered by default.
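Since the notebook diff is not rendered, a minimal sketch of the torch matching flow the demo presumably exercises is given below, assembled from the call signatures used in export_onnx.py in this PR; the image paths, the keypoint cap, and any visualization cells are assumptions.

# Minimal sketch of torch-side matching (assumed demo flow, not the notebook's actual cells).
import torch
from lightglue_onnx import LightGlue, SuperPoint
from lightglue_onnx.end2end import normalize_keypoints
from lightglue_onnx.utils import load_image, rgb_to_grayscale

extractor = SuperPoint(max_num_keypoints=1024).eval()  # keypoint cap chosen arbitrarily
matcher = LightGlue("superpoint").eval()

image0, _ = load_image("assets/sacre_coeur1.jpg", resize=512)
image1, _ = load_image("assets/sacre_coeur2.jpg", resize=512)
image0, image1 = rgb_to_grayscale(image0), rgb_to_grayscale(image1)  # SuperPoint works on grayscale

with torch.no_grad():
    kpts0, scores0, desc0 = extractor(image0[None])
    kpts1, scores1, desc1 = extractor(image1[None])
    matches0, matches1, mscores0, mscores1 = matcher(
        normalize_keypoints(kpts0, image0.shape[1], image0.shape[2]),
        normalize_keypoints(kpts1, image1.shape[1], image1.shape[2]),
        desc0,
        desc1,
    )

print(matches0.shape, mscores0.shape)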

239 changes: 239 additions & 0 deletions export_onnx.py
@@ -0,0 +1,239 @@
# -*- coding: utf-8 -*-

import torch
import argparse
from typing import List

from lightglue_onnx import DISK, LightGlue, LightGlueEnd2End, SuperPoint
from lightglue_onnx.end2end import normalize_keypoints
from lightglue_onnx.ops import patch_disk_convolution_mode, register_aten_sdpa
from lightglue_onnx.utils import load_image, rgb_to_grayscale


def parse_args() -> argparse.Namespace:
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "--img_size", nargs="+", type=int, default=512, required=False,
        help="Sample image size for ONNX tracing. If a single integer is given, resize the longer side of the image to this value. Otherwise, please provide two integers (height width).",
    )
    parser.add_argument(
        "--extractor_type", type=str, default="superpoint",
        choices=["superpoint", "disk"], required=False,
        help="Type of feature extractor. Supported extractors are 'superpoint' and 'disk'. Defaults to 'superpoint'.",
    )
    parser.add_argument(
        "--extractor_path", type=str, default=None, required=False,
        help="Path to save the feature extractor ONNX model.",
    )
    parser.add_argument(
        "--lightglue_path", type=str, default=None, required=False,
        help="Path to save the LightGlue ONNX model.",
    )
    parser.add_argument(
        "--end2end", action="store_true",
        help="Whether to export an end-to-end pipeline instead of individual models.",
    )
    parser.add_argument(
        "--safe", action="store_true",
        help="Use the safe mode to prevent LightGlue from crashing on the rare occasion that the feature extractor outputs zero keypoints. Only applies when exporting with the end2end option.",
    )
    parser.add_argument(
        "--dynamic", action="store_true", help="Whether to allow dynamic image sizes."
    )
    parser.add_argument(
        "--mp", action="store_true",
        help="Whether to use mixed precision (CUDA only). Not supported when using the --safe option.",
    )
    parser.add_argument(
        "--flash", action="store_true",
        help="Whether to use Flash Attention (CUDA only). Flash Attention must be installed. Not supported when using the --safe option.",
    )

    # Extractor-specific args:
    parser.add_argument(
        "--max_num_keypoints", type=int, default=None, required=False,
        help="Maximum number of keypoints outputted by the extractor.",
    )

    return parser.parse_args()


def export_onnx(
    img_size=512,
    extractor_type="superpoint",
    extractor_path=None,
    lightglue_path=None,
    img0_path="assets/sacre_coeur1.jpg",
    img1_path="assets/sacre_coeur2.jpg",
    end2end=False,
    safe=False,
    dynamic=False,
    mp=False,
    flash=False,
    max_num_keypoints=None,
):
    # Handle args
    if isinstance(img_size, List) and len(img_size) == 1:
        img_size = img_size[0]

    if extractor_path is not None and end2end:
        raise ValueError(
            "Extractor will be combined with LightGlue when exporting end-to-end model."
        )
    if extractor_path is None:
        extractor_path = f"weights/{extractor_type}" f"{'_mp' if mp else ''}" ".onnx"

    if lightglue_path is None:
        lightglue_path = (
            f"weights/{extractor_type}_lightglue"
            f"{'_end2end' if end2end else ''}"
            f"{'_safe' if safe else ''}"
            f"{'_mp' if mp else ''}"
            f"{'_flash' if flash else ''}"
            ".onnx"
        )

    # Sample images for tracing
    image0, scales0 = load_image(img0_path, resize=img_size)
    image1, scales1 = load_image(img1_path, resize=img_size)

    # Models
    extractor_type = extractor_type.lower()
    if extractor_type == "superpoint":
        # SuperPoint works on grayscale images.
        image0 = rgb_to_grayscale(image0)
        image1 = rgb_to_grayscale(image1)
        extractor = SuperPoint(max_num_keypoints=max_num_keypoints).eval()
        lightglue = LightGlue(extractor_type, flash=flash).eval()
    elif extractor_type == "disk":
        extractor = DISK(max_num_keypoints=max_num_keypoints).eval()
        lightglue = LightGlue(extractor_type, flash=flash).eval()

        if torch.__version__ < "2.1":
            patch_disk_convolution_mode(extractor)
    else:
        raise NotImplementedError(
            f"LightGlue has not been trained on {extractor_type} features."
        )

    if (
        hasattr(torch.nn.functional, "scaled_dot_product_attention")
        and torch.__version__ < "2.1"
    ):
        register_aten_sdpa(opset_version=14)

    if mp or flash:
        assert torch.cuda.is_available(), "Mixed precision requires CUDA."
        image0, image1 = image0.to("cuda"), image1.to("cuda")
        extractor, lightglue = extractor.to("cuda"), lightglue.to("cuda")

    # ONNX Export
    if end2end:
        if safe:
            extractor = torch.jit.trace(extractor, image0[None])
            desc_dim = 256 if extractor_type == "superpoint" else 128
            lightglue = torch.jit.trace(
                lightglue,
                (
                    torch.rand(1, 5, 2),
                    torch.rand(1, 10, 2),
                    torch.rand(1, 5, desc_dim),
                    torch.rand(1, 10, desc_dim),
                ),
            )
            pipeline = LightGlueEnd2End(extractor, lightglue, safe=safe).eval()
            pipeline = torch.jit.script(pipeline)
        else:
            pipeline = LightGlueEnd2End(extractor, lightglue).eval()

        dynamic_axes = {
            "kpts0": {1: "num_keypoints0"},
            "kpts1": {1: "num_keypoints1"},
            "matches0": {1: "num_matches0"},
            "matches1": {1: "num_matches1"},
            "mscores0": {1: "num_matches0"},
            "mscores1": {1: "num_matches1"},
        }
        if dynamic:
            dynamic_axes.update(
                {
                    "image0": {2: "height0", 3: "width0"},
                    "image1": {2: "height1", 3: "width1"},
                }
            )

        with torch.autocast("cuda", enabled=mp):
            torch.onnx.export(
                pipeline,
                (image0[None], image1[None]),
                lightglue_path,
                input_names=["image0", "image1"],
                output_names=[
                    "kpts0",
                    "kpts1",
                    "matches0",
                    "matches1",
                    "mscores0",
                    "mscores1",
                ],
                opset_version=16,
                dynamic_axes=dynamic_axes,
            )
    else:
        # Export Extractor
        dynamic_axes = {
            "keypoints": {1: "num_keypoints"},
            "scores": {1: "num_keypoints"},
            "descriptors": {1: "num_keypoints"},
        }
        if dynamic:
            dynamic_axes.update({"image": {2: "height", 3: "width"}})

        with torch.autocast("cuda", enabled=mp):
            torch.onnx.export(
                extractor,
                image0[None],
                extractor_path,
                input_names=["image"],
                output_names=["keypoints", "scores", "descriptors"],
                opset_version=16,
                dynamic_axes=dynamic_axes,
            )

        # Export LightGlue
        feats0, feats1 = extractor(image0[None]), extractor(image1[None])
        kpts0, scores0, desc0 = feats0
        kpts1, scores1, desc1 = feats1

        kpts0 = normalize_keypoints(kpts0, image0.shape[1], image0.shape[2])
        kpts1 = normalize_keypoints(kpts1, image1.shape[1], image1.shape[2])

        with torch.autocast("cuda", enabled=mp):
            torch.onnx.export(
                lightglue,
                (
                    kpts0,
                    kpts1,
                    desc0,
                    desc1,
                ),
                lightglue_path,
                input_names=["kpts0", "kpts1", "desc0", "desc1"],
                output_names=["matches0", "matches1", "mscores0", "mscores1"],
                opset_version=16,
                dynamic_axes={
                    "kpts0": {1: "num_keypoints0"},
                    "kpts1": {1: "num_keypoints1"},
                    "desc0": {1: "num_keypoints0"},
                    "desc1": {1: "num_keypoints1"},
                    "matches0": {1: "num_matches0"},
                    "matches1": {1: "num_matches1"},
                    "mscores0": {1: "num_matches0"},
                    "mscores1": {1: "num_matches1"},
                },
            )


if __name__ == "__main__":
    args = parse_args()
    export_onnx(**vars(args))
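The exporter can also be driven from Python instead of the CLI; the following call mirrors the SuperPoint template in export_onnx.sh below and only uses parameters that export_onnx() defines above.

# Same export as the shell template, invoked programmatically.
from export_onnx import export_onnx

export_onnx(
    img_size=512,
    extractor_type="superpoint",
    extractor_path="weights/superpoint.onnx",
    lightglue_path="weights/superpoint_lightglue.onnx",
    dynamic=True,
)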
11 changes: 11 additions & 0 deletions export_onnx.sh
@@ -0,0 +1,11 @@
# Template: export SuperPoint + LightGlue to ONNX with dynamic image sizes

python export_onnx.py \
--img_size 512 \
--extractor_type superpoint \
--extractor_path weights/superpoint.onnx \
--lightglue_path weights/superpoint_lightglue.onnx \
--dynamic


# Same command on a single line:
python export_onnx.py --img_size 512 --extractor_type superpoint --extractor_path weights/superpoint.onnx --lightglue_path weights/superpoint_lightglue.onnx --dynamic
12 changes: 12 additions & 0 deletions inference_onnx.sh
@@ -0,0 +1,12 @@
# Template: match two images with the exported extractor and LightGlue ONNX models
python run_Lightglue_onnx.py \
--inputdir0 assets/DSC_0410.JPG \
--inputdir1 assets/DSC_0411.JPG \
--img-size 512 \
--lightglue-path weights/superpoint_lightglue.onnx \
--extractor-type superpoint \
--extractor-path weights/superpoint.onnx \
--viz

# Sample invocation with absolute Windows paths
python run_Lightglue_onnx.py --inputdir0 D:\\OroChiLab\\LightGlue\\data\\dir0\\DSC_0411.JPG --inputdir1 D:\\OroChiLab\\LightGlue\\data\\dir1\\DSC_0410.JPG --img-size 512 --lightglue-path D:\\OroChiLab\\LightGlue\\weights\\onnx\\superpoint_lightglue.onnx --extractor-type superpoint --extractor-path D:\\OroChiLab\\LightGlue\\weights\\onnx\\superpoint.onnx --viz
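run_Lightglue_onnx.py itself does not appear in this diff, so the sketch below only shows the rough shape of the ONNX inference path: the input/output names come from export_onnx.py, while the preprocessing, the keypoint normalization, and the file paths are assumptions to verify against the actual script.

# Rough sketch of running the exported models with onnxruntime (names from export_onnx.py, rest assumed).
import cv2
import numpy as np
import onnxruntime as ort


def preprocess(path, size=512):
    # Grayscale, longer side resized to `size`, scaled to [0, 1], shaped (1, 1, H, W).
    img = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
    scale = size / max(img.shape)
    img = cv2.resize(img, (round(img.shape[1] * scale), round(img.shape[0] * scale)))
    return img[None, None].astype(np.float32) / 255.0


def normalize_kpts(kpts, h, w):
    # Intended to mirror lightglue_onnx.end2end.normalize_keypoints; check against that code.
    size = np.array([w, h], dtype=np.float32)
    return ((kpts - size / 2) / (size.max() / 2)).astype(np.float32)


extractor = ort.InferenceSession("weights/superpoint.onnx")
matcher = ort.InferenceSession("weights/superpoint_lightglue.onnx")

img0 = preprocess("assets/DSC_0410.JPG")
img1 = preprocess("assets/DSC_0411.JPG")

kpts0, scores0, desc0 = extractor.run(None, {"image": img0})
kpts1, scores1, desc1 = extractor.run(None, {"image": img1})

matches0, matches1, mscores0, mscores1 = matcher.run(
    None,
    {
        "kpts0": normalize_kpts(kpts0, img0.shape[2], img0.shape[3]),
        "kpts1": normalize_kpts(kpts1, img1.shape[2], img1.shape[3]),
        "desc0": desc0,
        "desc1": desc1,
    },
)
print(matches0.shape, mscores0.shape)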
10 changes: 10 additions & 0 deletions inference_torch.sh
@@ -0,0 +1,10 @@
# SuperPoint
python run_Lightglue_pth.py
## With --withline
python run_Lightglue_pth.py --withline


# DISK
python run_Lightglue_pth.py --extractor-type disk
## With --withline
python run_Lightglue_pth.py --withline --extractor-type disk
5 changes: 5 additions & 0 deletions lightglue_onnx/__init__.py
@@ -0,0 +1,5 @@
from .disk import DISK
from .end2end import LightGlueEnd2End
from .lightglue import LightGlue
from .superpoint import SuperPoint
from .utils import match_pair