add: xfeat+lightglue #68

Merged: 3 commits, Aug 31, 2024
3 changes: 3 additions & 0 deletions .gitmodules
@@ -67,3 +67,6 @@
[submodule "third_party/pram"]
path = third_party/pram
url = https://github.com/agipro/pram.git
[submodule "third_party/EfficientLoFTR"]
path = third_party/EfficientLoFTR
url = https://github.com/zju3dv/EfficientLoFTR.git
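
Note: after checking out this change, the new submodule still has to be fetched before `hloc/matchers/eloftr.py` can import it. A minimal sketch (plain git, wrapped in Python only to keep the snippets in one language; the path comes from the `.gitmodules` entry above):

```python
import subprocess

# Fetch the EfficientLoFTR submodule declared in .gitmodules so that
# third_party/EfficientLoFTR is populated for the new eloftr matcher.
subprocess.run(
    ["git", "submodule", "update", "--init", "third_party/EfficientLoFTR"],
    check=True,
)
```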
1 change: 1 addition & 0 deletions README.md
@@ -23,6 +23,7 @@ Here is a demo of the tool:
https://github.com/Vincentqyw/image-matching-webui/assets/18531182/263534692-c3484d1b-cc00-4fdc-9b31-e5b7af07ecd9

The tool currently supports various popular image matching algorithms, namely:
- [x] [EfficientLoFTR](https://github.com/zju3dv/EfficientLoFTR), CVPR 2024
- [x] [MASt3R](https://github.com/naver/mast3r), CVPR 2024
- [x] [DUSt3R](https://github.com/naver/dust3r), CVPR 2024
- [x] [OmniGlue](https://github.com/Vincentqyw/omniglue-onnx), CVPR 2024
4 changes: 2 additions & 2 deletions hloc/extractors/sfd2.py
@@ -24,8 +24,8 @@ def _init(self, conf):
self.norm_rgb = tvf.Normalize(
mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]
)
model_fn = tp_path / "pram" / "weights" / self.conf["model_name"]
self.net = load_sfd2(weight_path=model_fn).eval()
model_path = tp_path / "pram" / "weights" / self.conf["model_name"]
self.net = load_sfd2(weight_path=model_path).eval()

logger.info("Load SFD2 model done.")

47 changes: 46 additions & 1 deletion hloc/match_dense.py
@@ -44,6 +44,25 @@
"max_error": 1, # max error for assigned keypoints (in px)
"cell_size": 1, # size of quantization patch (max 1 kp/patch)
},
"eloftr": {
"output": "matches-eloftr",
"model": {
"name": "eloftr",
"weights": "weights/eloftr_outdoor.ckpt",
"max_keypoints": 2000,
"match_threshold": 0.2,
},
"preprocessing": {
"grayscale": True,
"resize_max": 1024,
"dfactor": 32,
"width": 640,
"height": 480,
"force_resize": True,
},
"max_error": 1, # max error for assigned keypoints (in px)
"cell_size": 1, # size of quantization patch (max 1 kp/patch)
},
# "loftr_quadtree": {
# "output": "matches-loftr-quadtree",
# "model": {
@@ -104,7 +123,14 @@
"max_keypoints": 2000,
"match_threshold": 0.2,
},
"preprocessing": {"grayscale": True, "resize_max": 1024, "dfactor": 8},
"preprocessing": {
"grayscale": True,
"resize_max": 1024,
"dfactor": 8,
"width": 640,
"height": 480,
"force_resize": True,
},
"max_error": 4, # max error for assigned keypoints (in px)
"cell_size": 4, # size of quantization patch (max 1 kp/patch)
},
@@ -172,6 +198,21 @@
"dfactor": 16,
},
},
"xfeat_lightglue": {
"output": "matches-xfeat_lightglue",
"model": {
"name": "xfeat_lightglue",
"max_keypoints": 8000,
},
"preprocessing": {
"grayscale": False,
"force_resize": False,
"resize_max": 1024,
"width": 640,
"height": 480,
"dfactor": 8,
},
},
"xfeat_dense": {
"output": "matches-xfeat_dense",
"model": {
@@ -251,6 +292,10 @@
"resize_max": 1024,
"dfactor": 8,
"force_resize": False,
"resize_max": 1024,
"width": 640,
"height": 480,
"dfactor": 8,
},
},
"sold2": {
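
The new `eloftr` entry (and the widened `loftr`/`xfeat_lightglue` preprocessing blocks) rely on the same conf keys: `resize_max` caps the longer image side, `force_resize` with `width`/`height` pins a fixed resolution, and `dfactor` forces the final size to be divisible by the coarse-feature stride (32 for EfficientLoFTR, 8 for the LoFTR/XFeat-style models). The helper below is an illustrative sketch of that logic, not the repository's actual preprocessing code:

```python
import torch
import torch.nn.functional as F


def resize_for_matcher(image: torch.Tensor, conf: dict) -> torch.Tensor:
    """Illustrative resize following the preprocessing keys above.

    `image` is a CxHxW float tensor; `conf` is one of the `preprocessing`
    dicts from `confs` (hypothetical helper, not the repo's implementation).
    """
    h, w = image.shape[-2:]
    if conf.get("force_resize", False):
        # Fixed target resolution.
        new_h, new_w = conf["height"], conf["width"]
    else:
        # Cap the longer side at resize_max, keeping the aspect ratio.
        scale = min(1.0, conf.get("resize_max", 1024) / max(h, w))
        new_h, new_w = round(h * scale), round(w * scale)
    # Snap to a multiple of dfactor so the coarse feature grid divides evenly.
    df = conf.get("dfactor", 8)
    new_h, new_w = max(df, new_h // df * df), max(df, new_w // df * df)
    return F.interpolate(
        image[None], size=(new_h, new_w), mode="bilinear", align_corners=False
    )[0]
```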
115 changes: 115 additions & 0 deletions hloc/matchers/eloftr.py
@@ -0,0 +1,115 @@
import subprocess
import sys
import warnings
from copy import deepcopy
from pathlib import Path

import torch
from huggingface_hub import hf_hub_download

tp_path = Path(__file__).parent / "../../third_party"
sys.path.append(str(tp_path))

from EfficientLoFTR.src.loftr import LoFTR as ELoFTR_
from EfficientLoFTR.src.loftr import (
full_default_cfg,
opt_default_cfg,
reparameter,
)

from hloc import logger

from ..utils.base_model import BaseModel


class ELoFTR(BaseModel):
default_conf = {
"weights": "weights/eloftr_outdoor.ckpt",
"match_threshold": 0.2,
# "sinkhorn_iterations": 20,
"max_keypoints": -1,
# You can choose model type in ['full', 'opt']
"model_type": "full", # 'full' for best quality, 'opt' for best efficiency
# You can choose numerical precision in ['fp32', 'mp', 'fp16']. 'fp16' for best efficiency
"precision": "fp32",
}
required_inputs = ["image0", "image1"]

def _init(self, conf):

if self.conf["model_type"] == "full":
_default_cfg = deepcopy(full_default_cfg)
elif self.conf["model_type"] == "opt":
_default_cfg = deepcopy(opt_default_cfg)

if self.conf["precision"] == "mp":
_default_cfg["mp"] = True
elif self.conf["precision"] == "fp16":
_default_cfg["half"] = True

model_path = tp_path / "EfficientLoFTR" / self.conf["weights"]

# Download the model.
if not model_path.exists():
model_path.parent.mkdir(exist_ok=True)
cached_file = hf_hub_download(
repo_type="space",
repo_id="Realcat/image-matching-webui",
filename="third_party/EfficientLoFTR/{}".format(
conf["weights"]
),
)
logger.info("Downloaded EfficientLoFTR model succeeed!")
cmd = [
"cp",
str(cached_file),
str(model_path),
]
subprocess.run(cmd, check=True)
logger.info(f"Copy model file `{cmd}`.")

cfg = _default_cfg
cfg["match_coarse"]["thr"] = conf["match_threshold"]
# cfg["match_coarse"]["skh_iters"] = conf["sinkhorn_iterations"]
state_dict = torch.load(model_path, map_location="cpu")["state_dict"]
matcher = ELoFTR_(config=cfg)
matcher.load_state_dict(state_dict)
self.net = reparameter(matcher)

if self.conf["precision"] == "fp16":
self.net = self.net.half()
logger.info(f"Loaded Efficient LoFTR with weights {conf['weights']}")

def _forward(self, data):
# For consistency with hloc pairs, we refine kpts in image0!
rename = {
"keypoints0": "keypoints1",
"keypoints1": "keypoints0",
"image0": "image1",
"image1": "image0",
"mask0": "mask1",
"mask1": "mask0",
}
data_ = {rename[k]: v for k, v in data.items()}
with warnings.catch_warnings():
warnings.simplefilter("ignore")
self.net(data_)  # EfficientLoFTR fills data_ in place with the matched keypoints
pred = {
"keypoints0": data_["mkpts0_f"],
"keypoints1": data_["mkpts1_f"],
}
scores = data_["mconf"]

top_k = self.conf["max_keypoints"]
if top_k is not None and len(scores) > top_k:
keep = torch.argsort(scores, descending=True)[:top_k]
pred["keypoints0"], pred["keypoints1"] = (
pred["keypoints0"][keep],
pred["keypoints1"][keep],
)
scores = scores[keep]

# Switch back indices
pred = {(rename[k] if k in rename else k): v for k, v in pred.items()}
pred["scores"] = scores
return pred
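
A hedged usage sketch for the new wrapper, assuming hloc's usual `BaseModel` calling convention (the constructor takes a conf dict and `__call__` dispatches to `_forward` after checking `required_inputs`); the checkpoint is fetched from the Hugging Face space on first use, and the random tensors below only stand in for real grayscale images:

```python
import torch

from hloc.match_dense import confs
from hloc.matchers.eloftr import ELoFTR

# Minimal sketch, assuming hloc's BaseModel(conf) constructor and call protocol.
model = ELoFTR(confs["eloftr"]["model"]).eval()

# Grayscale 1x1xHxW tensors in [0, 1]; H and W should already be divisible by
# the conf's dfactor (32), e.g. the 480x640 configured above.
image0 = torch.rand(1, 1, 480, 640)
image1 = torch.rand(1, 1, 480, 640)

with torch.no_grad():
    pred = model({"image0": image0, "image1": image1})

print(pred["keypoints0"].shape, pred["keypoints1"].shape, pred["scores"].shape)
```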
48 changes: 48 additions & 0 deletions hloc/matchers/xfeat_lightglue.py
@@ -0,0 +1,48 @@
import torch

from hloc import logger

from ..utils.base_model import BaseModel


class XFeatLightGlue(BaseModel):
default_conf = {
"keypoint_threshold": 0.005,
"max_keypoints": 8000,
}
required_inputs = [
"image0",
"image1",
]

def _init(self, conf):
self.net = torch.hub.load(
"verlab/accelerated_features",
"XFeat",
pretrained=True,
top_k=self.conf["max_keypoints"],
)
logger.info("Load XFeat(dense) model done.")

def _forward(self, data):
# we use results from one batch
im0 = data["image0"]
im1 = data["image1"]
# Compute coarse feats
out0 = self.net.detectAndCompute(im0, top_k=self.conf["max_keypoints"])[
0
]
out1 = self.net.detectAndCompute(im1, top_k=self.conf["max_keypoints"])[
0
]
out0.update({"image_size": (im0.shape[-1], im0.shape[-2])}) # W H
out1.update({"image_size": (im1.shape[-1], im1.shape[-2])}) # W H
mkpts_0, mkpts_1 = self.net.match_lighterglue(out0, out1)
mkpts_0 = torch.from_numpy(mkpts_0) # n x 2
mkpts_1 = torch.from_numpy(mkpts_1) # n x 2
pred = {
"keypoints0": mkpts_0,
"keypoints1": mkpts_1,
"mconf": torch.ones_like(mkpts_0[:, 0]),
}
return pred
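
For reference, the wrapper above is a thin layer over the public `torch.hub` XFeat interface; the standalone sketch below repeats the same calls (`detectAndCompute`, `match_lighterglue`) outside hloc. The random tensors only stand in for real RGB images:

```python
import torch

# Same torch.hub entry point and methods as used in the wrapper above.
xfeat = torch.hub.load(
    "verlab/accelerated_features", "XFeat", pretrained=True, top_k=8000
)

im0 = torch.rand(1, 3, 480, 640)  # BxCxHxW float stand-ins for real images
im1 = torch.rand(1, 3, 480, 640)

out0 = xfeat.detectAndCompute(im0, top_k=8000)[0]
out1 = xfeat.detectAndCompute(im1, top_k=8000)[0]
out0["image_size"] = (im0.shape[-1], im0.shape[-2])  # (W, H), as in the wrapper
out1["image_size"] = (im1.shape[-1], im1.shape[-2])

mkpts0, mkpts1 = xfeat.match_lighterglue(out0, out1)  # numpy arrays, n x 2
print(mkpts0.shape, mkpts1.shape)
```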
2 changes: 1 addition & 1 deletion requirements.txt
@@ -6,7 +6,7 @@ gradio_client==0.16.0
h5py==3.9.0
imageio==2.31.1
Jinja2==3.1.2
kornia==0.6.12
kornia
loguru==0.7.0
matplotlib==3.7.1
numpy==1.23.5
1 change: 1 addition & 0 deletions third_party/EfficientLoFTR
Submodule EfficientLoFTR added at 68eb92
25 changes: 23 additions & 2 deletions ui/config.yaml
@@ -41,7 +41,7 @@ matcher_zoo:
DUSt3R:
# TODO: duster is under development
enable: true
skip_ci: true
# skip_ci: true
matcher: duster
dense: true
info:
@@ -53,7 +53,7 @@ matcher_zoo:
display: true
GIM(dkm):
enable: true
skip_ci: true
# skip_ci: true
matcher: gim(dkm)
dense: true
info:
@@ -95,6 +95,16 @@
paper: https://arxiv.org/pdf/2104.00680
project: https://zju3dv.github.io/loftr
display: true
eloftr:
matcher: eloftr
dense: true
info:
name: Efficient LoFTR  # display name
source: "CVPR 2024"
github: https://github.com/zju3dv/efficientloftr
paper: https://zju3dv.github.io/efficientloftr/files/EfficientLoFTR.pdf
project: https://zju3dv.github.io/efficientloftr
display: true
cotr:
enable: false
skip_ci: true
@@ -127,6 +137,17 @@
paper: https://arxiv.org/abs/2208.14201
project: null
display: true
xfeat+lightglue:
enable: true
matcher: xfeat_lightglue
dense: true
info:
name: xfeat+lightglue
source: "CVPR 2024"
github: https://github.com/verlab/accelerated_features
paper: https://arxiv.org/abs/2404.19174
project: https://www.verlab.dcc.ufmg.br/descriptors/xfeat_cvpr24
display: true
xfeat(sparse):
matcher: NN-mutual
feature: xfeat
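
The two new `matcher_zoo` entries (`eloftr` and `xfeat+lightglue`) follow the existing schema (`matcher`, `dense`, optional `enable`, and an `info` block). A small sketch of reading them back, assuming PyYAML and the repository-relative path `ui/config.yaml`:

```python
import yaml

# List matcher_zoo entries that are not explicitly disabled, using the keys
# visible in the diff above (enable, matcher, dense).
with open("ui/config.yaml") as f:
    cfg = yaml.safe_load(f)

for name, entry in cfg["matcher_zoo"].items():
    if entry.get("enable", True):
        kind = "dense" if entry.get("dense") else "sparse"
        print(f"{name}: matcher={entry.get('matcher', name)} ({kind})")
```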