cvg · sarlinpe · Jul 12, 2021 · Jan 24, 2021 · Feb 5, 2021 · Feb 5, 2021
diff --git a/.gitmodules b/.gitmodules
@@ -8,3 +8,6 @@
 [submodule "third_party/deep-image-retrieval"]
 	path = third_party/deep-image-retrieval
 	url = https://github.com/naver/deep-image-retrieval.git
+[submodule "third_party/r2d2"]
+	path = third_party/r2d2
+	url = https://github.com/naver/r2d2.git
diff --git a/hloc/extractors/r2d2.py b/hloc/extractors/r2d2.py
@@ -0,0 +1,56 @@
+import sys
+from pathlib import Path
+import torchvision.transforms as tvf
+
+from ..utils.base_model import BaseModel
+
+r2d2_path = Path(__file__).parent / "../../third_party/r2d2"
+sys.path.append(str(r2d2_path))
+from extract import load_network, NonMaxSuppression, extract_multiscale
+
+
+class R2D2(BaseModel):
+    default_conf = {
+        'model_name': 'r2d2_WASF_N16.pt',
+        'max_keypoints': 5000,
+        'scale_factor': 2**0.25,
+        'min_size': 256,
+        'max_size': 1024,
+        'min_scale': 0,
+        'max_scale': 1,
+        'reliability_threshold': 0.7,
+        'repetability_threshold': 0.7,
+    }
+    required_inputs = ['image']
+
+    def _init(self, conf):
+        model_fn = r2d2_path / "models" / conf['model_name']
+        self.norm_rgb = tvf.Normalize(mean=[0.485, 0.456, 0.406],
+                                      std=[0.229, 0.224, 0.225])
+        self.net = load_network(model_fn)
+        self.detector = NonMaxSuppression(
+            rel_thr=conf['reliability_threshold'],
+            rep_thr=conf['repetability_threshold']
+        )
+
+    def _forward(self, data):
+        img = data['image']
+        img = self.norm_rgb(img)
+
+        xys, desc, scores = extract_multiscale(
+            self.net, img, self.detector,
+            scale_f=self.conf['scale_factor'],
+            min_size=self.conf['min_size'],
+            max_size=self.conf['max_size'],
+            min_scale=self.conf['min_scale'],
+            max_scale=self.conf['max_scale'],
+        )
+        idxs = scores.argsort()[-self.conf['max_keypoints'] or None:]
+        xy = xys[idxs, :2]
+        desc = desc[idxs].t()
+        scores = scores[idxs]
+
+        pred = {'keypoints': xy[None],
+                'descriptors': desc[None],
+                'scores': scores[None]}
+        return pred
diff --git a/third_party/r2d2 b/third_party/r2d2