|
import subprocess |
|
import sys |
|
from pathlib import Path |
|
|
|
import torch |
|
|
|
from hloc import MODEL_REPO_ID, logger |
|
|
|
from ..utils.base_model import BaseModel |
|
|
|
rord_path = Path(__file__).parent / "../../third_party" |
|
sys.path.append(str(rord_path)) |
|
from RoRD.lib.model_test import D2Net as _RoRD |
|
from RoRD.lib.pyramid import process_multiscale |
|
|
|
|
|
class RoRD(BaseModel): |
|
default_conf = { |
|
"model_name": "rord.pth", |
|
"checkpoint_dir": rord_path / "RoRD" / "models", |
|
"use_relu": True, |
|
"multiscale": False, |
|
"max_keypoints": 1024, |
|
} |
|
required_inputs = ["image"] |
|
|
|
def _init(self, conf): |
|
model_path = self._download_model( |
|
repo_id=MODEL_REPO_ID, |
|
filename="{}/{}".format( |
|
Path(__file__).stem, self.conf["model_name"] |
|
), |
|
) |
|
self.net = _RoRD( |
|
model_file=model_path, use_relu=conf["use_relu"], use_cuda=False |
|
) |
|
logger.info("Load RoRD model done.") |
|
|
|
def _forward(self, data): |
|
image = data["image"] |
|
image = image.flip(1) |
|
norm = image.new_tensor([103.939, 116.779, 123.68]) |
|
image = image * 255 - norm.view(1, 3, 1, 1) |
|
|
|
if self.conf["multiscale"]: |
|
keypoints, scores, descriptors = process_multiscale(image, self.net) |
|
else: |
|
keypoints, scores, descriptors = process_multiscale( |
|
image, self.net, scales=[1] |
|
) |
|
keypoints = keypoints[:, [1, 0]] |
|
|
|
idxs = scores.argsort()[-self.conf["max_keypoints"] or None :] |
|
keypoints = keypoints[idxs, :2] |
|
descriptors = descriptors[idxs] |
|
scores = scores[idxs] |
|
|
|
return { |
|
"keypoints": torch.from_numpy(keypoints)[None], |
|
"scores": torch.from_numpy(scores)[None], |
|
"descriptors": torch.from_numpy(descriptors.T)[None], |
|
} |
|
|