Vincentqyw
update: features and matchers
437b5f6
raw
history blame
4.97 kB
#!/usr/bin/env python
# coding: utf-8
import os, glob, cv2
import argparse
from argparse import Namespace
import yaml
from tqdm import tqdm
import torch
from torch.utils.data import Dataset, DataLoader, SequentialSampler
from src.datasets.custom_dataloader import TestDataLoader
from src.utils.dataset import read_img_gray
from configs.data.base import cfg as data_cfg
import viz
def get_model_config(method_name, dataset_name, root_dir='viz'):
    """Load one matcher's settings for one dataset from its YAML config file.

    The file ``{root_dir}/configs/{method_name}.yml`` is parsed and the entry
    stored under ``dataset_name`` is returned.

    Args:
        method_name: Base name (without extension) of the YAML file to read.
        dataset_name: Key selecting the per-dataset section of the parsed file.
        root_dir: Directory that contains the ``configs`` folder.

    Returns:
        The value the parsed YAML document holds under ``dataset_name``.
    """
    yaml_path = f'{root_dir}/configs/{method_name}.yml'
    with open(yaml_path, 'r') as stream:
        per_dataset_conf = yaml.load(stream, Loader=yaml.FullLoader)
    # Only the section for the requested dataset is handed back to the caller.
    return per_dataset_conf[dataset_name]
class DemoDataset(Dataset):
    """Dataset that yields images one at a time for the demo mode.

    The image paths come either from every ``*.*`` entry found directly in
    ``dataset_dir`` (sorted by path) or from a text file listing one path per
    line, each taken relative to ``dataset_dir``.
    """

    def __init__(self, dataset_dir, img_file=None, resize=0, down_factor=16):
        """Collect the list of image paths.

        Args:
            dataset_dir: Directory containing the images.
            img_file: Optional text file with one relative image path per
                line. When ``None``, ``dataset_dir`` is globbed instead.
            resize: Forwarded unchanged to ``read_img_gray`` on every read.
            down_factor: Forwarded unchanged to ``read_img_gray`` on every read.
        """
        self.dataset_dir = dataset_dir
        if img_file is None:
            self.list_img_files = sorted(glob.glob(os.path.join(dataset_dir, "*.*")))
        else:
            with open(img_file) as f:
                stripped_names = (line.strip() for line in f)
                # Skip blank lines (e.g. a trailing newline at the end of the
                # list): joining an empty name would yield the directory
                # itself, which is not a readable image.
                self.list_img_files = [
                    os.path.join(dataset_dir, name) for name in stripped_names if name
                ]
        self.resize = resize
        self.down_factor = down_factor

    def __len__(self):
        """Return the number of image paths collected at construction."""
        return len(self.list_img_files)

    def __getitem__(self, idx):
        """Read the ``idx``-th image.

        Returns:
            A dict with the loaded image (``"img"``), the index that was
            requested (``"id"``) and the path it was read from (``"img_path"``).
        """
        img_path = self.list_img_files[idx]
        # read_img_gray returns a pair; its second element is not needed here.
        img, _ = read_img_gray(img_path, resize=self.resize, down_factor=self.down_factor)
        return {"img": img, "id": idx, "img_path": img_path}
if __name__ == '__main__':
    # Command-line entry point. Builds the matcher selected by --method and
    # either runs it over a test dataloader (default) or over a flat list of
    # images while recording a video (--run_demo).
    parser = argparse.ArgumentParser(description='Visualize matches')
    # NOTE(review): --gpu is parsed but never read anywhere in this script.
    parser.add_argument('--gpu', '-gpu', type=str, default='0')
    parser.add_argument('--method', type=str, default=None)
    parser.add_argument('--dataset_dir', type=str, default='data/aachen-day-night')
    parser.add_argument('--pair_dir', type=str, default=None)
    parser.add_argument(
        '--dataset_name', type=str, choices=['megadepth', 'scannet', 'aachen_v1.1', 'inloc'], default='megadepth'
    )
    parser.add_argument('--measure_time', action="store_true")
    parser.add_argument('--no_viz', action="store_true")
    parser.add_argument('--compute_eval_metrics', action="store_true")
    parser.add_argument('--run_demo', action="store_true")
    args = parser.parse_args()

    # Without a method name the config lookup would try to open
    # 'viz/configs/None.yml'; report a usage error instead.
    if args.method is None:
        parser.error("--method is required: it selects the file viz/configs/<method>.yml")

    model_cfg = get_model_config(args.method, args.dataset_name)
    class_name = model_cfg["class"]
    # The config names the class to instantiate; it is looked up in the viz module.
    model = viz.__dict__[class_name](model_cfg)

    if args.run_demo:
        demo_dataset = DemoDataset(args.dataset_dir, img_file=args.pair_dir, resize=640)
        sampler = SequentialSampler(demo_dataset)
        dataloader = DataLoader(demo_dataset, batch_size=1, sampler=sampler)
        writer = cv2.VideoWriter('topicfm_demo.mp4', cv2.VideoWriter_fourcc(*'mp4v'), 15, (640 * 2 + 5, 480 * 2 + 10))
        try:
            model.run_demo(iter(dataloader), writer)
        finally:
            # Always close the video file, even if the demo raises midway.
            writer.release()
    else:
        # Point the shared data config at the requested test set.
        if args.dataset_name == 'megadepth':
            from configs.data.megadepth_test_1500 import cfg
            data_cfg.merge_from_other_cfg(cfg)
        elif args.dataset_name == 'scannet':
            from configs.data.scannet_test_1500 import cfg
            data_cfg.merge_from_other_cfg(cfg)
        elif args.dataset_name == 'aachen_v1.1':
            data_cfg.merge_from_list(["DATASET.TEST_DATA_SOURCE", "aachen_v1.1",
                                      "DATASET.TEST_DATA_ROOT", os.path.join(args.dataset_dir, "images/images_upright"),
                                      "DATASET.TEST_LIST_PATH", args.pair_dir,
                                      "DATASET.TEST_IMGSIZE", model_cfg["imsize"]])
        elif args.dataset_name == 'inloc':
            data_cfg.merge_from_list(["DATASET.TEST_DATA_SOURCE", "inloc",
                                      "DATASET.TEST_DATA_ROOT", args.dataset_dir,
                                      "DATASET.TEST_LIST_PATH", args.pair_dir,
                                      "DATASET.TEST_IMGSIZE", model_cfg["imsize"]])

        # This script treats only these two data sources as having ground truth.
        has_ground_truth = str(data_cfg.DATASET.TEST_DATA_SOURCE).lower() in ["megadepth", "scannet"]
        dataloader = TestDataLoader(data_cfg)

        # Loop-invariant values, resolved once instead of once per batch.
        img_root_dir = data_cfg.DATASET.TEST_DATA_ROOT
        use_cuda = torch.cuda.is_available()

        with torch.no_grad():
            for data_dict in tqdm(dataloader):
                if use_cuda:
                    # Move every tensor of the batch to the GPU; other values stay as-is.
                    for k, v in data_dict.items():
                        if isinstance(v, torch.Tensor):
                            data_dict[k] = v.cuda()
                model.match_and_draw(data_dict, root_dir=img_root_dir, ground_truth=has_ground_truth,
                                     measure_time=args.measure_time, viz_matches=(not args.no_viz))

        if args.measure_time:
            print("Running time for each image is {} miliseconds".format(model.measure_time()))
        if args.compute_eval_metrics and has_ground_truth:
            model.compute_eval_metrics()