Spaces:

Realcat
/

image-matching-webui

Running

image-matching-webui / third_party /r2d2 /datasets /pair_dataset.py

Vincentqyw

update: features and matchers

a80d6bb over 1 year ago

10.1 kB

	# Copyright 2019-present NAVER Corp.
	# CC BY-NC-SA 3.0
	# Available only for non-commercial use

	import os, pdb
	import numpy as np
	from PIL import Image

	from .dataset import Dataset, CatDataset
	from tools.transforms import instanciate_transformation
	from tools.transforms_tools import persp_apply


	class PairDataset (Dataset):
	    """ A dataset that serves image pairs with ground-truth pixel correspondences.

	    Subclasses are expected to provide `image_pairs` (indexable by pair index,
	    each entry unpacking into two image indices), to set `npairs`, and to
	    implement `get_pair()` plus whichever `get_*_filename()` hooks they need.
	    """
	    def __init__(self):
	        Dataset.__init__(self)
	        self.npairs = 0

	    def get_filename(self, img_idx, root=None):
	        """ Return the filename of an image, or a tuple of two filenames
	        when `img_idx` is a pair of indices (as decided by `is_pair`).
	        """
	        if is_pair(img_idx):
	            return tuple(Dataset.get_filename(self, i, root) for i in img_idx)
	        return Dataset.get_filename(self, img_idx, root)

	    def get_image(self, img_idx):
	        """ Return an image, or a tuple of two images when `img_idx` is a
	        pair of indices (as decided by `is_pair`).
	        """
	        if is_pair(img_idx):
	            return tuple(Dataset.get_image(self, i) for i in img_idx)
	        return Dataset.get_image(self, img_idx)

	    def get_corres_filename(self, pair_idx):
	        """ To be overloaded: filename of the correspondences of a pair. """
	        raise NotImplementedError()

	    def get_homography_filename(self, pair_idx):
	        """ To be overloaded: filename of the homography of a pair. """
	        raise NotImplementedError()

	    def get_flow_filename(self, pair_idx):
	        """ To be overloaded: filename of the flow of a pair. """
	        raise NotImplementedError()

	    def get_mask_filename(self, pair_idx):
	        """ To be overloaded: filename of the mask of a pair. """
	        raise NotImplementedError()

	    def get_pair(self, idx, output=()):
	        """ returns (img1, img2, `metadata`)

	        `metadata` is a dict() that can contain:
	            flow: optical flow
	            aflow: absolute flow
	            corres: list of 2d-2d correspondences
	            mask: boolean image of flow validity (in the first image)
	            ...
	        """
	        raise NotImplementedError()

	    def get_paired_images(self):
	        """ Return the set of filenames of all images that appear in one of
	        the first `npairs` entries of `image_pairs`.
	        """
	        fns = set()
	        for i in range(self.npairs):
	            a, b = self.image_pairs[i]
	            fns.add(self.get_filename(a))
	            fns.add(self.get_filename(b))
	        return fns

	    def __len__(self):
	        return self.npairs # size should correspond to the number of pairs, not images

	    def __repr__(self):
	        res = 'Dataset: %s\n' % self.__class__.__name__
	        res += ' %d images,' % self.nimg
	        res += ' %d image pairs' % self.npairs
	        res += '\n root: %s...\n' % self.root
	        return res

	    @staticmethod
	    def _flow2png(flow, path):
	        """ Quantize `flow` to 1/16th steps, save it as an image at `path`
	        and return the quantized flow (i.e. what `_png2flow` will read back).

	        Values are stored as 16-bit signed fixed point (scaled by 16), hence
	        the clipping to the int16 range [-2**15, 2**15-1] before the cast.
	        """
	        flow = np.clip(np.around(16*flow), -2**15, 2**15-1)
	        # reinterpret the int16 values as raw bytes so they fit 8-bit image channels
	        raw = np.int16(flow).view(np.uint8)
	        Image.fromarray(raw).save(path)
	        return flow / 16

	    @staticmethod
	    def _png2flow(path):
	        """ Load a flow saved by `_flow2png` and return it as float32.

	        Raises IOError if the file cannot be opened or decoded.
	        """
	        try:
	            flow = np.asarray(Image.open(path)).view(np.int16)
	            return np.float32(flow) / 16
	        except Exception as err:
	            # `Exception` (not a bare except) so that KeyboardInterrupt /
	            # SystemExit are not disguised as a loading error.
	            raise IOError("Error loading flow for %s" % path) from err



	class StillPairDataset (PairDataset):
	    """ A dataset of 'still' image pairs.

	    Pairs are read from `image_pairs`; the ground truth that is produced
	    only models the axis-aligned rescaling between the sizes of the two
	    images (no other motion).
	    """
	    def get_pair(self, pair_idx, output=()):
	        """ Return (img1, img2, meta) for the pair `pair_idx`.

	        `output` is a collection of keys (or a whitespace-separated string)
	        among 'aflow', 'flow', 'mask' and 'homography' selecting what is
	        put into the `meta` dict.
	        """
	        requested = output.split() if isinstance(output, str) else output
	        first, second = (self.get_image(k) for k in self.image_pairs[pair_idx])

	        width, height = first.size
	        scale_x = second.size[0] / float(width)
	        scale_y = second.size[1] / float(height)

	        meta = {}

	        if any(key in requested for key in ('aflow', 'flow')):
	            # (H, W, 2) grid holding the (x, y) coordinates of every pixel
	            grid = np.mgrid[0:height, 0:width][::-1]
	            grid = grid.transpose(1, 2, 0).astype(np.float32)
	            absolute = grid * (scale_x, scale_y)
	            meta['aflow'] = absolute
	            meta['flow'] = absolute - grid

	        if 'mask' in requested:
	            # every pixel of the first image is valid
	            meta['mask'] = np.ones((height, width), np.uint8)

	        if 'homography' in requested:
	            diagonal = np.float32([scale_x, scale_y, 1])
	            meta['homography'] = np.diag(diagonal)

	        return first, second, meta



	class SyntheticPairDataset (PairDataset):
	    """ A synthetic generator of image pairs.

	    Wraps a plain image dataset and builds each pair from a single image,
	    using the `scale` and `distort` transformations.
	    """
	    def __init__(self, dataset, scale='', distort=''):
	        self.attach_dataset(dataset)
	        self.distort = instanciate_transformation(distort)
	        self.scale = instanciate_transformation(scale)

	    def attach_dataset(self, dataset):
	        """ Bind to `dataset` (a Dataset that is not a PairDataset) and
	        borrow its image accessors; there is one pair per image.
	        """
	        assert isinstance(dataset, Dataset)
	        assert not isinstance(dataset, PairDataset)
	        self.dataset = dataset
	        self.npairs = dataset.nimg
	        # delegate image access straight to the wrapped dataset
	        self.get_image = dataset.get_image
	        self.get_key = dataset.get_key
	        self.get_filename = dataset.get_filename
	        self.root = None

	    def make_pair(self, img):
	        """ Turn one image into the two images of a pair (here: twice the same). """
	        return img, img

	    def get_pair(self, i, output=('aflow')):
	        """ Build the i-th synthetic pair and return (img1, img2, meta).

	        The image is first passed through `self.scale`, duplicated by
	        `make_pair`, and the second copy goes through `self.distort`
	        starting from an identity perspective. `meta` holds 'flow' and
	        'aflow' and/or 'homography' depending on `output` (a collection of
	        keys or a whitespace-separated string).
	        """
	        wanted = output.split() if isinstance(output, str) else output

	        source = self.dataset.get_image(i)
	        img1, to_distort = self.make_pair(self.scale(source))

	        # identity perspective: the transformation reports back the one it applied
	        distorted = self.distort({'img': to_distort, 'persp': (1,0,0,0,1,0,0,0)})
	        W, H = img1.size
	        trf = distorted['persp']

	        meta = {}
	        if 'aflow' in wanted or 'flow' in wanted:
	            # (x, y) coordinates of every pixel, one row per pixel
	            coords = np.mgrid[0:H, 0:W][::-1].reshape(2, H*W).T
	            warped = persp_apply(trf, coords).reshape(H, W, 2)
	            aflow = np.float32(warped)
	            meta['flow'] = aflow - coords.reshape(H, W, 2)
	            meta['aflow'] = aflow

	        if 'homography' in wanted:
	            # append the last coefficient to get a full 3x3 matrix
	            full = trf + (1,)
	            meta['homography'] = np.float32(full).reshape(3, 3)

	        return img1, distorted['img'], meta

	    def __repr__(self):
	        scale_txt = repr(self.scale).replace('\n','')
	        distort_txt = repr(self.distort).replace('\n','')
	        parts = [
	            'Dataset: %s\n' % self.__class__.__name__,
	            ' %d images and pairs' % self.npairs,
	            '\n root: %s...' % self.dataset.root,
	            '\n Scale: %s' % scale_txt,
	            '\n Distort: %s' % distort_txt,
	            '\n',
	        ]
	        return ''.join(parts)



	class TransformedPairs (PairDataset):
	    """ Automatic data augmentation for pre-existing image pairs.
	    Given an image pair dataset, it generates synthetically jittered pairs
	    using random transformations (e.g. homographies & noise).
	    """
	    def __init__(self, dataset, trf=''):
	        self.attach_dataset(dataset)
	        self.trf = instanciate_transformation(trf)

	    def attach_dataset(self, dataset):
	        """ Bind to `dataset` (must be a PairDataset), copy its sizes and
	        borrow its image accessors.
	        """
	        assert isinstance(dataset, PairDataset)
	        self.dataset = dataset
	        self.nimg = dataset.nimg
	        self.npairs = dataset.npairs
	        self.get_image = dataset.get_image
	        self.get_key = dataset.get_key
	        self.get_filename = dataset.get_filename
	        self.root = None

	    def get_pair(self, i, output=''):
	        """ Procedure:
	        Fetch pair `i` (with the requested `output`) from the wrapped
	        dataset, apply `self.trf` to the second image, and update the
	        ground-truth found in the metadata ('aflow', 'flow', 'corres',
	        'homography') so that it matches the transformed second image.

	        'aflow', 'flow' and 'corres' are updated in place.
	        Returns (img_a, transformed img_b, metadata).
	        """
	        img_a, img_b_, metadata = self.dataset.get_pair(i, output)

	        # start from the identity perspective; the transformation reports
	        # back (in 'persp') the perspective it actually applied
	        img_b = self.trf({'img': img_b_, 'persp':(1,0,0,0,1,0,0,0)})
	        trf = img_b['persp']

	        has_aflow = 'aflow' in metadata
	        has_flow = 'flow' in metadata
	        if has_aflow or has_flow:
	            W, H = img_a.size
	            mgrid = np.mgrid[0:H, 0:W][::-1].transpose(1,2,0).astype(np.float32)
	            if has_aflow:
	                aflow = metadata['aflow']
	                aflow[:] = persp_apply(trf, aflow.reshape(-1,2)).reshape(aflow.shape)
	            else:
	                # only the relative flow is available: rebuild the absolute
	                # flow from it instead of failing on the missing key
	                src = metadata['flow'] + mgrid
	                aflow = persp_apply(trf, src.reshape(-1,2)).reshape(src.shape)
	            if has_flow:
	                flow = metadata['flow']
	                flow[:] = aflow - mgrid

	        if 'corres' in metadata:
	            corres = metadata['corres']
	            # only the positions in the second image are affected
	            corres[:,1] = persp_apply(trf, corres[:,1])

	        if 'homography' in metadata:
	            # p_b = homography * p_a
	            trf_ = np.float32(trf+(1,)).reshape(3,3)
	            metadata['homography'] = np.float32(trf_ @ metadata['homography'])

	        return img_a, img_b['img'], metadata

	    def __repr__(self):
	        res = 'Transformed Pairs from %s\n' % type(self.dataset).__name__
	        res += ' %d images and pairs' % self.npairs
	        res += '\n root: %s...' % self.dataset.root
	        res += '\n transform: %s' % (repr(self.trf).replace('\n',''))
	        return res + '\n'



	class CatPairDataset (CatDataset):
	    ''' Concatenation of several pair datasets.

	    Pair indices of the concatenation run through the pairs of each
	    dataset in turn; `pair_offsets[k]` is the global index of the first
	    pair of the k-th dataset.
	    '''
	    def __init__(self, *datasets):
	        CatDataset.__init__(self, *datasets)
	        pair_offsets = [0]
	        for db in datasets:
	            pair_offsets.append(db.npairs)
	        self.pair_offsets = np.cumsum(pair_offsets)
	        self.npairs = self.pair_offsets[-1]

	    def __len__(self):
	        return self.npairs

	    def __repr__(self):
	        fmt_str = "CatPairDataset("
	        for db in self.datasets:
	            fmt_str += str(db).replace("\n"," ") + ', '
	        return fmt_str[:-2] + ')'

	    def pair_which(self, i):
	        ''' Map a global pair index to (dataset position, local pair index).

	        Raises IndexError when `i` is not in [0, npairs).
	        '''
	        # validate the pair index itself: the dataset position found below
	        # says nothing about whether `i` is in range
	        if not 0 <= i < self.npairs:
	            raise IndexError('Bad pair index %d (must be in [0, %d))' % (i, self.npairs))
	        pos = np.searchsorted(self.pair_offsets, i, side='right')-1
	        return pos, i - self.pair_offsets[pos]

	    def pair_call(self, func, i, *args, **kwargs):
	        ''' Call method `func` of the dataset owning pair `i`, with the
	        local pair index followed by any extra arguments.
	        '''
	        b, j = self.pair_which(i)
	        return getattr(self.datasets[b], func)(j, *args, **kwargs)

	    def get_pair(self, i, output=()):
	        b, i = self.pair_which(i)
	        return self.datasets[b].get_pair(i, output)

	    def get_flow_filename(self, pair_idx, *args, **kwargs):
	        return self.pair_call('get_flow_filename', pair_idx, *args, **kwargs)

	    def get_mask_filename(self, pair_idx, *args, **kwargs):
	        return self.pair_call('get_mask_filename', pair_idx, *args, **kwargs)

	    def get_corres_filename(self, pair_idx, *args, **kwargs):
	        return self.pair_call('get_corres_filename', pair_idx, *args, **kwargs)



	def is_pair(x):
	    """ Tell whether `x` is a pair: a tuple or list of length 2, or a
	    1-dimensional numpy array with exactly 2 elements.
	    """
	    if isinstance(x, np.ndarray):
	        return x.ndim == 1 and x.shape[0] == 2
	    return isinstance(x, (tuple, list)) and len(x) == 2