Commit c7a39ba9 authored by edgarriba, committed by Soumith Chintala

add PhotoTour dataset

parent c47418f0
......@@ -51,6 +51,7 @@ The following dataset loaders are available:
- `CIFAR10 and CIFAR100 <#cifar>`__
- `STL10 <#stl10>`__
- `SVHN <#svhn>`__
- `PhotoTour <#phototour>`__
Datasets have the API: ``__getitem__`` and ``__len__``. They all subclass
from ``torch.utils.data.Dataset``, hence they can all be multi-threaded.
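A minimal sketch of multi-threaded loading via ``torch.utils.data.DataLoader``
(the CIFAR10 choice and the loader settings below are illustrative, not part of
this commit):

.. code:: python

    import torch.utils.data
    import torchvision.datasets as dset
    import torchvision.transforms as transforms

    dataset = dset.CIFAR10(root='dir where data is', download=True,
                           transform=transforms.ToTensor())
    # num_workers > 0 loads samples in background worker processes
    loader = torch.utils.data.DataLoader(dataset, batch_size=4,
                                         shuffle=True, num_workers=2)
    for images, labels in loader:
        print(images.size(), labels.size())
        break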
......@@ -215,6 +216,23 @@ here <https://github.com/facebook/fb.resnet.torch/blob/master/INSTALL.md#downloa
`Here is an
example <https://github.com/pytorch/examples/blob/27e2a46c1d1505324032b1d94fc6ce24d5b67e97/imagenet/main.py#L48-L62>`__.
PhotoTour
~~~~~~~~~

**Learning Local Image Descriptors Data**
http://phototour.cs.washington.edu/patches/default.htm

.. code:: python

    import torchvision.datasets as dset
    import torchvision.transforms as transforms

    dataset = dset.PhotoTour(root='dir where images are',
                             name='name of the dataset to load',
                             transform=transforms.ToTensor())
    print('Loaded PhotoTour: {} with {} images.'
          .format(dataset.name, len(dataset.data)))
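With ``train=False`` the loader iterates over the ground-truth match list and
each item is a pair of patches plus a match label, as implemented in
``__getitem__`` below. A minimal sketch (``notredame`` is one of the three
available sets; ``download=True`` fetches and caches it first):

.. code:: python

    import torchvision.datasets as dset
    import torchvision.transforms as transforms

    test_set = dset.PhotoTour(root='dir where images are',
                              name='notredame',
                              train=False,
                              transform=transforms.ToTensor(),
                              download=True)
    # each item is (patch1, patch2, is_match); is_match is 1 for a true match
    patch1, patch2, is_match = test_set[0]
    print('Pairs available: {}'.format(len(test_set)))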
Models
======
......
......@@ -10,4 +10,4 @@ __all__ = ('LSUN', 'LSUNClass',
'ImageFolder',
'CocoCaptions', 'CocoDetection',
'CIFAR10', 'CIFAR100',
'MNIST', 'STL10', 'SVHN')
'MNIST', 'STL10', 'SVHN', 'PhotoTour')
import os
import errno
import numpy as np
from PIL import Image
import torch
import torch.utils.data as data
class PhotoTour(data.Dataset):
    urls = {
        'notredame': 'http://www.iis.ee.ic.ac.uk/~vbalnt/phototourism-patches/notredame.zip',
        'yosemite': 'http://www.iis.ee.ic.ac.uk/~vbalnt/phototourism-patches/yosemite.zip',
        'liberty': 'http://www.iis.ee.ic.ac.uk/~vbalnt/phototourism-patches/liberty.zip'
    }
    mean = {'notredame': 0.4854, 'yosemite': 0.4844, 'liberty': 0.4437}
    std = {'notredame': 0.1864, 'yosemite': 0.1818, 'liberty': 0.2019}
    lens = {'notredame': 468159, 'yosemite': 633587, 'liberty': 450092}

    image_ext = 'bmp'
    info_file = 'info.txt'
    matches_files = 'm50_100000_100000_0.txt'

    def __init__(self, root, name, train=True, transform=None, download=False):
        self.root = root
        self.name = name
        self.data_dir = os.path.join(root, name)
        self.data_down = os.path.join(root, '{}.zip'.format(name))
        self.data_file = os.path.join(root, '{}.pt'.format(name))

        self.train = train
        self.transform = transform

        self.mean = self.mean[name]
        self.std = self.std[name]

        if download:
            self.download()

        if not self._check_exists():
            raise RuntimeError('Dataset not found.' +
                               ' You can use download=True to download it')

        # load the serialized data
        self.data, self.labels, self.matches = torch.load(self.data_file)
    def __getitem__(self, index):
        # training split: return a single patch
        if self.train:
            data = self.data[index]
            if self.transform is not None:
                data = self.transform(data)
            return data
        # test split: return a pair of patches and the ground-truth match label
        m = self.matches[index]
        data1, data2 = self.data[m[0]], self.data[m[1]]
        if self.transform is not None:
            data1 = self.transform(data1)
            data2 = self.transform(data2)
        return data1, data2, m[2]

    def __len__(self):
        if self.train:
            return self.lens[self.name]
        return len(self.matches)

    def _check_exists(self):
        return os.path.exists(self.data_file)

    def _check_downloaded(self):
        return os.path.exists(self.data_dir)
    def download(self):
        from six.moves import urllib

        print('\n-- Loading PhotoTour dataset: {}\n'.format(self.name))

        if self._check_exists():
            print('# Found cached data {}'.format(self.data_file))
            return

        if not self._check_downloaded():
            # download files
            url = self.urls[self.name]
            filename = url.rpartition('/')[2]
            file_path = os.path.join(self.root, filename)

            try:
                os.makedirs(self.root)
            except OSError as e:
                if e.errno == errno.EEXIST:
                    pass
                else:
                    raise

            print('# Downloading {} into {}\n\nIt might take a while.'
                  ' Please grab yourself a coffee and relax.'
                  .format(url, file_path))

            urllib.request.urlretrieve(url, file_path)
            assert os.path.exists(file_path)

            print('# Extracting data {}\n'.format(self.data_down))

            import zipfile
            with zipfile.ZipFile(file_path, 'r') as z:
                z.extractall(self.data_dir)
            os.unlink(file_path)

        # process and save as torch files
        print('# Caching data {}'.format(self.data_file))

        data_set = (
            read_image_file(self.data_dir, self.image_ext, self.lens[self.name]),
            read_info_file(self.data_dir, self.info_file),
            read_matches_files(self.data_dir, self.matches_files)
        )

        with open(self.data_file, 'wb') as f:
            torch.save(data_set, f)
def read_image_file(data_dir, image_ext, n):
    """Return a Tensor containing the patches
    """
    def PIL2array(_img):
        """Convert PIL image type to numpy 2D array
        """
        return np.array(_img.getdata(), dtype=np.uint8).reshape(64, 64)

    def find_files(_data_dir, _image_ext):
        """Return a list with the file names of the images containing the patches
        """
        files = []
        # find those files with the specified extension
        for file_dir in os.listdir(_data_dir):
            if file_dir.endswith(_image_ext):
                files.append(os.path.join(_data_dir, file_dir))
        return sorted(files)  # sort files in ascending order to keep relations

    patches = []
    list_files = find_files(data_dir, image_ext)

    for file_path in list_files:
        img = Image.open(file_path)
        # each image is a 1024x1024 mosaic of 64x64 patches
        for y in range(0, 1024, 64):
            for x in range(0, 1024, 64):
                patch = img.crop((x, y, x + 64, y + 64))
                patches.append(PIL2array(patch))
    return torch.ByteTensor(np.array(patches[:n]))
def read_info_file(data_dir, info_file):
    """Return a Tensor containing the list of labels
       Read the file and keep only the ID of the 3D point.
    """
    labels = []
    with open(os.path.join(data_dir, info_file), 'r') as f:
        labels = [int(line.split()[0]) for line in f]
    return torch.LongTensor(labels)


def read_matches_files(data_dir, matches_file):
    """Return a Tensor containing the ground truth matches
       Read the file and keep only 3D point ID.
       Matches are represented with a 1, non matches with a 0.
    """
    matches = []
    with open(os.path.join(data_dir, matches_file), 'r') as f:
        for line in f:
            l = line.split()
            matches.append([int(l[0]), int(l[3]), int(l[1] == l[4])])
    return torch.LongTensor(matches)
if __name__ == '__main__':
    dataset = PhotoTour(root='/home/eriba/datasets/patches_dataset',
                        name='notredame',
                        download=True)
    print('Loaded PhotoTour: {} with {} images.'
          .format(dataset.name, len(dataset.data)))
    assert len(dataset.data) == len(dataset.labels)