Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Addition of OmniPrint dataset #152

Open
wants to merge 4 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@ A collection of extensions and data-loaders for few-shot learning & meta-learnin
- Caltech-UCSD Birds ([Hilliard et al., 2019](https://arxiv.org/abs/1802.04376), [Wah et al., 2019](http://www.vision.caltech.edu/visipedia/CUB-200-2011.html))
- Double MNIST ([Sun, 2019](https://github.com/shaohua0116/MultiDigitMNIST))
- Triple MNIST ([Sun, 2019](https://github.com/shaohua0116/MultiDigitMNIST))
- OmniPrint ([Sun et al., 2021](https://github.com/SunHaozhe/OmniPrint-datasets))
- **Few-shot segmentation** (semantic segmentation):
- Pascal5i 1-way Setup
- **Few-shot classification (tabular datasets)**
Expand Down
3 changes: 3 additions & 0 deletions torchmeta/datasets/__init__.py
Original file line number Diff line number Diff line change
@@ -1,12 +1,14 @@
from torchmeta.datasets.triplemnist import TripleMNIST
from torchmeta.datasets.doublemnist import DoubleMNIST

from torchmeta.datasets.cub import CUB
from torchmeta.datasets.cifar100 import CIFARFS, FC100
from torchmeta.datasets.miniimagenet import MiniImagenet
from torchmeta.datasets.omniglot import Omniglot
from torchmeta.datasets.tieredimagenet import TieredImagenet
from torchmeta.datasets.tcga import TCGA
from torchmeta.datasets.pascal5i import Pascal5i
from torchmeta.datasets.omniprint import OmniPrint
from torchmeta.datasets.letter import Letter
from torchmeta.datasets.one_hundred_plants_texture import PlantsTexture
from torchmeta.datasets.one_hundred_plants_shape import PlantsShape
Expand All @@ -28,6 +30,7 @@
'DoubleMNIST',
'TripleMNIST',
'Pascal5i',
'OmniPrint',
'helpers',
# tabular data
'Letter',
Expand Down
44 changes: 43 additions & 1 deletion torchmeta/datasets/helpers.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,8 @@
import warnings

from torchmeta.datasets import (Omniglot, MiniImagenet, TieredImagenet, CIFARFS,
FC100, CUB, DoubleMNIST, TripleMNIST, Pascal5i)
FC100, CUB, DoubleMNIST, TripleMNIST, Pascal5i,
OmniPrint)
from torchmeta.transforms import Categorical, ClassSplitter, Rotation, SegmentationPairTransform
from torchvision.transforms import Compose, Resize, CenterCrop, ToTensor

Expand Down Expand Up @@ -412,3 +413,44 @@ def pascal5i(folder, shots, ways=1, shuffle=True, test_shots=None,
return helper_with_default(Pascal5i, folder, shots, ways,
shuffle=shuffle, test_shots=test_shots,
seed=seed, defaults=defaults, **kwargs)



def omniprint(folder, shots, ways, shuffle=True, test_shots=None,
              seed=None, **kwargs):
    """Helper function to create a meta-dataset for the OmniPrint dataset.

    Parameters
    ----------
    folder : string
        Root directory where the dataset folder `omniprint` exists.

    shots : int
        Number of (training) examples per class in each task. This corresponds
        to `k` in `k-shot` classification.

    ways : int
        Number of classes per task. This corresponds to `N` in `N-way`
        classification.

    shuffle : bool (default: `True`)
        Shuffle the examples when creating the tasks.

    test_shots : int, optional
        Number of test examples per class in each task. If `None`, then the
        number of test examples is equal to the number of training examples per
        class.

    seed : int, optional
        Random seed to be used in the meta-dataset.

    kwargs
        Additional arguments passed to the `OmniPrint` class. Note that
        `OmniPrint` requires a `print_split` keyword argument (one of
        `'meta1'`..`'meta5'`) and raises a `ValueError` without it, so
        `print_split` must be supplied here through `kwargs`.

    See also
    --------
    `datasets.OmniPrint` : Meta-dataset for the OmniPrint dataset.
    """
    return helper_with_default(OmniPrint, folder, shots, ways,
                               shuffle=shuffle, test_shots=test_shots,
                               seed=seed, **kwargs)
267 changes: 267 additions & 0 deletions torchmeta/datasets/omniprint.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,267 @@
import os
import json
import h5py
from PIL import Image

from torchmeta.utils.data import Dataset, ClassDataset, CombinationMetaDataset
from torchmeta.datasets.utils import download_file_from_google_drive


class OmniPrint(CombinationMetaDataset):
    """The OmniPrint dataset [1], based on [2]. A synthetically generated
    dataset of 1409 classes and 935 different fonts. The dataset comes in 5
    different splits with increasing amounts of synthetic noise.

    Parameters
    ----------
    root : string
        Root directory where the dataset folder `omniprint` exists.

    num_classes_per_task : int
        Number of classes per tasks. This corresponds to "N" in "N-way"
        classification.

    meta_train : bool (default: `False`)
        Use the meta-train split of the dataset. If set to `True`, then the
        arguments `meta_val` and `meta_test` must be set to `False`. Exactly
        one of these three arguments must be set to `True`.

    meta_val : bool (default: `False`)
        Use the meta-validation split of the dataset. If set to `True`, then
        the arguments `meta_train` and `meta_test` must be set to `False`.
        Exactly one of these three arguments must be set to `True`.

    meta_test : bool (default: `False`)
        Use the meta-test split of the dataset. If set to `True`, then the
        arguments `meta_train` and `meta_val` must be set to `False`. Exactly
        one of these three arguments must be set to `True`.

    meta_split : string in {'train', 'val', 'test'}, optional
        Name of the split to use. This overrides the arguments `meta_train`,
        `meta_val` and `meta_test` if all three are set to `False`.

    print_split : string in {'meta1', 'meta2', 'meta3', 'meta4', 'meta5'}
        (default: `None`)
        The string value is mapped to the given OmniPrint split defined in
        [1]. The higher the split number, the more synthetic noise is added
        to the images. A `ValueError` is raised when no `print_split` is
        given.

    transform : callable, optional
        A function/transform that takes a `PIL` image, and returns a
        transformed version. See also `torchvision.transforms`.

    target_transform : callable, optional
        A function/transform that takes a target, and returns a transformed
        version. See also `torchvision.transforms`.

    dataset_transform : callable, optional
        A function/transform that takes a dataset (ie. a task), and returns a
        transformed version of it. E.g. `torchmeta.transforms.ClassSplitter()`.

    class_augmentations : list of callable, optional
        A list of functions that augment the dataset with new classes. These
        classes are transformations of existing classes. E.g.
        `torchmeta.transforms.HorizontalFlip()`.

    download : bool (default: `False`)
        If `True`, downloads the zip files and processes the dataset in the
        root directory (under the `omniprint` folder). If the dataset is
        already available, this does not download/process the dataset again.

    Notes
    -----
    The dataset is downloaded from the original [OmniPrint repository]
    (https://github.com/SunHaozhe/OmniPrint-datasets). The meta
    train/validation/test splits are over 900/149/360 classes.

    References
    ----------
    .. [1] H. Sun, W.-W. Tu, I. M. Guyon (2021). OmniPrint: A Configurable
           Printed Character Synthesizer. in Thirty-fifth Conference on Neural
           Information Processing Systems Datasets and Benchmarks Track
           (Round 1), (https://openreview.net/forum?id=R07XwJPmgpl)

    .. [2] Lake, B. M., Salakhutdinov, R., and Tenenbaum, J. B. (2015).
           Human-level concept learning through probabilistic program
           induction. Science, 350(6266), 1332-1338
           (http://www.sciencemag.org/content/350/6266/1332.short)
    """
    def __init__(self, root, num_classes_per_task=None, meta_train=False,
                 meta_val=False, meta_test=False, meta_split=None,
                 transform=None, target_transform=None, dataset_transform=None,
                 class_augmentations=None, download=False, print_split=None
                 ):
        # The class-level dataset does the actual file handling; task
        # construction is delegated to the CombinationMetaDataset machinery.
        class_dataset = OmniPrintClassDataset(
            root,
            meta_train=meta_train, meta_val=meta_val, meta_test=meta_test,
            meta_split=meta_split, print_split=print_split,
            transform=transform,
            class_augmentations=class_augmentations,
            download=download)
        super(OmniPrint, self).__init__(class_dataset, num_classes_per_task,
            target_transform=target_transform,
            dataset_transform=dataset_transform)


class OmniPrintClassDataset(ClassDataset):
    """Class-level dataset for OmniPrint: one item per character class.

    Backed by one HDF5 data file and one JSON labels file per
    (print_split, meta_split) pair; `download()` builds these files from an
    archive hosted on Google Drive.
    """
    # Google Drive file id of the archive containing the raw dataset.
    gdrive_id = '1JBXYMTsdlm8RaEBPqrJbDRzs3hJ4q_gH'
    folder = 'omniprint'

    # Filename templates: {0} = folder for the zip; {0} = print_split
    # (meta1..meta5) and {1} = meta_split (train/val/test) for the rest.
    zip_filename = '{0}.zip'
    filename = '{0}_{1}_data.hdf5'
    filename_labels = '{0}_{1}_labels.json'

    def __init__(self, root, meta_train=False, meta_val=False, meta_test=False,
                 meta_split=None, print_split=None, transform=None,
                 class_augmentations=None, download=False):
        # See `OmniPrint` for the documentation of the arguments.
        super(OmniPrintClassDataset, self).__init__(
            meta_train=meta_train,
            meta_val=meta_val,
            meta_test=meta_test,
            meta_split=meta_split,
            class_augmentations=class_augmentations)

        # `print_split` selects one of the 5 OmniPrint noise levels; there is
        # no sensible default, so it is mandatory.
        if print_split is None:
            raise ValueError('Trying to use the OmniPrint dataset without '
                'setting the print split. You must set `print_split` to meta1, '
                'meta2, meta3, meta4 or meta5.')

        self.root = os.path.join(os.path.expanduser(
            root), self.folder)
        self.print_split = print_split
        self.transform = transform

        # Both per-split files are keyed by (print_split, meta_split), e.g.
        # `meta1_train_data.hdf5` / `meta1_train_labels.json`.
        self.split_filename = os.path.join(
            self.root,
            self.filename.format(print_split, self.meta_split))
        self.split_filename_labels = os.path.join(
            self.root,
            self.filename_labels.format(print_split, self.meta_split))

        # Lazily-opened HDF5 handle and lazily-loaded labels list (see the
        # `data` and `labels` properties).
        self._data = None
        self._labels = None

        if download:
            self.download()

        if not self._check_integrity():
            raise RuntimeError('OmniPrint integrity check failed')
        self._num_classes = len(self.labels)

    def __getitem__(self, index):
        # Indexing is modulo num_classes; indices beyond num_classes
        # presumably come from class augmentations — TODO confirm against
        # `ClassDataset`.
        # NOTE(review): the label entry is joined with '/' to form an HDF5
        # path. This resolves only if the first element of each label entry
        # is the group name created in `download()` (the print split) —
        # verify against the labels JSON layout.
        character_name = '/'.join(self.labels[index % self.num_classes])
        data = self.data[character_name]
        transform = self.get_transform(index, self.transform)
        target_transform = self.get_target_transform(index)

        return OmniPrintDataset(
            index, data, character_name,
            transform=transform, target_transform=target_transform)

    @property
    def num_classes(self):
        # Number of classes in the selected meta-split.
        return self._num_classes

    @property
    def data(self):
        # Open the HDF5 data file on first access and cache the handle.
        if self._data is None:
            self._data = h5py.File(self.split_filename, 'r')
        return self._data

    @property
    def labels(self):
        # Load the labels JSON on first access and cache the result.
        if self._labels is None:
            with open(self.split_filename_labels, 'r') as f:
                self._labels = json.load(f)
        return self._labels

    def _check_integrity(self):
        # The split is considered present when both of its files exist.
        return (os.path.isfile(self.split_filename)
                and os.path.isfile(self.split_filename_labels))

    def close(self):
        # Close the cached HDF5 handle; it is re-opened lazily on next access.
        if self._data is not None:
            self._data.close()
            self._data = None

    def download(self):
        # Download the archive, extract it, then convert the extracted PNG
        # trees into one HDF5 file per (print_split, split) pair.
        import zipfile
        import shutil
        import glob
        from tqdm import tqdm

        if self._check_integrity():
            return

        zip_foldername = os.path.join(
            self.root, self.zip_filename.format(self.folder))
        # Download the datasets
        if not os.path.isfile(zip_foldername):
            download_file_from_google_drive(
                self.gdrive_id, self.root,
                self.zip_filename.format(self.folder))

        # Unzip the dataset
        # NOTE(review): `zip_foldername` is the zip *file* path, so
        # `os.path.isdir` is always False and extraction re-runs whenever the
        # archive is present — the check probably meant the extracted folder.
        if not os.path.isdir(zip_foldername):
            with zipfile.ZipFile(zip_foldername) as f:
                for member in tqdm(f.infolist(), desc='Extracting '):
                    try:
                        f.extract(member, self.root)
                    except zipfile.BadZipFile:
                        # Best-effort: a corrupted member is reported but
                        # does not abort the extraction loop.
                        print('Error: Zipfile is corrupted')

        for print_split in ['meta1', 'meta2', 'meta3', 'meta4', 'meta5']:
            for split in tqdm(['train', 'val', 'test'], desc=print_split):
                filename_labels = os.path.join(
                    self.root, self.filename_labels.format(print_split, split))

                with open(filename_labels, 'r') as f:
                    labels = json.load(f)

                filename = os.path.join(
                    self.root, self.filename.format(print_split, split))

                with h5py.File(filename, 'w') as f:
                    group = f.create_group(print_split)
                    # Each label entry is a triple; only the last two
                    # elements (alphabet, character) locate the image folder.
                    for _, alphabet, character in labels:
                        filenames = glob.glob(
                            os.path.join(
                                self.root, print_split,
                                alphabet, character, '*.png'))
                        # One (num_images, 32, 32) uint8 dataset per
                        # character; assumes the extracted PNGs are 32x32 —
                        # TODO confirm.
                        dataset = group.create_dataset('{0}/{1}'.format(
                            alphabet, character),
                            (len(filenames), 32, 32),
                            dtype='uint8')

                        for i, char_filename in enumerate(filenames):
                            # Grayscale ('L') PIL image; presumably converted
                            # to a uint8 array by h5py on assignment.
                            image = Image.open(
                                char_filename, mode='r').convert('L')
                            dataset[i] = image

            # Remove the extracted PNG tree once converted to HDF5.
            shutil.rmtree(os.path.join(self.root, print_split))


class OmniPrintDataset(Dataset):
    """Task-level dataset over the images of a single OmniPrint character.

    Yields `(image, target)` pairs where the target is the character's
    HDF5 path name.
    """
    def __init__(self, index, data, character_name,
                 transform=None, target_transform=None):
        super(OmniPrintDataset, self).__init__(index,
            transform=transform, target_transform=target_transform)
        # `data` holds the raw uint8 images for this character.
        self.data = data
        self.character_name = character_name

    def __len__(self):
        # One entry per image of this character.
        return len(self.data)

    def __getitem__(self, index):
        image = Image.fromarray(self.data[index])
        if self.transform is not None:
            image = self.transform(image)

        target = self.character_name
        if self.target_transform is not None:
            target = self.target_transform(target)

        return (image, target)