added custom dataset implementation

- added custom dataset in form of ADImageFolderDataset and custom runner - updated readme to contain custom dataset description - slightly changed dataset preview to return stacks instead of concatenations - slightly changed imagenet's __getitem__ to be able to handle malformed_normal as well - fixed some print typos - added fixes + error handling for trainer and dataset preview to be able to process tiny datasets (< ~10 samples)
subhankardori · Jun 8, 2021 · b2fc0fe · b2fc0fe
1 parent 5d6a6e7
commit b2fc0fe
Show file tree

Hide file tree

Showing 12 changed files with 354 additions and 22 deletions.
diff --git a/README.md b/README.md
@@ -82,10 +82,10 @@ For full OE:
 Please note that you have to manually download ImageNet1k and ImageNet22k and place them in the correct folders.
 Let **dsdir** be your specified dataset directory (per default `../../data/datasets/`). 
 
-ImageNet1k needs to be in `dsdir/imagenet`, containing the devkit, train, and val split in form of a tar file each -- with names `ILSVRC2012_devkit_t12.tar.gz`, `ILSVRC2012_img_train.tar`, and `ILSVRC2012_img_val.tar`. 
+ImageNet1k needs to be in `dsdir/imagenet/`, containing the devkit, train, and val split in form of a tar file each -- with names `ILSVRC2012_devkit_t12.tar.gz`, `ILSVRC2012_img_train.tar`, and `ILSVRC2012_img_val.tar`. 
 These are the default names expected by the PyTorch loaders. You can download ImageNet1k on the official website: http://image-net.org/download. Note that you have to register beforehand. 
 
-ImageNet22k needs to be in `dsdir/imagenet22k/fall11_whole_extracted`, containing all the extracted class directories with pictures, e.g. the folder n12267677 having pictures of acorns.
+ImageNet22k needs to be in `dsdir/imagenet22k/fall11_whole_extracted/`, containing all the extracted class directories with pictures, e.g. the folder n12267677 having pictures of acorns.
 Decompressing the downloaded archive should automatically yield this structure. 
 ImageNet22k, i.e. the full release fall 11, can also be downloaded on the official website: http://image-net.org/download.
 
@@ -102,7 +102,27 @@ Using a semi-supervised setup with one true anomaly per defection:
 #### Pascal VOC
 
     python runners/run_pascalvoc.py 
+
+
+#### Custom Data
+Again, let **dsdir** be your specified dataset directory (per default `../../data/datasets/`). 
+Place your training data in `dsdir/custom/train/classX/` and your test data in `dsdir/custom/test/classX/`, with classX being one of the class folders (they can have arbitrary names, but need to be consistent for training and testing).
+For a one-vs-rest setup (as used for Cifar-10, etc.), place the corresponding images directly in the class folders and run:
+
+    python runners/run_custom.py -ovr 
+
+Otherwise, each class requires a separate set of nominal and anomalous test samples.
+Place the corresponding images in `dsdir/custom/test/classX/normal/`, `dsdir/custom/test/classX/anomalous/`, `dsdir/custom/train/classX/normal/` and run:
 
+    python runners/run_custom.py
+
+If you have some training anomalies in `dsdir/custom/train/classX/anomalous/`, you can use them in a semi-supervised setting with
+
+    python runners/run_custom.py --supervise-mode other
+
+In general, you can adapt most training parameters using the program's arguments (see `python runners/run_custom.py --help`).
+By default, it uses parameters that are assumed to be general-purpose, such as the ImageNet-pre-trained CNN for 224x224 images and ImageNet22k outlier exposure.
+For example, to use confetti noise instead of outlier exposure, set `--supervise-mode` to `malformed_normal` and `--noise-mode` to `confetti`.
 
 ## Train Baselines
 
@@ -210,6 +230,9 @@ Make sure that the class name is unique.
 <details>
 <summary>Add a new Dataset</summary>
 
+First, you should check whether it's possible to use the [custom dataset implementation](#custom-data).
+If not:
+
 1) Create a new python script in the `datasets` package. 
 Implement a dataset that inherits the `fcdd.datasets.bases.TorchvisionDataset` class. 
 Your implementation needs to process all parameters of the `fcdd.datasets.bases.load_dataset` function in its initialization. 

diff --git a/python/fcdd/datasets/__init__.py b/python/fcdd/datasets/__init__.py
@@ -1,17 +1,18 @@
 from copy import deepcopy
 from typing import List
-
 from fcdd.datasets.bases import TorchvisionDataset
 from fcdd.datasets.cifar import ADCIFAR10
 from fcdd.datasets.fmnist import ADFMNIST
 from fcdd.datasets.imagenet import ADImageNet
 from fcdd.datasets.mvtec import ADMvTec
 from fcdd.datasets.pascal_voc import ADPascalVoc
+from fcdd.datasets.image_folder import ADImageFolderDataset
 
-DS_CHOICES = ('mnist', 'cifar10', 'fmnist', 'mvtec', 'imagenet', 'pascalvoc')
+DS_CHOICES = ('mnist', 'cifar10', 'fmnist', 'mvtec', 'imagenet', 'pascalvoc', 'custom')
 PREPROC_CHOICES = (
     'lcn', 'lcnaug1', 'aug1', 'aug1_blackcenter', 'aug1_blackcenter_inverted', 'none'
 )
+CUSTOM_CLASSES = []
 
 
 def load_dataset(dataset_name: str, data_path: str, normal_class: int, preproc: str,
@@ -54,6 +55,14 @@ def load_dataset(dataset_name: str, data_path: str, normal_class: int, preproc:
             supervise_mode=supervise_mode, noise_mode=noise_mode, online_supervision=online_supervision,
             oe_limit=oe_limit, logger=logger, nominal_label=nominal_label
         )
+    elif dataset_name == 'custom':
+        dataset = ADImageFolderDataset(
+            root=data_path, normal_class=normal_class, preproc=preproc,
+            supervise_mode=supervise_mode, noise_mode=noise_mode, online_supervision=online_supervision,
+            oe_limit=oe_limit, logger=logger, nominal_label=nominal_label
+        )
+    else:
+        raise NotImplementedError(f'Dataset {dataset_name} is unknown.')
 
     return dataset
 
@@ -65,6 +74,7 @@ def no_classes(dataset_name: str) -> int:
         'mvtec': 15,
         'imagenet': 30,
         'pascalvoc': 1,
+        'custom': len(CUSTOM_CLASSES)
     }[dataset_name]
 
 
@@ -80,5 +90,6 @@ def str_labels(dataset_name: str) -> List[str]:
             'wood', 'zipper'
         ],
         'imagenet': deepcopy(ADImageNet.ad_classes),
-        'pascalvoc': ['horse']
+        'pascalvoc': ['horse'],
+        'custom': list(CUSTOM_CLASSES)
     }[dataset_name]
diff --git a/python/fcdd/datasets/bases.py b/python/fcdd/datasets/bases.py
@@ -1,5 +1,6 @@
 from abc import ABC, abstractmethod
 from typing import Tuple
+from collections import Counter
 
 import numpy as np
 import torch
@@ -112,7 +113,7 @@ def preview(self, percls=20, train=True) -> torch.Tensor:
                     g = g.repeat(1, x.shape[1], 1, 1)
                 out.append(g)
         self.logprint('Dataset preview generated.')
-        return torch.cat(out)
+        return torch.stack([o[:min(Counter(y.tolist()).values())] for o in out])
 
     def _generate_artificial_anomalies_train_set(self, supervise_mode: str, noise_mode: str, oe_limit: int,
                                                  train_set: Dataset, nom_class: int):

diff --git a/python/fcdd/datasets/image_folder.py b/python/fcdd/datasets/image_folder.py
@@ -0,0 +1,240 @@
+import random
+import os
+import os.path as pt
+import numpy as np
+import torchvision.transforms as transforms
+import torch
+from typing import Tuple, List
+from torch import Tensor
+from torch.utils.data import Subset, DataLoader
+from torchvision.datasets import ImageFolder
+from torchvision.transforms.functional import to_tensor, to_pil_image
+from fcdd.datasets.bases import TorchvisionDataset
+from fcdd.datasets.online_supervisor import OnlineSupervisor
+from fcdd.datasets.preprocessing import get_target_label_idx
+from fcdd.util.logging import Logger
+
+
+def extract_custom_classes(datapath: str) -> List[str]:
+    """
+    Lists the class names of the custom dataset, i.e., the names of all directories that are
+    found directly in ``datapath/custom/test``, in sorted order.
+    Note that only the test split is inspected; the train split is not looked at here.
+
+    :param datapath: dataset root directory that contains the ``custom`` folder.
+    :return: sorted list of the class folder names.
+    """
+    dir = os.path.join(datapath, 'custom', 'test')
+    # keep directories only, plain files lying next to the class folders are ignored
+    classes = [d for d in os.listdir(dir) if os.path.isdir(os.path.join(dir, d))]
+    # NOTE(review): the position in this sorted list is presumably meant to equal the class index
+    # that torchvision's ImageFolder assigns to the same folder -- confirm.
+    classes.sort()
+    return classes
+
+
+class ADImageFolderDataset(TorchvisionDataset):
+    # Anomaly detection dataset that is built from the image folders root/custom/train and root/custom/test.
+    # name of the folder below the dataset root that contains the 'train' and 'test' directories
+    base_folder = 'custom'
+    # False: class folders contain normal/anomalous subfolders; True: one-vs-rest on the class folders.
+    # NOTE(review): presumably overwritten from outside (e.g., by the runner) before instantiation -- not visible here.
+    ovr = False
+
+    def __init__(self, root: str, normal_class: int, preproc: str, nominal_label: int,
+                 supervise_mode: str, noise_mode: str, oe_limit: int, online_supervision: bool,
+                 logger: Logger = None):
+        """
+        This is a general-purpose implementation for custom datasets.
+        It expects the data being contained in class folders and distinguishes between
+        (1) the one-vs-rest (ovr) approach where one class is considered normal
+        and is tested against all other classes being anomalous
+        (2) the general approach where each class folder contains a normal data folder and an anomalous data folder.
+        The :attr:`ovr` determines this.
+
+        For (1) the data folders have to follow this structure:
+        root/custom/train/dog/xxx.png
+        root/custom/train/dog/xxy.png
+        root/custom/train/dog/xxz.png
+
+        root/custom/train/cat/123.png
+        root/custom/train/cat/nsdf3.png
+        root/custom/train/cat/asd932_.png
+
+        For (2):
+        root/custom/train/hazelnut/normal/xxx.png
+        root/custom/train/hazelnut/normal/xxy.png
+        root/custom/train/hazelnut/normal/xxz.png
+        root/custom/train/hazelnut/anomalous/xxa.png    -- may be used during training for a semi-supervised setting
+
+        root/custom/train/screw/normal/123.png
+        root/custom/train/screw/normal/nsdf3.png
+        root/custom/train/screw/anomalous/asd932_.png   -- may be used during training for a semi-supervised setting
+
+        The same holds for the test set, where "train" has to be replaced by "test".
+
+        :param root: root directory where data is found.
+        :param normal_class: the class considered nominal.
+        :param preproc: the kind of preprocessing pipeline.
+        :param nominal_label: the label that marks nominal samples in training. The scores in the heatmaps always
+            rate label 1, thus usually the nominal label is 0, s.t. the scores are anomaly scores.
+        :param supervise_mode: the type of generated artificial anomalies.
+            See :meth:`fcdd.datasets.bases.TorchvisionDataset._generate_artificial_anomalies_train_set`.
+        :param noise_mode: the type of noise used, see :mod:`fcdd.datasets.noise_mode`.
+        :param oe_limit: limits the number of different anomalies in case of Outlier Exposure (defined in noise_mode).
+        :param online_supervision: whether to sample anomalies online in each epoch,
+            or offline before training (same for all epochs in this case).
+        :param logger: logger.
+        """
+        # artificial anomalies are only created on-the-fly in ImageFolderDataset.__getitem__, so offline mode is rejected
+        assert online_supervision, 'Artificial anomaly generation for custom datasets needs to be online'
+        trainpath = pt.join(root, self.base_folder, 'train')
+        testpath = pt.join(root, self.base_folder, 'test')
+        super().__init__(root, logger=logger)
+
+        self.n_classes = 2  # 0: normal, 1: outlier
+        # size used for resizing in the 'aug1' pipeline before cropping, and shape of the placeholder tensor that
+        # ImageFolderDataset hands to the online supervisor
+        self.raw_shape = (3, 248, 248)
+        self.shape = (3, 224, 224)  # shape of your data samples in channels x height x width after image preprocessing
+        self.normal_classes = tuple([normal_class])
+        # every class index except the normal one is an outlier class; needs to be set before extract_mean_std
+        # is invoked below because that method's target transform reads self.outlier_classes
+        self.outlier_classes = list(range(0, len(extract_custom_classes(root))))
+        self.outlier_classes.remove(normal_class)
+        assert nominal_label in [0, 1]
+        self.nominal_label = nominal_label
+        self.anomalous_label = 1 if self.nominal_label == 0 else 0
+
+        # per-channel mean and std, computed here from the nominal training images of the normal class
+        mean, std = self.extract_mean_std(trainpath, normal_class)
+
+        if preproc in ['', None, 'default', 'none']:
+            # no augmentation: training and testing share one pipeline (resize, to tensor, normalize)
+            test_transform = transform = transforms.Compose([
+                transforms.Resize((self.shape[-2], self.shape[-1])),
+                transforms.ToTensor(),
+                transforms.Normalize(mean, std)
+            ])
+        elif preproc in ['aug1']:
+            # testing: deterministic resize and center crop
+            test_transform = transforms.Compose([
+                transforms.Resize((self.raw_shape[-1])),
+                transforms.CenterCrop(self.shape[-1]),
+                transforms.ToTensor(),
+                transforms.Normalize(mean, std)
+            ])
+            # training: resize, slight color jitter, random flip, random crop, and a small amount of Gaussian noise
+            transform = transforms.Compose([
+                transforms.Resize(self.raw_shape[-1]),
+                transforms.ColorJitter(brightness=0.01, contrast=0.01, saturation=0.01, hue=0.01),
+                transforms.RandomHorizontalFlip(),
+                transforms.RandomCrop(self.shape[-1]),
+                transforms.ToTensor(),
+                transforms.Lambda(lambda x: x + 0.001 * torch.randn_like(x)),
+                transforms.Normalize(mean, std)
+            ])
+        #  here you could define other pipelines with augmentations
+        else:
+            raise ValueError('Preprocessing pipeline {} is not known.'.format(preproc))
+
+        # maps a class index to the anomaly label: outlier classes -> anomalous label, anything else -> nominal label
+        target_transform = transforms.Lambda(
+            lambda x: self.anomalous_label if x in self.outlier_classes else self.nominal_label
+        )
+        # an online supervisor is only used for modes other than 'unsupervised' and 'other'
+        if supervise_mode not in ['unsupervised', 'other']:
+            all_transform = OnlineSupervisor(self, supervise_mode, noise_mode, oe_limit)
+        else:
+            all_transform = None
+
+        self._train_set = ImageFolderDataset(
+            trainpath, supervise_mode, self.raw_shape, self.ovr, self.nominal_label, self.anomalous_label,
+            normal_classes=self.normal_classes,
+            transform=transform, target_transform=target_transform, all_transform=all_transform,
+        )
+        if supervise_mode == 'other':  # (semi)-supervised setting
+            self.balance_dataset()
+        else:
+            # keep only the training samples that are labeled nominal and belong to the normal class
+            self._train_set = Subset(
+                self._train_set, np.argwhere(
+                    (np.asarray(self._train_set.anomaly_labels) == self.nominal_label) *
+                    np.isin(self._train_set.targets, self.normal_classes)
+                ).flatten().tolist()
+            )
+
+        # the test set uses the test pipeline and no all_transform, i.e., no artificial anomalies
+        self._test_set = ImageFolderDataset(
+            testpath, supervise_mode, self.raw_shape, self.ovr, self.nominal_label, self.anomalous_label,
+            normal_classes=self.normal_classes,
+            transform=test_transform, target_transform=target_transform,
+        )
+        if not self.ovr:
+            # without ovr the test set is restricted based on the normal class; with ovr all classes are kept.
+            # NOTE(review): presumably get_target_label_idx returns the indices of all samples whose
+            # target is one of the given classes -- confirm in fcdd.datasets.preprocessing.
+            self._test_set = Subset(
+                self._test_set, get_target_label_idx(self._test_set.targets, np.asarray(self.normal_classes))
+            )
+
+    def balance_dataset(self):
+        """
+        Replaces the training set by a subset that contains all nominal samples of the normal class plus
+        equally many randomly drawn (with replacement) anomalous training samples.
+        With :attr:`ovr` the anomalies are drawn from all samples not labeled nominal, otherwise only from those
+        of them that belong to the normal class folder.
+        If there is no anomalous training sample at all, the training set is left as it is.
+        """
+        nominal_mask = (np.asarray(self._train_set.anomaly_labels) == self.nominal_label)
+        nominal_mask = nominal_mask * np.isin(self._train_set.targets, np.asarray(self.normal_classes))
+        anomaly_mask = (np.asarray(self._train_set.anomaly_labels) != self.nominal_label)
+        # multiplying with 1 keeps the mask unchanged in the ovr case
+        anomaly_mask = anomaly_mask * (1 if self.ovr else np.isin(
+            self._train_set.targets, np.asarray(self.normal_classes)
+        ))
+
+        # NOTE(review): on this early return the training set stays the complete, unfiltered ImageFolderDataset,
+        # i.e., it is not restricted to the nominal samples of the normal class -- confirm that this is intended.
+        if anomaly_mask.sum() == 0:
+            return
+
+        self._train_set = Subset(  # randomly pick n_nominal anomalies for a balanced training set
+            self._train_set, np.concatenate([
+                np.argwhere(nominal_mask).flatten().tolist(),
+                np.random.choice(np.argwhere(anomaly_mask).flatten().tolist(), nominal_mask.sum(), replace=True)
+            ])
+        )
+
+    def extract_mean_std(self, path: str, cls: int) -> Tuple[Tuple[float, float, float], Tuple[float, float, float]]:
+        """
+        Computes the mean and standard deviation per channel over all nominal images of class `cls` found in `path`.
+        For this, all those images are resized to the final sample shape, loaded, and kept in memory at once.
+        Requires :attr:`shape`, :attr:`raw_shape`, :attr:`nominal_label`, :attr:`anomalous_label`, and
+        :attr:`outlier_classes` to be set already.
+
+        :param path: path to the image folder (one subfolder per class).
+        :param cls: index of the class whose nominal samples are used.
+        :return: per-channel mean and per-channel standard deviation.
+            NOTE(review): both are the results of Tensor.mean / Tensor.std, i.e., tensors rather than the
+            annotated tuples of floats.
+        """
+        # no normalization here, since its parameters are what is being computed
+        transform = transforms.Compose([
+            transforms.Resize((self.shape[-2], self.shape[-1])),
+            transforms.ToTensor(),
+        ])
+        ds = ImageFolderDataset(
+            path, 'unsupervised', self.raw_shape, self.ovr, self.nominal_label, self.anomalous_label,
+            normal_classes=[cls], transform=transform, target_transform=transforms.Lambda(
+                lambda x: self.anomalous_label if x in self.outlier_classes else self.nominal_label
+            )
+        )
+        # restrict to the samples of class cls that are labeled nominal
+        ds = Subset(
+            ds,
+            np.argwhere(
+                np.isin(ds.targets, np.asarray([cls])) * np.isin(ds.anomaly_labels, np.asarray([self.nominal_label]))
+            ).flatten().tolist()
+        )
+        loader = DataLoader(dataset=ds, batch_size=2, shuffle=False, num_workers=4, pin_memory=True)
+        all_x = []
+        for x, _ in loader:
+            all_x.append(x)
+        all_x = torch.cat(all_x)
+        # assumes batches of shape (n, c, h, w): move channels to the front and flatten the rest, s.t. the
+        # statistics are taken over all pixels of all images per channel
+        return all_x.permute(1, 0, 2, 3).flatten(1).mean(1), all_x.permute(1, 0, 2, 3).flatten(1).std(1)
+
+
+class ImageFolderDataset(ImageFolder):
+    # ImageFolder that additionally keeps one anomaly label per sample (self.anomaly_labels) and
+    # optionally hands samples to an online supervisor (self.all_transform) in __getitem__.
+    def __init__(self, root: str, supervise_mode: str, raw_shape: Tuple[int, int, int], ovr: bool,
+                 nominal_label: int, anomalous_label: int,
+                 transform=None, target_transform=None, normal_classes=None, all_transform=None, ):
+        """
+        :param root: path to the image folder (one subfolder per class).
+        :param supervise_mode: the supervise mode; in __getitem__ it decides whether the actual image or
+            a placeholder is handed to `all_transform`.
+        :param raw_shape: shape (c x h x w) of the placeholder tensor that is handed to `all_transform`.
+        :param ovr: whether anomaly labels are derived from the class index via `target_transform` (True) or
+            from the name of the folder that directly contains the image (False).
+        :param nominal_label: the label that marks nominal samples.
+        :param anomalous_label: the label that marks anomalous samples.
+        :param transform: transformation applied to each image in __getitem__.
+        :param target_transform: maps a class index to an anomaly label; only used if `ovr` is True.
+        :param normal_classes: the classes considered normal (only stored here).
+        :param all_transform: optional online supervisor, see __getitem__.
+        """
+        super().__init__(root, transform=transform, target_transform=target_transform)
+        if ovr:
+            self.anomaly_labels = [self.target_transform(t) for t in self.targets]
+        else:
+            # images lying directly in a folder named 'normal' or 'nominal' (case-insensitive) are nominal,
+            # all others are anomalous
+            self.anomaly_labels = [
+                nominal_label if f.split(os.sep)[-2].lower() in ['normal', 'nominal'] else anomalous_label
+                for f, _ in self.samples
+            ]
+        self.normal_classes = normal_classes
+        self.all_transform = all_transform  # contains the OnlineSupervisor
+        self.supervise_mode = supervise_mode
+        self.raw_shape = torch.Size(raw_shape)
+
+    def __getitem__(self, index: int) -> Tuple[Tensor, int]:
+        """
+        Returns the image and the anomaly label of the sample with the given index.
+        If :attr:`all_transform` is set, the sample is handed to it with a probability of 50%, and the image and
+        label it returns are used instead.
+
+        :param index: index of the sample.
+        :return: tuple of the image (after :attr:`transform`, if set) and its anomaly label.
+        """
+        target = self.anomaly_labels[index]
+
+        if self.target_transform is not None:
+            pass  # already applied since we use self.anomaly_labels instead of self.targets
+
+        if self.all_transform is not None:
+            replace = random.random() < 0.5
+            if replace:
+                if self.supervise_mode not in ['malformed_normal', 'malformed_normal_gt']:
+                    # the image file is not loaded at all, an uninitialized tensor of raw_shape is passed instead.
+                    # NOTE(review): presumably the supervisor only uses its shape and generates the
+                    # anomaly itself -- confirm in OnlineSupervisor.
+                    img, _, target = self.all_transform(
+                        torch.empty(self.raw_shape), None, target, replace=replace
+                    )
+                else:
+                    # malformed_normal modes get the actual image, scaled by 255 and cast to uint8
+                    path, _ = self.samples[index]
+                    img = to_tensor(self.loader(path)).mul(255).byte()
+                    img, _, target = self.all_transform(img, None, target, replace=replace)
+                # back to a PIL image, s.t. self.transform below is applied the same way as for loaded images
+                img = to_pil_image(img)
+            else:
+                path, _ = self.samples[index]
+                img = self.loader(path)
+
+        else:
+            path, _ = self.samples[index]
+            img = self.loader(path)
+
+        if self.transform is not None:
+            img = self.transform(img)
+
+        return img, target