# pytorch-image-models/timm/data/dataset.py

""" Quick n Simple Image Folder, Tarfile based DataSet

Hacked together by / Copyright 2019, Ross Wightman
"""
import io
import logging

import torch
import torch.utils.data as data
from PIL import Image

from .parsers import create_parser

# Module-level logger, named after this module; used to warn about skipped samples.
_logger = logging.getLogger(__name__)


# Number of consecutive sample-load failures at which ImageDataset.__getitem__ stops
# skipping ahead to the next index and re-raises the last error instead.
_ERROR_RETRY = 50


class ImageDataset(data.Dataset):
    """Map-style dataset that reads ``(image, target)`` samples through a parser.

    The parser is indexed like a sequence and must also provide ``filename`` /
    ``filenames``. Each item it returns is a pair whose first element is either
    read as raw bytes (``load_bytes=True``) or handed to ``PIL.Image.open``.

    Args:
        root: Forwarded to ``create_parser`` when a parser has to be built.
        parser: ``None`` or a string to build one via ``create_parser``; any
            other object is used directly as the parser.
        split: Forwarded to ``create_parser`` when a parser has to be built.
        class_map: Forwarded to ``create_parser`` when a parser has to be built.
        load_bytes: Return the sample's raw ``read()`` result instead of a PIL image.
        img_mode: Mode passed to ``Image.convert``; a falsy value skips conversion.
        transform: Optional callable applied to the loaded image (or bytes).
        target_transform: Optional callable applied to targets that are not ``None``.
    """

    def __init__(
            self,
            root,
            parser=None,
            split='train',
            class_map=None,
            load_bytes=False,
            img_mode='RGB',
            transform=None,
            target_transform=None,
    ):
        # A missing parser or a parser name goes through the factory; a ready
        # parser object is stored untouched.
        must_build = parser is None or isinstance(parser, str)
        if must_build:
            parser_name = parser or ''
            parser = create_parser(parser_name, root=root, split=split, class_map=class_map)
        self.parser = parser
        self.load_bytes = load_bytes
        self.img_mode = img_mode
        self.transform = transform
        self.target_transform = target_transform
        # Running count of back-to-back load failures, reset on every success.
        self._consecutive_errors = 0

    def __getitem__(self, index):
        """Load the sample at ``index``, skipping forward past unreadable ones.

        Only failures raised by ``read()`` / ``Image.open`` are caught here;
        errors from ``convert`` or the transforms propagate to the caller.

        Returns:
            ``(img, target)`` where ``target`` is ``-1`` if the parser gave ``None``.

        Raises:
            Exception: The last load error once ``_ERROR_RETRY`` consecutive
                failures have accumulated.
        """
        sample, label = self.parser[index]

        try:
            if self.load_bytes:
                sample = sample.read()
            else:
                sample = Image.open(sample)
        except Exception as e:
            _logger.warning(f'Skipped sample (index {index}, file {self.parser.filename(index)}). {str(e)}')
            self._consecutive_errors += 1
            if self._consecutive_errors >= _ERROR_RETRY:
                raise e
            # Try the following sample instead, wrapping around at the end.
            following = (index + 1) % len(self.parser)
            return self.__getitem__(following)
        self._consecutive_errors = 0

        # Mode conversion only makes sense for decoded PIL images.
        if not self.load_bytes and self.img_mode:
            sample = sample.convert(self.img_mode)
        if self.transform is not None:
            sample = self.transform(sample)

        # Missing targets become -1 and bypass the target transform.
        if label is None:
            return sample, -1
        if self.target_transform is not None:
            label = self.target_transform(label)
        return sample, label

    def __len__(self):
        """Return the number of samples reported by the parser."""
        return len(self.parser)

    def filename(self, index, basename=False, absolute=False):
        """Delegate a single filename lookup to the parser."""
        return self.parser.filename(index, basename, absolute)

    def filenames(self, basename=False, absolute=False):
        """Delegate the full filename listing to the parser."""
        return self.parser.filenames(basename, absolute)


class IterableImageDataset(data.IterableDataset):
    """Iterable-style dataset that streams ``(image, target)`` pairs from a parser.

    Args:
        root: Forwarded to ``create_parser`` when ``parser`` is a string.
        parser: Required. A parser name string (resolved through
            ``create_parser``) or an already-built iterable parser, used as-is.
        split: Forwarded to ``create_parser`` when ``parser`` is a string.
        is_training: Forwarded to ``create_parser`` when ``parser`` is a string.
        batch_size: Forwarded to ``create_parser`` when ``parser`` is a string.
        repeats: Forwarded to ``create_parser`` when ``parser`` is a string.
        download: Forwarded to ``create_parser`` when ``parser`` is a string.
        transform: Optional callable applied to every image yielded by the parser.
        target_transform: Optional callable applied to every target yielded.

    Raises:
        AssertionError: If ``parser`` is ``None``.
    """

    def __init__(
            self,
            root,
            parser=None,
            split='train',
            is_training=False,
            batch_size=None,
            repeats=0,
            download=False,
            transform=None,
            target_transform=None,
    ):
        # Raised explicitly (rather than via ``assert``) so the check is not
        # stripped when Python runs with -O; the exception type is unchanged.
        if parser is None:
            raise AssertionError('A parser (name or instance) is required for IterableImageDataset.')
        if isinstance(parser, str):
            self.parser = create_parser(
                parser,
                root=root,
                split=split,
                is_training=is_training,
                batch_size=batch_size,
                repeats=repeats,
                download=download,
            )
        else:
            self.parser = parser
        self.transform = transform
        self.target_transform = target_transform
        # Not read anywhere in this class; kept so the attribute remains available.
        self._consecutive_errors = 0

    def __iter__(self):
        """Yield ``(img, target)`` pairs from the parser with the transforms applied."""
        for img, target in self.parser:
            if self.transform is not None:
                img = self.transform(img)
            if self.target_transform is not None:
                target = self.target_transform(target)
            yield img, target

    def __len__(self):
        """Return the parser's length, or ``0`` when the parser defines no ``__len__``."""
        if hasattr(self.parser, '__len__'):
            return len(self.parser)
        else:
            return 0

    def filename(self, index, basename=False, absolute=False):
        """Unsupported for iterable datasets; always raises.

        Raises:
            AssertionError: Always. Use ``filenames()`` instead.
        """
        # Explicit raise so the failure also happens under -O, where an
        # ``assert False`` would be removed and this method would return None.
        raise AssertionError('Filename lookup by index not supported, use filenames().')

    def filenames(self, basename=False, absolute=False):
        """Delegate the full filename listing to the parser."""
        return self.parser.filenames(basename, absolute)


class AugMixDataset(torch.utils.data.Dataset):
    """Dataset wrapper to perform AugMix or other clean/augmentation mixes

    Wraps a dataset exposing a ``transform`` attribute. A 3-element list/tuple
    of transforms is split up as: element 0 becomes the wrapped dataset's own
    transform, element 1 is the augmentation applied to the extra splits, and
    element 2 is the normalization applied to every split.

    Args:
        dataset: Indexable dataset with a ``transform`` attribute. If that
            attribute is not ``None`` at construction it must already be a
            3-element list/tuple and is split up as described above.
        num_splits: Total number of views returned per sample (one clean view
            plus ``num_splits - 1`` augmented views).
    """

    def __init__(self, dataset, num_splits=2):
        self.augmentation = None
        self.normalize = None
        self.dataset = dataset
        if self.dataset.transform is not None:
            self._set_transforms(self.dataset.transform)
        self.num_splits = num_splits

    def _set_transforms(self, x):
        """Distribute a 3-element transform sequence across dataset / augmentation / normalize.

        Raises:
            AssertionError: If ``x`` is not a list/tuple of exactly three items.
        """
        # Explicit raise instead of ``assert`` so the validation still runs under
        # ``python -O``; the exception type and message are unchanged.
        if not (isinstance(x, (list, tuple)) and len(x) == 3):
            raise AssertionError('Expecting a tuple/list of 3 transforms')
        self.dataset.transform = x[0]
        self.augmentation = x[1]
        self.normalize = x[2]

    @property
    def transform(self):
        """The wrapped dataset's base transform."""
        return self.dataset.transform

    @transform.setter
    def transform(self, x):
        self._set_transforms(x)

    def _normalize(self, x):
        """Apply the normalization transform, or pass ``x`` through when none is set."""
        return x if self.normalize is None else self.normalize(x)

    def __getitem__(self, i):
        """Return ``(views, target)`` where ``views`` is a tuple of ``num_splits`` items.

        Note that ``self.augmentation`` is called unconditionally for the extra
        splits, so it must have been set whenever ``num_splits > 1``.
        """
        x, y = self.dataset[i]  # all splits share the same dataset base transform
        x_list = [self._normalize(x)]  # first split only normalizes (this is the 'clean' split)
        # run the full augmentation on the remaining splits
        for _ in range(self.num_splits - 1):
            x_list.append(self._normalize(self.augmentation(x)))
        return tuple(x_list), y

    def __len__(self):
        """Return the length of the wrapped dataset."""
        return len(self.dataset)
Fix some attributions, add copyrights to some file docstrings 4 years ago			`""" Quick n Simple Image Folder, Tarfile based DataSet`

Fix MobileNetV2 head conv size for multiplier < 1.0. Add some missing modification copyrights, fix starting date of some old ones. 3 years ago			`Hacked together by / Copyright 2019, Ross Wightman`
Fix some attributions, add copyrights to some file docstrings 4 years ago			`"""`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`import io`
More work on dataset / parser split and imagenet21k (tar) support 4 years ago			`import logging`
Initial commit, puting some ol pieces together 6 years ago
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`import torch`
			`import torch.utils.data as data`
More work on dataset / parser split and imagenet21k (tar) support 4 years ago			`from PIL import Image`

More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`from .parsers import create_parser`
More work on dataset / parser split and imagenet21k (tar) support 4 years ago
			`_logger = logging.getLogger(__name__)`


			`_ERROR_RETRY = 50`
Add support to Dataset for class id mapping file, clean up a bit of old logic. Add results file arg for validation and update script. 5 years ago

Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`class ImageDataset(data.Dataset):`
Initial commit, puting some ol pieces together 6 years ago
			`def __init__(`
			`self,`
More work on dataset / parser split and imagenet21k (tar) support 4 years ago			`root,`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`parser=None,`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`split='train',`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`class_map=None,`
Ported Tensorflow pretrained EfficientNet weights and some model cleanup * B0-B3 weights ported from TF with close to paper accuracy * Renamed gen_mobilenet to gen_efficientnet since scaling params go well beyond 'mobile' specific * Add Tensorflow preprocessing option for closer images to source repo 6 years ago			`load_bytes=False,`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`img_mode='RGB',`
Add support to Dataset for class id mapping file, clean up a bit of old logic. Add results file arg for validation and update script. 5 years ago			`transform=None,`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`target_transform=None,`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`):`
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`if parser is None or isinstance(parser, str):`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`parser = create_parser(`
			`parser or '',`
			`root=root,`
			`split=split,`
			`class_map=class_map`
			`)`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`self.parser = parser`
Ported Tensorflow pretrained EfficientNet weights and some model cleanup * B0-B3 weights ported from TF with close to paper accuracy * Renamed gen_mobilenet to gen_efficientnet since scaling params go well beyond 'mobile' specific * Add Tensorflow preprocessing option for closer images to source repo 6 years ago			`self.load_bytes = load_bytes`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`self.img_mode = img_mode`
Initial commit, puting some ol pieces together 6 years ago			`self.transform = transform`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`self.target_transform = target_transform`
More work on dataset / parser split and imagenet21k (tar) support 4 years ago			`self._consecutive_errors = 0`
Initial commit, puting some ol pieces together 6 years ago
			`def __getitem__(self, index):`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`img, target = self.parser[index]`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago
More work on dataset / parser split and imagenet21k (tar) support 4 years ago			`try:`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`img = img.read() if self.load_bytes else Image.open(img)`
More work on dataset / parser split and imagenet21k (tar) support 4 years ago			`except Exception as e:`
			`_logger.warning(f'Skipped sample (index {index}, file {self.parser.filename(index)}). {str(e)}')`
			`self._consecutive_errors += 1`
			`if self._consecutive_errors < _ERROR_RETRY:`
			`return self.__getitem__((index + 1) % len(self.parser))`
			`else:`
			`raise e`
			`self._consecutive_errors = 0`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago
			`if self.img_mode and not self.load_bytes:`
			`img = img.convert(self.img_mode)`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`if self.transform is not None:`
			`img = self.transform(img)`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago
Initial commit, puting some ol pieces together 6 years ago			`if target is None:`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`target = -1`
			`elif self.target_transform is not None:`
			`target = self.target_transform(target)`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago
Initial commit, puting some ol pieces together 6 years ago			`return img, target`

			`def __len__(self):`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`return len(self.parser)`
Initial commit, puting some ol pieces together 6 years ago
More models in sotabench, more control over sotabench run, dataset filename extraction consistency 4 years ago			`def filename(self, index, basename=False, absolute=False):`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`return self.parser.filename(index, basename, absolute)`
More models in sotabench, more control over sotabench run, dataset filename extraction consistency 4 years ago
			`def filenames(self, basename=False, absolute=False):`
Initial commit for dataset / parser reorg to support additional datasets / types 4 years ago			`return self.parser.filenames(basename, absolute)`
More models in sotabench, more control over sotabench run, dataset filename extraction consistency 4 years ago
Working on an implementation of AugMix with JensenShannonDivergence loss that's compatible with my AutoAugment and RandAugment impl 5 years ago
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`class IterableImageDataset(data.IterableDataset):`

			`def __init__(`
			`self,`
			`root,`
			`parser=None,`
			`split='train',`
			`is_training=False,`
			`batch_size=None,`
Add epoch-repeats arg to multiply the number of dataset passes per epoch. Currently for iterable datasets (read TFDS wrapper) only. 4 years ago			`repeats=0,`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`download=False,`
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`transform=None,`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`target_transform=None,`
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`):`
			`assert parser is not None`
			`if isinstance(parser, str):`
			`self.parser = create_parser(`
Refactor device handling in scripts, distributed init to be less 'cuda' centric. More device args passed through where needed. 2 years ago			`parser,`
			`root=root,`
			`split=split,`
			`is_training=is_training,`
			`batch_size=batch_size,`
			`repeats=repeats,`
			`download=download,`
			`)`
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`else:`
			`self.parser = parser`
			`self.transform = transform`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`self.target_transform = target_transform`
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`self._consecutive_errors = 0`

			`def __iter__(self):`
			`for img, target in self.parser:`
			`if self.transform is not None:`
			`img = self.transform(img)`
Dataset work * support some torchvision datasets * improvements to TFDS wrapper for subsplit handling (fix #942), shuffle seed * add class-map support to train (fix #957) 3 years ago			`if self.target_transform is not None:`
			`target = self.target_transform(target)`
More dataset work including factories and a tensorflow datasets (TFDS) wrapper * Add parser/dataset factory methods for more flexible dataset & parser creation * Add dataset parser that wraps TFDS image classification datasets * Tweak num_classes handling bug for 21k models * Add initial deit models so they can be benchmarked in next csv results runs 4 years ago			`yield img, target`

			`def __len__(self):`
			`if hasattr(self.parser, '__len__'):`
			`return len(self.parser)`
			`else:`
			`return 0`

			`def filename(self, index, basename=False, absolute=False):`
			`assert False, 'Filename lookup by index not supported, use filenames().'`

			`def filenames(self, basename=False, absolute=False):`
			`return self.parser.filenames(basename, absolute)`


Working on an implementation of AugMix with JensenShannonDivergence loss that's compatible with my AutoAugment and RandAugment impl 5 years ago			`class AugMixDataset(torch.utils.data.Dataset):`
			`"""Dataset wrapper to perform AugMix or other clean/augmentation mixes"""`

Add SplitBatchNorm. AugMix, Rand/AutoAugment, Split (Aux) BatchNorm, Jensen-Shannon Divergence, RandomErasing all working together 5 years ago			`def __init__(self, dataset, num_splits=2):`
Working on an implementation of AugMix with JensenShannonDivergence loss that's compatible with my AutoAugment and RandAugment impl 5 years ago			`self.augmentation = None`
			`self.normalize = None`
			`self.dataset = dataset`
			`if self.dataset.transform is not None:`
			`self._set_transforms(self.dataset.transform)`
Add SplitBatchNorm. AugMix, Rand/AutoAugment, Split (Aux) BatchNorm, Jensen-Shannon Divergence, RandomErasing all working together 5 years ago			`self.num_splits = num_splits`
Working on an implementation of AugMix with JensenShannonDivergence loss that's compatible with my AutoAugment and RandAugment impl 5 years ago
			`def _set_transforms(self, x):`
			`assert isinstance(x, (list, tuple)) and len(x) == 3, 'Expecting a tuple/list of 3 transforms'`
			`self.dataset.transform = x[0]`
			`self.augmentation = x[1]`
			`self.normalize = x[2]`

			`@property`
			`def transform(self):`
			`return self.dataset.transform`

			`@transform.setter`
			`def transform(self, x):`
			`self._set_transforms(x)`

			`def _normalize(self, x):`
			`return x if self.normalize is None else self.normalize(x)`

			`def __getitem__(self, i):`
Add SplitBatchNorm. AugMix, Rand/AutoAugment, Split (Aux) BatchNorm, Jensen-Shannon Divergence, RandomErasing all working together 5 years ago			`x, y = self.dataset[i] # all splits share the same dataset base transform`
			`x_list = [self._normalize(x)] # first split only normalizes (this is the 'clean' split)`
			`# run the full augmentation on the remaining splits`
			`for _ in range(self.num_splits - 1):`
Working on an implementation of AugMix with JensenShannonDivergence loss that's compatible with my AutoAugment and RandAugment impl 5 years ago			`x_list.append(self._normalize(self.augmentation(x)))`
			`return tuple(x_list), y`

			`def __len__(self):`
			`return len(self.dataset)`