pytorch-image-models/timm/data/loader.py

""" Loader Factory, Fast Collate, CUDA Prefetcher
Prefetcher and Fast Collate inspired by NVIDIA APEX example at
https://github.com/NVIDIA/apex/commit/d5e2bb4bdeedd27b1dfaf5bb2b24d6c000dee9be#diff-cf86c282ff7fba81fad27a559379d5bf
Hacked together by / Copyright 2020 Ross Wightman
"""
import torch.utils.data
from timm.bits import get_device, DeviceEnvType
from .fetcher import Fetcher
from .prefetcher_cuda import PrefetcherCuda
from .collate import fast_collate
from .transforms_factory import create_transform
from .constants import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD
from .distributed_sampler import OrderedDistributedSampler


def create_loader(
        dataset,
        input_size,
        batch_size,
        is_training=False,
        dev_env=None,
        no_aug=False,
        re_prob=0.,
        re_mode='const',
        re_count=1,
        re_split=False,
        scale=None,
        ratio=None,
        hflip=0.5,
        vflip=0.,
        color_jitter=0.4,
        auto_augment=None,
        num_aug_splits=0,
        interpolation='bilinear',
        mean=IMAGENET_DEFAULT_MEAN,
        std=IMAGENET_DEFAULT_STD,
        num_workers=1,
        crop_pct=None,
        collate_fn=None,
        pin_memory=False,
        tf_preprocessing=False,
        use_multi_epochs_loader=False,
        persistent_workers=True,
):
    re_num_splits = 0
    if re_split:
        # apply RE to second half of batch if no aug split otherwise line up with aug split
        re_num_splits = num_aug_splits or 2
    dataset.transform = create_transform(
        input_size,
        is_training=is_training,
        use_fetcher=True,
        no_aug=no_aug,
        scale=scale,
        ratio=ratio,
        hflip=hflip,
        vflip=vflip,
        color_jitter=color_jitter,
        auto_augment=auto_augment,
        interpolation=interpolation,
        mean=mean,
        std=std,
        crop_pct=crop_pct,
        tf_preprocessing=tf_preprocessing,
        re_prob=re_prob,
        re_mode=re_mode,
        re_count=re_count,
        re_num_splits=re_num_splits,
        separate=num_aug_splits > 0,
    )

    if dev_env is None:
        dev_env = get_device()

    sampler = None
    if dev_env.distributed and not isinstance(dataset, torch.utils.data.IterableDataset):
        if is_training:
            sampler = torch.utils.data.distributed.DistributedSampler(
                dataset, num_replicas=dev_env.world_size, rank=dev_env.global_rank)
        else:
            # This will add extra duplicate entries to result in equal num
            # of samples per-process, will slightly alter validation results
            sampler = OrderedDistributedSampler(dataset, num_replicas=dev_env.world_size, rank=dev_env.global_rank)

    if collate_fn is None:
        collate_fn = fast_collate

    loader_class = torch.utils.data.DataLoader
    if use_multi_epochs_loader:
        loader_class = MultiEpochsDataLoader

    loader_args = dict(
        batch_size=batch_size,
        shuffle=not isinstance(dataset, torch.utils.data.IterableDataset) and sampler is None and is_training,
        num_workers=num_workers,
        sampler=sampler,
        collate_fn=collate_fn,
        pin_memory=pin_memory,
        drop_last=is_training,
        persistent_workers=persistent_workers)
    try:
        loader = loader_class(dataset, **loader_args)
    except TypeError:
        loader_args.pop('persistent_workers')  # only in PyTorch 1.7+
        loader = loader_class(dataset, **loader_args)

    fetcher_kwargs = dict(
        mean=mean,
        std=std,
        re_prob=re_prob if is_training and not no_aug else 0.,
        re_mode=re_mode,
        re_count=re_count,
        re_num_splits=re_num_splits,
    )
    if dev_env.type_cuda:
        loader = PrefetcherCuda(loader, **fetcher_kwargs)
    else:
        loader = Fetcher(loader, device=dev_env.device, **fetcher_kwargs)

    return loader
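

# Illustrative usage (a sketch, not part of the original file): assuming an
# ImageDataset from timm.data and whatever device environment get_device()
# resolves, create_loader wires up the transforms, sampler, collate function
# and the on-device fetcher in one call:
#
#     from timm.data import ImageDataset
#
#     dataset = ImageDataset('/path/to/imagenet/train')
#     loader = create_loader(
#         dataset,
#         input_size=(3, 224, 224),
#         batch_size=128,
#         is_training=True,
#         num_workers=4,
#         pin_memory=True,
#     )
#     for images, targets in loader:
#         ...  # batches arrive on-device, normalized by Fetcher / PrefetcherCuda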


class MultiEpochsDataLoader(torch.utils.data.DataLoader):

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        # Temporarily clear the (name-mangled) DataLoader initialized flag so the
        # batch_sampler can be swapped for a repeating one after __init__ has run.
        self._DataLoader__initialized = False
        self.batch_sampler = _RepeatSampler(self.batch_sampler)
        self._DataLoader__initialized = True
        self.iterator = super().__iter__()

    def __len__(self):
        return len(self.batch_sampler.sampler)

    def __iter__(self):
        for i in range(len(self)):
            yield next(self.iterator)


class _RepeatSampler(object):
    """ Sampler that repeats forever.

    Args:
        sampler (Sampler)
    """

    def __init__(self, sampler):
        self.sampler = sampler

    def __iter__(self):
        while True:
            yield from iter(self.sampler)
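

# Illustrative note (a sketch, not part of the original file): MultiEpochsDataLoader
# wraps its batch_sampler in _RepeatSampler so the worker iterator is created once
# and reused, avoiding worker startup cost at every epoch boundary. Assuming the
# same hypothetical `dataset` as in the sketch above, it is selected through the
# factory with use_multi_epochs_loader=True:
#
#     loader = create_loader(
#         dataset,
#         input_size=(3, 224, 224),
#         batch_size=128,
#         is_training=True,
#         num_workers=4,
#         use_multi_epochs_loader=True,
#     )
#     for epoch in range(10):
#         for images, targets in loader:  # workers persist across epochs
#             ...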