pytorch-image-models/timm/data/loader.py

import torch.utils.data
from .transforms import *
from .distributed_sampler import OrderedDistributedSampler
from .mixup import FastCollateMixup


def fast_collate(batch):
    """Collate ``(image, label, ...)`` samples into one uint8 batch plus int64 targets.

    Args:
        batch: indexable sequence of samples. ``sample[0]`` is the image, given
            either as a NumPy array or as a ``torch.Tensor``; ``sample[1]`` is
            the label. All images must share the shape of the first image.

    Returns:
        Tuple ``(tensor, targets)`` where ``tensor`` is a ``torch.uint8`` tensor
        of shape ``(len(batch), *image.shape)`` and ``targets`` is a
        ``torch.int64`` tensor holding the labels in batch order.
    """
    targets = torch.tensor([sample[1] for sample in batch], dtype=torch.int64)
    batch_size = len(targets)
    tensor = torch.zeros((batch_size, *batch[0][0].shape), dtype=torch.uint8)
    for i in range(batch_size):
        image = batch[i][0]
        # torch.from_numpy() only accepts ndarrays; samples that are already
        # tensors are used directly instead of raising a TypeError.
        if not isinstance(image, torch.Tensor):
            image = torch.from_numpy(image)
        # The destination row starts zeroed, so the in-place add fills it
        # with the image values.
        tensor[i] += image

    return tensor, targets


class PrefetchLoader:
    """Wrap a loader so each batch is moved to the GPU and normalized one step ahead.

    While the consumer works on the batch that was just yielded, the next
    batch is copied to the GPU (``non_blocking=True``), cast to float/half,
    normalized with ``mean``/``std`` and optionally passed through
    ``RandomErasing`` on a separate CUDA stream.

    Args:
        loader: iterable yielding ``(input, target)`` pairs of tensors; it must
            also expose ``sampler``, ``dataset`` and ``collate_fn`` for the
            pass-through properties below.
        rand_erase_prob: probability handed to ``RandomErasing``; a value
            ``<= 0`` disables random erasing entirely.
        rand_erase_mode: ``mode`` argument forwarded to ``RandomErasing``.
        rand_erase_count: ``max_count`` argument forwarded to ``RandomErasing``.
        mean: per-channel mean; multiplied by 255 before use.
            NOTE(review): the 255 scaling suggests inputs are expected in the
            0-255 range (as produced by ``fast_collate``) -- confirm for
            custom collate functions.
        std: per-channel standard deviation; multiplied by 255 before use.
        fp16: if true, inputs and normalization constants are converted to
            half precision instead of float32.
    """

    def __init__(self,
            loader,
            rand_erase_prob=0.,
            rand_erase_mode='const',
            rand_erase_count=1,
            mean=IMAGENET_DEFAULT_MEAN,
            std=IMAGENET_DEFAULT_STD,
            fp16=False):
        self.loader = loader
        # Shape (1, C, 1, 1) so the constants broadcast over a batch whose
        # channel axis is dim 1. ``-1`` keeps the usual 3-channel case
        # unchanged while also accepting other channel counts.
        self.mean = torch.tensor([x * 255 for x in mean]).cuda().view(1, -1, 1, 1)
        self.std = torch.tensor([x * 255 for x in std]).cuda().view(1, -1, 1, 1)
        self.fp16 = fp16
        if fp16:
            self.mean = self.mean.half()
            self.std = self.std.half()
        if rand_erase_prob > 0.:
            self.random_erasing = RandomErasing(
                probability=rand_erase_prob, mode=rand_erase_mode, max_count=rand_erase_count)
        else:
            self.random_erasing = None

    def __iter__(self):
        """Yield ``(input, target)`` GPU batches, preparing the next one in the background.

        Yields nothing when the wrapped loader is empty.
        """
        stream = torch.cuda.Stream()
        # Batch that has been prepared but not yet handed to the consumer.
        pending = None

        for next_input, next_target in self.loader:
            # Queue the copy and preprocessing of the upcoming batch on the
            # side stream.
            with torch.cuda.stream(stream):
                next_input = next_input.cuda(non_blocking=True)
                next_target = next_target.cuda(non_blocking=True)
                next_input = next_input.half() if self.fp16 else next_input.float()
                next_input = next_input.sub_(self.mean).div_(self.std)
                if self.random_erasing is not None:
                    next_input = self.random_erasing(next_input)

            # Hand out the previously prepared batch (none on the first pass).
            if pending is not None:
                yield pending

            # The current stream must not use the new batch before the side
            # stream has finished producing it.
            torch.cuda.current_stream().wait_stream(stream)
            pending = (next_input, next_target)

        # Flush the last prepared batch; skipped for an empty loader, which
        # previously raised UnboundLocalError here.
        if pending is not None:
            yield pending

    def __len__(self):
        """Return the number of batches of the wrapped loader."""
        return len(self.loader)

    @property
    def sampler(self):
        """Sampler of the wrapped loader."""
        return self.loader.sampler

    @property
    def dataset(self):
        """Dataset of the wrapped loader."""
        return self.loader.dataset

    @property
    def mixup_enabled(self):
        """Mixup flag of the collate function; ``False`` unless it is a ``FastCollateMixup``."""
        if isinstance(self.loader.collate_fn, FastCollateMixup):
            return self.loader.collate_fn.mixup_enabled
        else:
            return False

    @mixup_enabled.setter
    def mixup_enabled(self, x):
        # Silently ignored when the collate function is not a FastCollateMixup.
        if isinstance(self.loader.collate_fn, FastCollateMixup):
            self.loader.collate_fn.mixup_enabled = x


def create_transform(
        input_size,
        is_training=False,
        use_prefetcher=False,
        color_jitter=0.4,
        interpolation='bilinear',
        mean=IMAGENET_DEFAULT_MEAN,
        std=IMAGENET_DEFAULT_STD,
        crop_pct=None,
        tf_preprocessing=False,
        auto_augment=True):
    """Build the image transform for training or evaluation.

    Args:
        input_size: image size, or a tuple/list whose last two entries are
            used as the image size (e.g. a ``(C, H, W)`` style shape).
        is_training: select a training transform instead of the eval one.
        use_prefetcher: forwarded to the transform factories; also required
            for ``tf_preprocessing`` to take effect.
        color_jitter: forwarded to ``transforms_imagenet_train``; only used
            when ``is_training`` is true and ``auto_augment`` is false.
        interpolation: interpolation mode forwarded to the selected transform.
        mean: forwarded to the ``transforms_imagenet_*`` factories.
        std: forwarded to the ``transforms_imagenet_*`` factories.
        crop_pct: forwarded to ``transforms_imagenet_eval`` only.
        tf_preprocessing: use ``TfPreprocessTransform``, but only when
            ``use_prefetcher`` is also true.
        auto_augment: when training, pick ``transforms_imagenet_aa`` (true,
            the default and the previously hard-wired behaviour) or
            ``transforms_imagenet_train`` (false).

    Returns:
        The transform object created by the selected factory.
    """
    # Accept lists as well as tuples (sizes read from config files are often
    # lists); keep only the trailing two dimensions.
    if isinstance(input_size, (tuple, list)):
        img_size = input_size[-2:]
    else:
        img_size = input_size

    if tf_preprocessing and use_prefetcher:
        # Imported lazily so the TF preprocessing module is only loaded when
        # this path is actually requested.
        from timm.data.tf_preprocessing import TfPreprocessTransform
        return TfPreprocessTransform(
            is_training=is_training, size=img_size, interpolation=interpolation)

    if not is_training:
        return transforms_imagenet_eval(
            img_size,
            interpolation=interpolation,
            use_prefetcher=use_prefetcher,
            mean=mean,
            std=std,
            crop_pct=crop_pct)

    if auto_augment:
        return transforms_imagenet_aa(
            img_size,
            interpolation=interpolation,
            use_prefetcher=use_prefetcher,
            mean=mean,
            std=std)

    # Previously unreachable behind ``if True:``; now selectable through
    # ``auto_augment=False``.
    return transforms_imagenet_train(
        img_size,
        color_jitter=color_jitter,
        interpolation=interpolation,
        use_prefetcher=use_prefetcher,
        mean=mean,
        std=std)


def create_loader(
        dataset,
        input_size,
        batch_size,
        is_training=False,
        use_prefetcher=True,
        rand_erase_prob=0.,
        rand_erase_mode='const',
        rand_erase_count=1,
        color_jitter=0.4,
        interpolation='bilinear',
        mean=IMAGENET_DEFAULT_MEAN,
        std=IMAGENET_DEFAULT_STD,
        num_workers=1,
        distributed=False,
        crop_pct=None,
        collate_fn=None,
        fp16=False,
        tf_preprocessing=False,
):
    """Attach a transform to ``dataset`` and wrap it in a (prefetching) data loader.

    The dataset is modified in place: its ``transform`` attribute is replaced
    by the result of ``create_transform``.

    Args:
        dataset: dataset to load from; receives a new ``transform`` attribute.
        input_size, color_jitter, interpolation, crop_pct, tf_preprocessing:
            forwarded to ``create_transform``.
        batch_size: batch size passed to the ``DataLoader``.
        is_training: enables shuffling (when no sampler is used), dropping of
            the last incomplete batch, and random erasing in the prefetcher.
        use_prefetcher: wrap the loader in ``PrefetchLoader`` and default the
            collate function to ``fast_collate``.
        rand_erase_prob, rand_erase_mode, rand_erase_count: random erasing
            settings for ``PrefetchLoader``; the probability is forced to 0
            when not training.
        mean, std: normalization statistics for the transform and prefetcher.
        num_workers: worker count passed to the ``DataLoader``.
        distributed: use a distributed sampler.
        collate_fn: explicit collate function; chosen automatically if ``None``.
        fp16: forwarded to ``PrefetchLoader``.

    Returns:
        A ``PrefetchLoader`` when ``use_prefetcher`` is true, otherwise the
        plain ``torch.utils.data.DataLoader``.
    """
    transform = create_transform(
        input_size,
        is_training=is_training,
        use_prefetcher=use_prefetcher,
        color_jitter=color_jitter,
        interpolation=interpolation,
        mean=mean,
        std=std,
        crop_pct=crop_pct,
        tf_preprocessing=tf_preprocessing,
    )
    dataset.transform = transform

    if not distributed:
        sampler = None
    elif is_training:
        sampler = torch.utils.data.distributed.DistributedSampler(dataset)
    else:
        # This will add extra duplicate entries to result in equal num
        # of samples per-process, will slightly alter validation results
        sampler = OrderedDistributedSampler(dataset)

    if collate_fn is None:
        if use_prefetcher:
            collate_fn = fast_collate
        else:
            collate_fn = torch.utils.data.dataloader.default_collate

    # Shuffling is only requested when no sampler is in use.
    shuffle = is_training if sampler is None else False

    base_loader = torch.utils.data.DataLoader(
        dataset,
        batch_size=batch_size,
        shuffle=shuffle,
        num_workers=num_workers,
        sampler=sampler,
        collate_fn=collate_fn,
        drop_last=is_training,
    )
    if not use_prefetcher:
        return base_loader

    # Random erasing is a training-only augmentation.
    erase_prob = rand_erase_prob if is_training else 0.
    return PrefetchLoader(
        base_loader,
        rand_erase_prob=erase_prob,
        rand_erase_mode=rand_erase_mode,
        rand_erase_count=rand_erase_count,
        mean=mean,
        std=std,
        fp16=fp16)
Loader tweaks 6 years ago			`import torch.utils.data`
Big re-org, working towards making pip/module as 'timm' 5 years ago			`from .transforms import *`
			`from .distributed_sampler import OrderedDistributedSampler`
			`from .mixup import FastCollateMixup`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago

			`def fast_collate(batch):`
			`targets = torch.tensor([b[1] for b in batch], dtype=torch.int64)`
			`batch_size = len(targets)`
			`tensor = torch.zeros((batch_size, *batch[0][0].shape), dtype=torch.uint8)`
			`for i in range(batch_size):`
			`tensor[i] += torch.from_numpy(batch[i][0])`

			`return tensor, targets`


			`class PrefetchLoader:`

			`def __init__(self,`
			`loader,`
Random erasing crash fix and args pass through 6 years ago			`rand_erase_prob=0.,`
Change args for RandomErasing so only one required for pixel/color mode 6 years ago			`rand_erase_mode='const',`
Add support to split random erasing blocks into randomly selected number with --recount arg. Fix random selection of aspect ratios. 5 years ago			`rand_erase_count=1,`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`mean=IMAGENET_DEFAULT_MEAN,`
Add explicit half/fp16 support to loader and validation script 5 years ago			`std=IMAGENET_DEFAULT_STD,`
			`fp16=False):`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago			`self.loader = loader`
			`self.mean = torch.tensor([x * 255 for x in mean]).cuda().view(1, 3, 1, 1)`
			`self.std = torch.tensor([x * 255 for x in std]).cuda().view(1, 3, 1, 1)`
Add explicit half/fp16 support to loader and validation script 5 years ago			`self.fp16 = fp16`
			`if fp16:`
			`self.mean = self.mean.half()`
			`self.std = self.std.half()`
Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`if rand_erase_prob > 0.:`
Some transform/data/loader refactoring, hopefully didn't break things * factor out data related constants to own file * move data related config helpers to own file * add a variant of RandomResizeCrop that randomizes interpolation method * remove old Numpy version of RandomErasing * cleanup torch version of RandomErasing and use it in either GPU loader batch mode or single image cpu Transform 6 years ago			`self.random_erasing = RandomErasing(`
Add support to split random erasing blocks into randomly selected number with --recount arg. Fix random selection of aspect ratios. 5 years ago			`probability=rand_erase_prob, mode=rand_erase_mode, max_count=rand_erase_count)`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago			`else:`
			`self.random_erasing = None`

			`def __iter__(self):`
Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`stream = torch.cuda.Stream()`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago			`first = True`

			`for next_input, next_target in self.loader:`
Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`with torch.cuda.stream(stream):`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago			`next_input = next_input.cuda(non_blocking=True)`
			`next_target = next_target.cuda(non_blocking=True)`
Add explicit half/fp16 support to loader and validation script 5 years ago			`if self.fp16:`
			`next_input = next_input.half().sub_(self.mean).div_(self.std)`
			`else:`
			`next_input = next_input.float().sub_(self.mean).div_(self.std)`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago			`if self.random_erasing is not None:`
			`next_input = self.random_erasing(next_input)`

			`if not first:`
			`yield input, target`
			`else:`
			`first = False`

Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`torch.cuda.current_stream().wait_stream(stream)`
Add some Nvidia performance enhancements (prefetch loader, fast collate), and refactor some of training and model fact/transforms 6 years ago			`input = next_input`
			`target = next_target`

			`yield input, target`

			`def __len__(self):`
			`return len(self.loader)`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago
Distributed (multi-process) train, multi-gpu single process train, and NVIDIA AMP support 6 years ago			`@property`
			`def sampler(self):`
			`return self.loader.sampler`

dataset not passed through PrefetchLoader for inference script. Fix #10 * also, make top5 configurable for lower class count cases 5 years ago			`@property`
			`def dataset(self):`
			`return self.loader.dataset`

Mixup and prefetcher improvements * Do mixup in custom collate fn if prefetcher enabled, reduces performance impact * Move mixup code to own file * Add arg to disable prefetcher * Fix no cuda transfer when prefetcher off * Random erasing when prefetcher off wasn't changed to match new args, fixed * Default random erasing to off (prob = 0.) for train 6 years ago			`@property`
			`def mixup_enabled(self):`
			`if isinstance(self.loader.collate_fn, FastCollateMixup):`
			`return self.loader.collate_fn.mixup_enabled`
			`else:`
			`return False`

			`@mixup_enabled.setter`
			`def mixup_enabled(self, x):`
			`if isinstance(self.loader.collate_fn, FastCollateMixup):`
			`self.loader.collate_fn.mixup_enabled = x`

Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago
Add initial sotabench attempt. Split create_transform out of create_loader. Update requirements.txt 5 years ago			`def create_transform(`
Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`input_size,`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`is_training=False,`
Add initial sotabench attempt. Split create_transform out of create_loader. Update requirements.txt 5 years ago			`use_prefetcher=False,`
A number of tweaks to arguments, epoch handling, config * reorganize train args * allow resolve_data_config to be used with dict args, not just argparse * stop incrementing epoch before save, more consistent naming vs csv, etc * update resume and start epoch handling to match above * stop auto-incrementing epoch in scheduler 5 years ago			`color_jitter=0.4,`
Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`interpolation='bilinear',`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`mean=IMAGENET_DEFAULT_MEAN,`
			`std=IMAGENET_DEFAULT_STD,`
Lots of refactoring and cleanup. * Move 'test time pool' to Module that can be used by any model, remove from DPN * Remove ResNext model file and combine with ResNet * Remove fbresnet200 as it was an old conversion and pretrained performance not worth param count * Cleanup adaptive avgmax pooling and add back concat variant * Factor out checkpoint load fn 6 years ago			`crop_pct=None,`
Add initial sotabench attempt. Split create_transform out of create_loader. Update requirements.txt 5 years ago			`tf_preprocessing=False):`

Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`if isinstance(input_size, tuple):`
			`img_size = input_size[-2:]`
			`else:`
			`img_size = input_size`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago
Ported Tensorflow pretrained EfficientNet weights and some model cleanup * B0-B3 weights ported from TF with close to paper accuracy * Renamed gen_mobilenet to gen_efficientnet since scaling params go well beyond 'mobile' specific * Add Tensorflow preprocessing option for closer images to source repo 6 years ago			`if tf_preprocessing and use_prefetcher:`
Big re-org, working towards making pip/module as 'timm' 5 years ago			`from timm.data.tf_preprocessing import TfPreprocessTransform`
Add MixNet (https://arxiv.org/abs/1907.09595) with pretrained weights converted from Tensorflow impl * refactor 'same' convolution and add helper to use MixedConv2d when needed * improve performance of 'same' padding for cases that can be handled statically * add support for extra exp, pw, and dw kernel specs with grouping support to decoder/string defs for MixNet * shuffle some args for a bit more consistency, a little less clutter overall in gen_efficientnet.py 5 years ago			`transform = TfPreprocessTransform(`
			`is_training=is_training, size=img_size, interpolation=interpolation)`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`else:`
Ported Tensorflow pretrained EfficientNet weights and some model cleanup * B0-B3 weights ported from TF with close to paper accuracy * Renamed gen_mobilenet to gen_efficientnet since scaling params go well beyond 'mobile' specific * Add Tensorflow preprocessing option for closer images to source repo 6 years ago			`if is_training:`
Working on auto-augment 5 years ago			`if True:`
			`transform = transforms_imagenet_aa(`
			`img_size,`
			`interpolation=interpolation,`
			`use_prefetcher=use_prefetcher,`
			`mean=mean,`
			`std=std)`
			`else:`
			`transform = transforms_imagenet_train(`
			`img_size,`
			`color_jitter=color_jitter,`
			`interpolation=interpolation,`
			`use_prefetcher=use_prefetcher,`
			`mean=mean,`
			`std=std)`
Ported Tensorflow pretrained EfficientNet weights and some model cleanup * B0-B3 weights ported from TF with close to paper accuracy * Renamed gen_mobilenet to gen_efficientnet since scaling params go well beyond 'mobile' specific * Add Tensorflow preprocessing option for closer images to source repo 6 years ago			`else:`
			`transform = transforms_imagenet_eval(`
			`img_size,`
			`interpolation=interpolation,`
			`use_prefetcher=use_prefetcher,`
			`mean=mean,`
			`std=std,`
			`crop_pct=crop_pct)`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago
Add initial sotabench attempt. Split create_transform out of create_loader. Update requirements.txt 5 years ago			`return transform`


			`def create_loader(`
			`dataset,`
			`input_size,`
			`batch_size,`
			`is_training=False,`
			`use_prefetcher=True,`
			`rand_erase_prob=0.,`
			`rand_erase_mode='const',`
Merge remote-tracking branch 'origin/re-exp' into opt 5 years ago			`rand_erase_count=1,`
Add initial sotabench attempt. Split create_transform out of create_loader. Update requirements.txt 5 years ago			`color_jitter=0.4,`
			`interpolation='bilinear',`
			`mean=IMAGENET_DEFAULT_MEAN,`
			`std=IMAGENET_DEFAULT_STD,`
			`num_workers=1,`
			`distributed=False,`
			`crop_pct=None,`
			`collate_fn=None,`
			`fp16=False,`
			`tf_preprocessing=False,`
			`):`
			`dataset.transform = create_transform(`
			`input_size,`
			`is_training=is_training,`
			`use_prefetcher=use_prefetcher,`
			`color_jitter=color_jitter,`
			`interpolation=interpolation,`
			`mean=mean,`
			`std=std,`
			`crop_pct=crop_pct,`
			`tf_preprocessing=tf_preprocessing,`
			`)`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago
Distributed (multi-process) train, multi-gpu single process train, and NVIDIA AMP support 6 years ago			`sampler = None`
			`if distributed:`
Add distributed sampler that maintains order of original dataset (for validation) 6 years ago			`if is_training:`
			`sampler = torch.utils.data.distributed.DistributedSampler(dataset)`
			`else:`
			`# This will add extra duplicate entries to result in equal num`
			`# of samples per-process, will slightly alter validation results`
			`sampler = OrderedDistributedSampler(dataset)`
Distributed (multi-process) train, multi-gpu single process train, and NVIDIA AMP support 6 years ago
Mixup and prefetcher improvements * Do mixup in custom collate fn if prefetcher enabled, reduces performance impact * Move mixup code to own file * Add arg to disable prefetcher * Fix no cuda transfer when prefetcher off * Random erasing when prefetcher off wasn't changed to match new args, fixed * Default random erasing to off (prob = 0.) for train 6 years ago			`if collate_fn is None:`
			`collate_fn = fast_collate if use_prefetcher else torch.utils.data.dataloader.default_collate`

Loader tweaks 6 years ago			`loader = torch.utils.data.DataLoader(`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`dataset,`
			`batch_size=batch_size,`
Distributed (multi-process) train, multi-gpu single process train, and NVIDIA AMP support 6 years ago			`shuffle=sampler is None and is_training,`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`num_workers=num_workers,`
Distributed (multi-process) train, multi-gpu single process train, and NVIDIA AMP support 6 years ago			`sampler=sampler,`
Mixup and prefetcher improvements * Do mixup in custom collate fn if prefetcher enabled, reduces performance impact * Move mixup code to own file * Add arg to disable prefetcher * Fix no cuda transfer when prefetcher off * Random erasing when prefetcher off wasn't changed to match new args, fixed * Default random erasing to off (prob = 0.) for train 6 years ago			`collate_fn=collate_fn,`
Loader tweaks 6 years ago			`drop_last=is_training,`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`)`
			`if use_prefetcher:`
			`loader = PrefetchLoader(`
			`loader,`
Random erasing crash fix and args pass through 6 years ago			`rand_erase_prob=rand_erase_prob if is_training else 0.,`
Change args for RandomErasing so only one required for pixel/color mode 6 years ago			`rand_erase_mode=rand_erase_mode,`
Add support to split random erasing blocks into randomly selected number with --recount arg. Fix random selection of aspect ratios. 5 years ago			`rand_erase_count=rand_erase_count,`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago			`mean=mean,`
Add explicit half/fp16 support to loader and validation script 5 years ago			`std=std,`
			`fp16=fp16)`
Improve creation of data pipeline with prefetch enabled vs disabled, fixup inception_res_v2 and dpn models 6 years ago
			`return loader`