pytorch-image-models/timm/models/gluon_xception.py

"""Pytorch impl of Gluon Xception
This is a port of the Gluon Xception code and weights, itself ported from a PyTorch DeepLab impl.

Gluon model: (https://gluon-cv.mxnet.io/_modules/gluoncv/model_zoo/xception.html)
Original PyTorch DeepLab impl: https://github.com/jfzhang95/pytorch-deeplab-xception

Hacked together by Ross Wightman
"""
from collections import OrderedDict

import torch.nn as nn
import torch.nn.functional as F

from timm.data import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD
from .helpers import load_pretrained
from .layers import SelectAdaptivePool2d, get_padding
from .registry import register_model

__all__ = ['Xception65']

# Pretrained-weight and preprocessing settings, keyed by registered model name.
# The entry is attached to the model as `default_cfg` and handed to
# `load_pretrained` by the factory function at the bottom of this file.
default_cfgs = dict(
    gluon_xception65=dict(
        url='https://github.com/rwightman/pytorch-image-models/releases/download/v0.1-weights/gluon_xception-7015a15c.pth',
        input_size=(3, 299, 299),
        crop_pct=0.903,
        pool_size=(10, 10),
        interpolation='bicubic',
        mean=IMAGENET_DEFAULT_MEAN,
        std=IMAGENET_DEFAULT_STD,
        num_classes=1000,
        first_conv='conv1',
        classifier='fc',
        # The resize parameter of the validation transform should be 333, and make sure to center crop at 299x299
    ),
)

""" PADDING NOTES
The original PyTorch and Gluon impl of these models dutifully reproduced the 
aligned padding added to Tensorflow models for Deeplab. This padding was compensating
for Tensorflow 'SAME' padding. PyTorch symmetric padding behaves the way we'd want it to.
"""


class SeparableConv2d(nn.Module):
    """Depthwise-separable 2D convolution with a norm layer between the two convs.

    The input goes through a depthwise conv (``groups=inplanes``), then the
    normalization layer, then a 1x1 pointwise conv mapping ``inplanes`` to
    ``planes`` channels. No activation is applied inside this module.

    Args:
        inplanes: number of input channels.
        planes: number of output channels of the pointwise conv.
        kernel_size: kernel size of the depthwise conv.
        stride: stride of the depthwise conv.
        dilation: dilation of the depthwise conv.
        bias: whether both convolutions carry a bias term.
        norm_layer: callable building the normalization layer; invoked as
            ``norm_layer(num_features=inplanes, **norm_kwargs)``. ``None``
            falls back to ``nn.BatchNorm2d``.
        norm_kwargs: optional extra keyword arguments for ``norm_layer``.
    """

    def __init__(self, inplanes, planes, kernel_size=3, stride=1,
                 dilation=1, bias=False, norm_layer=None, norm_kwargs=None):
        super(SeparableConv2d, self).__init__()
        # The signature default is None, which is not callable; fall back to the
        # same norm layer the Xception65 model uses by default.
        if norm_layer is None:
            norm_layer = nn.BatchNorm2d
        if norm_kwargs is None:
            norm_kwargs = {}
        self.kernel_size = kernel_size
        self.dilation = dilation

        # depthwise convolution: one filter group per input channel
        padding = get_padding(kernel_size, stride, dilation)
        self.conv_dw = nn.Conv2d(
            inplanes, inplanes, kernel_size, stride=stride,
            padding=padding, dilation=dilation, groups=inplanes, bias=bias)
        self.bn = norm_layer(num_features=inplanes, **norm_kwargs)
        # pointwise convolution: 1x1 conv that mixes channels
        self.conv_pw = nn.Conv2d(inplanes, planes, kernel_size=1, bias=bias)

    def forward(self, x):
        """Apply depthwise conv, normalization and pointwise conv in that order."""
        x = self.conv_dw(x)
        x = self.bn(x)
        x = self.conv_pw(x)
        return x


class Block(nn.Module):
    """Residual block of three (ReLU -> SeparableConv2d -> norm) stages.

    The main path (``self.rep``) stacks three stages named ``act{i}``,
    ``conv{i}`` and ``bn{i}``; only the third separable conv uses ``stride``,
    the first two always use stride 1. The skip path is the identity unless
    the channel count or the spatial stride changes, in which case it is a
    1x1 strided conv followed by a norm layer.

    Args:
        inplanes: number of input channels.
        planes: output channels of the three stages; either a single int
            (used for all three) or a list/tuple of exactly three ints.
        stride: stride of the third separable conv and of the skip conv.
        dilation: dilation used by all three separable convs.
        start_with_relu: when False, the leading ReLU (``act1``) is removed.
        norm_layer: callable building normalization layers. ``None`` falls
            back to ``nn.BatchNorm2d``.
        norm_kwargs: optional extra keyword arguments for ``norm_layer``.
    """

    def __init__(self, inplanes, planes, stride=1, dilation=1, start_with_relu=True,
                 norm_layer=None, norm_kwargs=None, ):
        super(Block, self).__init__()
        # The signature default is None, which is not callable; use BatchNorm2d then.
        if norm_layer is None:
            norm_layer = nn.BatchNorm2d
        if norm_kwargs is None:
            norm_kwargs = {}
        if isinstance(planes, (list, tuple)):
            assert len(planes) == 3
        else:
            planes = (planes,) * 3
        outplanes = planes[-1]

        if outplanes != inplanes or stride != 1:
            # Projection shortcut: match channels / resolution of the main path.
            # Submodule names ('conv1', 'bn1') are part of the checkpoint keys.
            self.skip = nn.Sequential()
            self.skip.add_module('conv1', nn.Conv2d(
                inplanes, outplanes, 1, stride=stride, bias=False))
            self.skip.add_module('bn1', norm_layer(num_features=outplanes, **norm_kwargs))
        else:
            self.skip = None

        rep = OrderedDict()
        for i in range(3):
            rep['act%d' % (i + 1)] = nn.ReLU(inplace=True)
            rep['conv%d' % (i + 1)] = SeparableConv2d(
                inplanes, planes[i], 3, stride=stride if i == 2 else 1, dilation=dilation,
                norm_layer=norm_layer, norm_kwargs=norm_kwargs)
            rep['bn%d' % (i + 1)] = norm_layer(planes[i], **norm_kwargs)
            inplanes = planes[i]

        if not start_with_relu:
            del rep['act1']
        else:
            # The first activation sees the block input, which also feeds the
            # skip path, so it must not modify that tensor in place.
            rep['act1'] = nn.ReLU(inplace=False)
        self.rep = nn.Sequential(rep)

    def forward(self, x):
        """Return ``rep(x) + skip(x)``, with ``skip`` the identity when unset."""
        skip = x
        if self.skip is not None:
            skip = self.skip(skip)
        x = self.rep(x) + skip
        return x


class Xception65(nn.Module):
    """Modified Aligned Xception.

    NOTE: only the 65 layer version is included here, the 71 layer variant
    was not correct and had no pretrained weights

    Args:
        num_classes: number of outputs of the final linear classifier.
        in_chans: number of channels of the input image tensor.
        output_stride: one of 32, 16 or 8; selects the strides and dilations
            of the later blocks. Any other value raises ``NotImplementedError``.
        norm_layer: callable used to build every normalization layer.
        norm_kwargs: optional extra keyword arguments for ``norm_layer``.
        drop_rate: dropout probability applied to the pooled features before
            the classifier; a falsy value disables dropout.
        global_pool: pooling type forwarded to ``SelectAdaptivePool2d``.
    """

    def __init__(self, num_classes=1000, in_chans=3, output_stride=32, norm_layer=nn.BatchNorm2d,
                 norm_kwargs=None, drop_rate=0., global_pool='avg'):
        super(Xception65, self).__init__()
        self.num_classes = num_classes
        self.drop_rate = drop_rate
        norm_kwargs = norm_kwargs if norm_kwargs is not None else {}
        # A smaller output stride swaps striding for dilation in the later blocks.
        if output_stride == 32:
            entry_block3_stride = 2
            exit_block20_stride = 2
            middle_block_dilation = 1
            exit_block_dilations = (1, 1)
        elif output_stride == 16:
            entry_block3_stride = 2
            exit_block20_stride = 1
            middle_block_dilation = 1
            exit_block_dilations = (1, 2)
        elif output_stride == 8:
            entry_block3_stride = 1
            exit_block20_stride = 1
            middle_block_dilation = 2
            exit_block_dilations = (2, 4)
        else:
            raise NotImplementedError(
                'output_stride must be 8, 16 or 32, got %r' % (output_stride,))

        # Entry flow
        self.conv1 = nn.Conv2d(in_chans, 32, kernel_size=3, stride=2, padding=1, bias=False)
        self.bn1 = norm_layer(num_features=32, **norm_kwargs)
        self.relu = nn.ReLU(inplace=True)

        self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1, bias=False)
        # norm_kwargs is forwarded here too, like for every other norm layer.
        self.bn2 = norm_layer(num_features=64, **norm_kwargs)

        self.block1 = Block(
            64, 128, stride=2, start_with_relu=False, norm_layer=norm_layer, norm_kwargs=norm_kwargs)
        self.block2 = Block(
            128, 256, stride=2, start_with_relu=False, norm_layer=norm_layer, norm_kwargs=norm_kwargs)
        self.block3 = Block(
            256, 728, stride=entry_block3_stride, norm_layer=norm_layer, norm_kwargs=norm_kwargs)

        # Middle flow: sixteen identical blocks named block4 .. block19
        self.mid = nn.Sequential(OrderedDict([('block%d' % i, Block(
            728, 728, stride=1, dilation=middle_block_dilation,
            norm_layer=norm_layer, norm_kwargs=norm_kwargs)) for i in range(4, 20)]))

        # Exit flow
        self.block20 = Block(
            728, (728, 1024, 1024), stride=exit_block20_stride, dilation=exit_block_dilations[0],
            norm_layer=norm_layer, norm_kwargs=norm_kwargs)

        self.conv3 = SeparableConv2d(
            1024, 1536, 3, stride=1, dilation=exit_block_dilations[1],
            norm_layer=norm_layer, norm_kwargs=norm_kwargs)
        self.bn3 = norm_layer(num_features=1536, **norm_kwargs)

        self.conv4 = SeparableConv2d(
            1536, 1536, 3, stride=1, dilation=exit_block_dilations[1],
            norm_layer=norm_layer, norm_kwargs=norm_kwargs)
        self.bn4 = norm_layer(num_features=1536, **norm_kwargs)

        self.num_features = 2048
        self.conv5 = SeparableConv2d(
            1536, self.num_features, 3, stride=1, dilation=exit_block_dilations[1],
            norm_layer=norm_layer, norm_kwargs=norm_kwargs)
        self.bn5 = norm_layer(num_features=self.num_features, **norm_kwargs)
        self.global_pool = SelectAdaptivePool2d(pool_type=global_pool)
        # feat_mult() scales the classifier input width for the chosen pooling type.
        self.fc = nn.Linear(self.num_features * self.global_pool.feat_mult(), num_classes)

    def get_classifier(self):
        """Return the classifier head module (``self.fc``)."""
        return self.fc

    def reset_classifier(self, num_classes, global_pool='avg'):
        """Replace the pooling layer and the classifier head.

        Args:
            num_classes: size of the new linear head. A falsy value installs
                ``nn.Identity()`` so ``forward`` returns the pooled features.
            global_pool: pooling type forwarded to ``SelectAdaptivePool2d``.
        """
        self.num_classes = num_classes
        self.global_pool = SelectAdaptivePool2d(pool_type=global_pool)
        if num_classes:
            self.fc = nn.Linear(self.num_features * self.global_pool.feat_mult(), num_classes)
        else:
            # Keep `fc` callable; a None head would make forward() raise.
            self.fc = nn.Identity()

    def forward_features(self, x):
        """Run the convolutional trunk and return the final feature map."""
        # Entry flow
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)

        x = self.conv2(x)
        x = self.bn2(x)
        x = self.relu(x)

        x = self.block1(x)
        # block2 is built with start_with_relu=False, so activate explicitly here
        x = self.relu(x)
        x = self.block2(x)
        x = self.block3(x)

        # Middle flow
        x = self.mid(x)

        # Exit flow
        x = self.block20(x)
        x = self.relu(x)
        x = self.conv3(x)
        x = self.bn3(x)
        x = self.relu(x)

        x = self.conv4(x)
        x = self.bn4(x)
        x = self.relu(x)

        x = self.conv5(x)
        x = self.bn5(x)
        x = self.relu(x)
        return x

    def forward(self, x):
        """Compute features, pool and flatten them, apply dropout, then classify."""
        x = self.forward_features(x)
        x = self.global_pool(x).flatten(1)
        if self.drop_rate:
            # F.dropout is not in-place by default: its result must be kept.
            x = F.dropout(x, self.drop_rate, training=self.training)
        x = self.fc(x)
        return x


@register_model
def gluon_xception65(pretrained=False, num_classes=1000, in_chans=3, **kwargs):
    """Build a Modified Aligned Xception-65 model.

    The model's ``default_cfg`` attribute is set to the 'gluon_xception65'
    entry of ``default_cfgs``. When ``pretrained`` is truthy, weights are
    loaded through ``load_pretrained`` using that same config. Extra keyword
    arguments are passed on to the ``Xception65`` constructor.
    """
    cfg = default_cfgs['gluon_xception65']
    net = Xception65(num_classes=num_classes, in_chans=in_chans, **kwargs)
    net.default_cfg = cfg
    if not pretrained:
        return net
    load_pretrained(net, cfg, num_classes, in_chans)
    return net
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`"""Pytorch impl of Gluon Xception`
			`This is a port of the Gluon Xception code and weights, itself ported from a PyTorch DeepLab impl.`

			`Gluon model: (https://gluon-cv.mxnet.io/_modules/gluoncv/model_zoo/xception.html)`
			`Original PyTorch DeepLab impl: https://github.com/jfzhang95/pytorch-deeplab-xception`

			`Hacked together by Ross Wightman`
			`"""`
Replace all None by nn.Identity() in all models reset_classifier when False-values num_classes is given. Make small code refactoring 5 years ago			`from collections import OrderedDict`

Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`import torch.nn as nn`
			`import torch.nn.functional as F`

Replace all None by nn.Identity() in all models reset_classifier when False-values num_classes is given. Make small code refactoring 5 years ago			`from timm.data import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`from .helpers import load_pretrained`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`from .layers import SelectAdaptivePool2d, get_padding`
Replace all None by nn.Identity() in all models reset_classifier when False-values num_classes is given. Make small code refactoring 5 years ago			`from .registry import register_model`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`__all__ = ['Xception65']`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago
			`default_cfgs = {`
			`'gluon_xception65': {`
			`'url': 'https://github.com/rwightman/pytorch-image-models/releases/download/v0.1-weights/gluon_xception-7015a15c.pth',`
			`'input_size': (3, 299, 299),`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`'crop_pct': 0.903,`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`'pool_size': (10, 10),`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`'interpolation': 'bicubic',`
			`'mean': IMAGENET_DEFAULT_MEAN,`
			`'std': IMAGENET_DEFAULT_STD,`
			`'num_classes': 1000,`
			`'first_conv': 'conv1',`
			`'classifier': 'fc'`
			`# The resize parameter of the validation transform should be 333, and make sure to center crop at 299x299`
			`},`
			`}`

			`""" PADDING NOTES`
			`The original PyTorch and Gluon impl of these models dutifully reproduced the`
			`aligned padding added to Tensorflow models for Deeplab. This padding was compensating`
			`for Tensorflow 'SAME' padding. PyTorch symmetric padding behaves the way we'd want it to.`
			`"""`


			`class SeparableConv2d(nn.Module):`
			`def __init__(self, inplanes, planes, kernel_size=3, stride=1,`
			`dilation=1, bias=False, norm_layer=None, norm_kwargs=None):`
			`super(SeparableConv2d, self).__init__()`
			`norm_kwargs = norm_kwargs if norm_kwargs is not None else {}`
			`self.kernel_size = kernel_size`
			`self.dilation = dilation`

			`# depthwise convolution`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`padding = get_padding(kernel_size, stride, dilation)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.conv_dw = nn.Conv2d(`
			`inplanes, inplanes, kernel_size, stride=stride,`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`padding=padding, dilation=dilation, groups=inplanes, bias=bias)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.bn = norm_layer(num_features=inplanes, **norm_kwargs)`
			`# pointwise convolution`
			`self.conv_pw = nn.Conv2d(inplanes, planes, kernel_size=1, bias=bias)`

			`def forward(self, x):`
			`x = self.conv_dw(x)`
			`x = self.bn(x)`
			`x = self.conv_pw(x)`
			`return x`


			`class Block(nn.Module):`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`def __init__(self, inplanes, planes, stride=1, dilation=1, start_with_relu=True,`
			`norm_layer=None, norm_kwargs=None, ):`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`super(Block, self).__init__()`
			`norm_kwargs = norm_kwargs if norm_kwargs is not None else {}`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`if isinstance(planes, (list, tuple)):`
			`assert len(planes) == 3`
			`else:`
			`planes = (planes,) * 3`
			`outplanes = planes[-1]`

			`if outplanes != inplanes or stride != 1:`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.skip = nn.Sequential()`
			`self.skip.add_module('conv1', nn.Conv2d(`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`inplanes, outplanes, 1, stride=stride, bias=False)),`
			`self.skip.add_module('bn1', norm_layer(num_features=outplanes, **norm_kwargs))`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`else:`
			`self.skip = None`

			`rep = OrderedDict()`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`for i in range(3):`
			`rep['act%d' % (i + 1)] = nn.ReLU(inplace=True)`
			`rep['conv%d' % (i + 1)] = SeparableConv2d(`
			`inplanes, planes[i], 3, stride=stride if i == 2 else 1, dilation=dilation,`
			`norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
			`rep['bn%d' % (i + 1)] = norm_layer(planes[i], **norm_kwargs)`
			`inplanes = planes[i]`

			`if not start_with_relu:`
			`del rep['act1']`
			`else:`
			`rep['act1'] = nn.ReLU(inplace=False)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.rep = nn.Sequential(rep)`

			`def forward(self, x):`
			`skip = x`
			`if self.skip is not None:`
			`skip = self.skip(skip)`
			`x = self.rep(x) + skip`
			`return x`


			`class Xception65(nn.Module):`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`"""Modified Aligned Xception.`

			`NOTE: only the 65 layer version is included here, the 71 layer variant`
			`was not correct and had no pretrained weights`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`"""`

			`def __init__(self, num_classes=1000, in_chans=3, output_stride=32, norm_layer=nn.BatchNorm2d,`
			`norm_kwargs=None, drop_rate=0., global_pool='avg'):`
			`super(Xception65, self).__init__()`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`self.num_classes = num_classes`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.drop_rate = drop_rate`
			`norm_kwargs = norm_kwargs if norm_kwargs is not None else {}`
			`if output_stride == 32:`
			`entry_block3_stride = 2`
			`exit_block20_stride = 2`
			`middle_block_dilation = 1`
			`exit_block_dilations = (1, 1)`
			`elif output_stride == 16:`
			`entry_block3_stride = 2`
			`exit_block20_stride = 1`
			`middle_block_dilation = 1`
			`exit_block_dilations = (1, 2)`
			`elif output_stride == 8:`
			`entry_block3_stride = 1`
			`exit_block20_stride = 1`
			`middle_block_dilation = 2`
			`exit_block_dilations = (2, 4)`
			`else:`
			`raise NotImplementedError`

			`# Entry flow`
			`self.conv1 = nn.Conv2d(in_chans, 32, kernel_size=3, stride=2, padding=1, bias=False)`
			`self.bn1 = norm_layer(num_features=32, **norm_kwargs)`
			`self.relu = nn.ReLU(inplace=True)`

			`self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1, bias=False)`
			`self.bn2 = norm_layer(num_features=64)`

			`self.block1 = Block(`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`64, 128, stride=2, start_with_relu=False, norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.block2 = Block(`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`128, 256, stride=2, start_with_relu=False, norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.block3 = Block(`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`256, 728, stride=entry_block3_stride, norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago
			`# Middle flow`
Replace all None by nn.Identity() in all models reset_classifier when False-values num_classes is given. Make small code refactoring 5 years ago			`self.mid = nn.Sequential(OrderedDict([('block%d' % i, Block(`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`728, 728, stride=1, dilation=middle_block_dilation,`
			`norm_layer=norm_layer, norm_kwargs=norm_kwargs)) for i in range(4, 20)]))`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago
			`# Exit flow`
			`self.block20 = Block(`
Working on feature extraction, interfaces refined, a number of models working, some in progress. 4 years ago			`728, (728, 1024, 1024), stride=exit_block20_stride, dilation=exit_block_dilations[0],`
			`norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago
			`self.conv3 = SeparableConv2d(`
			`1024, 1536, 3, stride=1, dilation=exit_block_dilations[1],`
			`norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
			`self.bn3 = norm_layer(num_features=1536, **norm_kwargs)`

			`self.conv4 = SeparableConv2d(`
			`1536, 1536, 3, stride=1, dilation=exit_block_dilations[1],`
			`norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
			`self.bn4 = norm_layer(num_features=1536, **norm_kwargs)`

A few more additions to Gluon Xception models to match interface of others. 5 years ago			`self.num_features = 2048`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`self.conv5 = SeparableConv2d(`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`1536, self.num_features, 3, stride=1, dilation=exit_block_dilations[1],`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`norm_layer=norm_layer, norm_kwargs=norm_kwargs)`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`self.bn5 = norm_layer(num_features=self.num_features, **norm_kwargs)`
Finish with HRNet, weights and models updated. Improve consistency in model classifier/global pool treatment. 5 years ago			`self.global_pool = SelectAdaptivePool2d(pool_type=global_pool)`
			`self.fc = nn.Linear(self.num_features * self.global_pool.feat_mult(), num_classes)`
A few more additions to Gluon Xception models to match interface of others. 5 years ago
			`def get_classifier(self):`
			`return self.fc`

			`def reset_classifier(self, num_classes, global_pool='avg'):`
			`self.num_classes = num_classes`
Finish with HRNet, weights and models updated. Improve consistency in model classifier/global pool treatment. 5 years ago			`self.global_pool = SelectAdaptivePool2d(pool_type=global_pool)`
			`self.fc = nn.Linear(self.num_features * self.global_pool.feat_mult(), num_classes) if num_classes else None`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago
Finish with HRNet, weights and models updated. Improve consistency in model classifier/global pool treatment. 5 years ago			`def forward_features(self, x):`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`# Entry flow`
			`x = self.conv1(x)`
			`x = self.bn1(x)`
			`x = self.relu(x)`

			`x = self.conv2(x)`
			`x = self.bn2(x)`
			`x = self.relu(x)`

			`x = self.block1(x)`
			`# add relu here`
			`x = self.relu(x)`
			`# c1 = x`
			`x = self.block2(x)`
			`# c2 = x`
			`x = self.block3(x)`

			`# Middle flow`
			`x = self.mid(x)`
			`# c3 = x`

			`# Exit flow`
			`x = self.block20(x)`
			`x = self.relu(x)`
			`x = self.conv3(x)`
			`x = self.bn3(x)`
			`x = self.relu(x)`

			`x = self.conv4(x)`
			`x = self.bn4(x)`
			`x = self.relu(x)`

			`x = self.conv5(x)`
			`x = self.bn5(x)`
			`x = self.relu(x)`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`return x`

			`def forward(self, x):`
			`x = self.forward_features(x)`
Finish with HRNet, weights and models updated. Improve consistency in model classifier/global pool treatment. 5 years ago			`x = self.global_pool(x).flatten(1)`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`if self.drop_rate:`
			`F.dropout(x, self.drop_rate, training=self.training)`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`x = self.fc(x)`
			`return x`


			`@register_model`
			`def gluon_xception65(pretrained=False, num_classes=1000, in_chans=3, **kwargs):`
A few more additions to Gluon Xception models to match interface of others. 5 years ago			`""" Modified Aligned Xception-65`
			`"""`
Add working Gluon Xception-65 model. Some cleanup still needed. 5 years ago			`default_cfg = default_cfgs['gluon_xception65']`
			`model = Xception65(num_classes=num_classes, in_chans=in_chans, **kwargs)`
			`model.default_cfg = default_cfg`
			`if pretrained:`
			`load_pretrained(model, default_cfg, num_classes, in_chans)`
			`return model`