Merge 8ed5ca81cc into a5b01ec04e

2 years ago · 22329d045f
parent a5b01ec04e 8ed5ca81cc
commit 22329d045f
4 changed files with 597 additions and 0 deletions
--- a/docs/models.md
+++ b/docs/models.md
@ -142,6 +142,10 @@ NOTE: I am deprecating this version of the networks, the new ones are part of `r
 * Paper: `Squeeze-and-Excitation Networks` - https://arxiv.org/abs/1709.01507
 * Code: https://github.com/Cadene/pretrained-models.pytorch 

+## SimpleNet [[simplenet.py](https://github.com/rwightman/pytorch-image-models/blob/master/timm/models/simplenet.py)]
+* Paper: `Lets Keep it simple, Using simple architectures to outperform deeper and more complex architectures` - https://arxiv.org/abs/1608.06037
+* Code: https://github.com/Coderx7/SimpleNet_Pytorch
+
 ## TResNet [[tresnet.py](https://github.com/rwightman/pytorch-image-models/blob/master/timm/models/tresnet.py)]
 * Paper: `TResNet: High Performance GPU-Dedicated Architecture` - https://arxiv.org/abs/2003.13630
 * Code: https://github.com/mrT23/TResNet
--- a/docs/models/simplenet.md
+++ b/docs/models/simplenet.md
@ -0,0 +1,96 @@
+# SimpleNet v1
+
+**SimpleNetV1** is a convolutional neural network designed with simplicity in mind that nonetheless outperforms much deeper and more complex architectures. It uses only the most basic operators of a plain CNN: the network is built entirely from convolutional layers, each followed by batch normalization and a ReLU activation.  
+
+## How do I use this model on an image?
+To load a pretrained model, choose one of the available variants and run:
+```python
+import timm
+model = timm.create_model('simplenetv1_5m_m2', pretrained=True)
+model.eval()
+```
+
+To load and preprocess the image:
+```python 
+import urllib
+from PIL import Image
+from timm.data import resolve_data_config
+from timm.data.transforms_factory import create_transform
+
+config = resolve_data_config({}, model=model)
+transform = create_transform(**config)
+
+url, filename = ("https://github.com/pytorch/hub/raw/master/images/dog.jpg", "dog.jpg")
+urllib.request.urlretrieve(url, filename)
+img = Image.open(filename).convert('RGB')
+tensor = transform(img).unsqueeze(0) # transform and add batch dimension
+```
+
+To get the model predictions:
+```python
+import torch
+with torch.no_grad():
+    out = model(tensor)
+probabilities = torch.nn.functional.softmax(out[0], dim=0)
+print(probabilities.shape)
+# prints: torch.Size([1000])
+```
+
+To get the top-5 predictions class names:
+```python
+# Get imagenet class mappings
+url, filename = ("https://raw.githubusercontent.com/pytorch/hub/master/imagenet_classes.txt", "imagenet_classes.txt")
+urllib.request.urlretrieve(url, filename) 
+with open("imagenet_classes.txt", "r") as f:
+    categories = [s.strip() for s in f.readlines()]
+
+# Print top categories per image
+top5_prob, top5_catid = torch.topk(probabilities, 5)
+for i in range(top5_prob.size(0)):
+    print(categories[top5_catid[i]], top5_prob[i].item())
+# prints class names and probabilities like:
+# Samoyed 0.8442415595054626
+# Pomeranian 0.09159677475690842
+# Great Pyrenees 0.013929242268204689
+# Arctic fox 0.00913404393941164
+# white wolf 0.008576451800763607
+```
+
+Replace the model name with the variant you want to use, e.g. `simplenetv1_9m_m2`. You can find the IDs in the model summaries at the top of this page.
+
+To extract image features with this model, follow the [timm feature extraction examples](https://rwightman.github.io/pytorch-image-models/feature_extraction/), just change the name of the model you want to use.
+
+## How do I finetune this model?
+You can finetune any of the pre-trained models just by changing the classifier (the last layer).
+```python
+model = timm.create_model('simplenetv1_5m_m2', pretrained=True, num_classes=NUM_FINETUNE_CLASSES)
+```
+To finetune on your own dataset, you have to write a training loop or adapt [timm's training
+script](https://github.com/rwightman/pytorch-image-models/blob/master/train.py) to use your dataset.
+
+## How do I train this model?
+
+You can follow the [timm recipe scripts](https://rwightman.github.io/pytorch-image-models/scripts/) for training a new model afresh.
+
+## Citation
+
+```BibTeX
+@article{DBLP:journals/corr/HasanPourRVS16,
+  author    = {Seyyed Hossein HasanPour and
+               Mohammad Rouhani and
+               Mohsen Fayyaz and
+               Mohammad Sabokrou},
+  title     = {Lets keep it simple, Using simple architectures to outperform deeper
+               and more complex architectures},
+  journal   = {CoRR},
+  volume    = {abs/1608.06037},
+  year      = {2016},
+  url       = {http://arxiv.org/abs/1608.06037},
+  eprinttype = {arXiv},
+  eprint    = {1608.06037},
+  timestamp = {Mon, 13 Aug 2018 16:48:25 +0200},
+  biburl    = {https://dblp.org/rec/journals/corr/HasanPourRVS16.bib},
+  bibsource = {dblp computer science bibliography, https://dblp.org}
+}
+```
--- a/timm/models/__init__.py
+++ b/timm/models/__init__.py
@ -48,6 +48,7 @@ from .rexnet import *
 from .selecsls import *
 from .senet import *
 from .sequencer import *
+from .simplenet import *
 from .sknet import *
 from .swin_transformer import *
 from .swin_transformer_v2 import *
--- a/timm/models/simplenet.py
+++ b/timm/models/simplenet.py
@ -0,0 +1,496 @@
+""" SimpleNet
+
+Paper: `Lets Keep it simple, Using simple architectures to outperform deeper and more complex architectures`
+    - https://arxiv.org/abs/1608.06037
+
+@article{hasanpour2016lets,
+  title={Lets keep it simple, Using simple architectures to outperform deeper and more complex architectures},
+  author={Hasanpour, Seyyed Hossein and Rouhani, Mohammad and Fayyaz, Mohsen and Sabokrou, Mohammad},
+  journal={arXiv preprint arXiv:1608.06037},
+  year={2016}
+}
+
+Official Caffe impl at https://github.com/Coderx7/SimpleNet
+Official PyTorch impl at https://github.com/Coderx7/SimpleNet_Pytorch
+Seyyed Hossein Hasanpour
+"""
+import math
+from typing import Union, Tuple, List, Dict, Any, Optional
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+
+from ._builder import build_model_with_cfg
+from ._registry import register_model
+from timm.data import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD
+
+# Public names re-exported by `from .simplenet import *`.
+# The model class is listed explicitly so that it is importable from the package
+# alongside the entrypoint functions.
+__all__ = [
+    "SimpleNet",
+    "simplenet",
+    "simplenetv1_small_m1_05",  # 1.5m
+    "simplenetv1_small_m2_05",  # 1.5m
+    "simplenetv1_small_m1_075",  # 3m
+    "simplenetv1_small_m2_075",  # 3m
+    "simplenetv1_5m_m1",  # 5m
+    "simplenetv1_5m_m2",  # 5m
+    "simplenetv1_9m_m1",  # 9m
+    "simplenetv1_9m_m2",  # 9m
+]  # model_registry will add each entrypoint fn to this
+
+
+def _cfg(url="", **kwargs):
+    """Return a pretrained-config dict for one model variant.
+
+    The dict starts from the settings shared by every variant in this file
+    (1000 classes, 3x224x224 input, 0.875 crop, bicubic interpolation and the
+    ImageNet default mean/std); any keyword argument overrides or extends them.
+
+    Args:
+        url: download location of the checkpoint. Defaults to an empty string.
+        **kwargs: extra or overriding config entries.
+
+    Returns:
+        The assembled config dict.
+    """
+    cfg = dict(
+        url=url,
+        num_classes=1000,
+        input_size=(3, 224, 224),
+        crop_pct=0.875,
+        interpolation="bicubic",
+        mean=IMAGENET_DEFAULT_MEAN,
+        std=IMAGENET_DEFAULT_STD,
+    )
+    # Caller-supplied entries win over the shared defaults above.
+    cfg.update(kwargs)
+    return cfg
+
+
+# All checkpoints live under the same release tag; only the file name differs.
+_SIMPLENET_RELEASE_URL = "https://github.com/Coderx7/SimpleNet_Pytorch/releases/download/v1.0.0"
+
+# Maps each variant name to its pretrained config. The checkpoint file name is
+# "<variant>-<hash>.pth", where <hash> is the suffix listed next to the variant.
+default_cfgs: Dict[str, Dict[str, Any]] = {
+    variant: _cfg(url=f"{_SIMPLENET_RELEASE_URL}/{variant}-{digest}.pth")
+    for variant, digest in (
+        ("simplenetv1_small_m1_05", "a7ec600b"),
+        ("simplenetv1_small_m2_05", "62617ea1"),
+        ("simplenetv1_small_m1_075", "8427bf60"),
+        ("simplenetv1_small_m2_075", "da714eb5"),
+        ("simplenetv1_5m_m1", "cc6b3ad1"),
+        ("simplenetv1_5m_m2", "c35297bf"),
+        ("simplenetv1_9m_m1", "8c98a0a5"),
+        ("simplenetv1_9m_m2", "6b01be1e"),
+    )
+}
+
+
+class View(nn.Module):
+    """Debugging pass-through layer: prints the shape of its input and returns the input unchanged."""
+
+    def forward(self, x):
+        shape_text = f"{x.shape}"
+        print(shape_text)
+        return x
+
+
+class SimpleNet(nn.Module):
+    """SimpleNet v1: a plain stack of Conv-BatchNorm-ReLU-Dropout blocks with two max-pool stages.
+
+    Paper: `Lets Keep it simple, Using simple architectures to outperform deeper and
+    more complex architectures` - https://arxiv.org/abs/1608.06037
+    """
+
+    def __init__(
+        self,
+        num_classes: int = 1000,
+        in_chans: int = 3,
+        scale: float = 1,
+        network_idx: int = 0,
+        mode: int = 2,
+        drop_rates: Optional[Dict[int, float]] = None,
+    ):
+        """Instantiates a SimpleNet model. SimpleNet is comprised of the most basic building blocks of a CNN
+        architecture. It uses basic principles to maximize the network performance both in terms of feature
+        representation and speed without resorting to complex design or operators.
+
+        Args:
+            num_classes (int, optional): number of classes. Defaults to 1000.
+            in_chans (int, optional): number of input channels. Defaults to 3.
+            scale (float, optional): width multiplier applied to the channel count of every
+                convolution. Defaults to 1.0.
+            network_idx (int, optional): index into ``self.networks``; 0 selects the
+                ``simplenetv1_imagenet`` table (5 million parameter family) and 1 selects
+                ``simplenetv1_imagenet_9m`` (9 million parameter family). Defaults to 0.
+            mode (int, optional): stride mode of the architecture, one of the keys of ``self.strides``
+                (0 to 4). It specifies how fast the input shrinks: 0 keeps the strides of the layer
+                table unchanged, while 1-4 each apply a specific downsampling strategy to the first
+                layers. This matters for larger inputs such as 224x224 ImageNet images, which incur a
+                lot of overhead if not downsampled properly. For ImageNet use 1-4. The larger the
+                stride mode, usually the higher the accuracy and the slower the network; stride mode 1
+                is the fastest and achieves very good accuracy. Defaults to 2.
+            drop_rates (Dict[int, float], optional): custom dropout rates keyed by layer index (only
+                pooling and convolution layers are counted). Index 15 sets the dropout applied after
+                the final global pooling. ``None`` or an empty dict keeps the rates from the layer
+                table. Defaults to None.
+        """
+        super().__init__()
+        # Each row: (out_channels, or "p" for a max-pool layer; stride; dropout rate[; "k1" for a 1x1 kernel]).
+        self.cfg: Dict[str, List[Tuple[Any, ...]]] = {
+            "simplenetv1_imagenet": [
+                (64, 1, 0.0),
+                (128, 1, 0.0),
+                (128, 1, 0.0),
+                (128, 1, 0.0),
+                (128, 1, 0.0),
+                (128, 1, 0.0),
+                ("p", 2, 0.0),
+                (256, 1, 0.0),
+                (256, 1, 0.0),
+                (256, 1, 0.0),
+                (512, 1, 0.0),
+                ("p", 2, 0.0),
+                (2048, 1, 0.0, "k1"),
+                (256, 1, 0.0, "k1"),
+                (256, 1, 0.0),
+            ],
+            "simplenetv1_imagenet_9m": [
+                (128, 1, 0.0),
+                (192, 1, 0.0),
+                (192, 1, 0.0),
+                (192, 1, 0.0),
+                (192, 1, 0.0),
+                (192, 1, 0.0),
+                ("p", 2, 0.0),
+                (320, 1, 0.0),
+                (320, 1, 0.0),
+                (320, 1, 0.0),
+                (640, 1, 0.0),
+                ("p", 2, 0.0),
+                (2560, 1, 0.0, "k1"),
+                (320, 1, 0.0, "k1"),
+                (320, 1, 0.0),
+            ],
+        }
+
+        # Copy the mapping so the instance never aliases the caller's dict (or a shared default).
+        self.dropout_rates: Dict[int, float] = dict(drop_rates) if drop_rates else {}
+        # 15 is the last layer of the network(including two previous pooling layers)
+        # basically specifying the dropout rate for the very last layer to be used after the pooling
+        self.last_dropout_rate = float(self.dropout_rates.get(15, 0.0))
+        # stride mode -> {layer index: stride override}; layers not listed keep the stride of their table row.
+        self.strides = {
+            0: {},
+            1: {0: 2, 1: 2, 2: 2},
+            2: {0: 2, 1: 2, 2: 1, 3: 2},
+            3: {0: 2, 1: 2, 2: 1, 3: 1, 4: 2},
+            4: {0: 2, 1: 1, 2: 2, 3: 1, 4: 2, 5: 1},
+        }
+
+        self.num_classes = num_classes
+        self.in_chans = in_chans
+        self.scale = scale
+        self.networks = [
+            "simplenetv1_imagenet",  # 0
+            "simplenetv1_imagenet_9m",  # 1
+            # other archs
+        ]
+        self.network_idx = network_idx
+        self.mode = mode
+
+        # Width of the last convolution, i.e. the size of the pooled feature vector fed to the classifier.
+        self.num_features = round(self.cfg[self.networks[network_idx]][-1][0] * scale)
+        self.features = self._make_layers(scale)
+        self.classifier = nn.Linear(self.num_features, num_classes)
+
+    def forward(self, x: torch.Tensor):
+        """Run the full network on an image batch and return the classifier output."""
+        return self.forward_head(self.forward_features(x))
+
+    def _make_layers(self, scale: float):
+        """Build the feature extractor as an ``nn.Sequential`` from the selected layer table.
+
+        Args:
+            scale: width multiplier applied to every convolution's channel count.
+
+        Returns:
+            The sequential feature extractor, with convolution weights Xavier-initialised.
+        """
+        layers: List[nn.Module] = []
+        input_channel = self.in_chans
+        stride_overrides = self.strides[self.mode]
+        for idx, (layer, stride, default_dropout_rate, *layer_type) in enumerate(
+            self.cfg[self.networks[self.network_idx]]
+        ):
+            stride = stride_overrides.get(idx, stride)
+            # check if any custom dropout rate is specified
+            # for this layer, note that pooling also counts as 1 layer
+            custom_dropout = self.dropout_rates.get(idx)
+            if custom_dropout is None:
+                custom_dropout = default_dropout_rate
+            # dropout values must be strictly decimal. while 0 doesnt introduce any issues here
+            # i.e. during training and inference, if you try to jit trace your model it will crash
+            # due to using 0 as dropout value(this applies up to 1.13.1) so here is an explicit
+            # check to convert any possible integer value to its decimal counterpart.
+            dropout_p = float(custom_dropout)
+            # A fourth tuple element (e.g. "k1") marks a 1x1 convolution; otherwise the kernel is 3x3.
+            kernel_size = 1 if layer_type else 3
+
+            if layer == "p":
+                layers += [
+                    nn.MaxPool2d(kernel_size=(2, 2), stride=(stride, stride)),
+                    nn.Dropout2d(p=dropout_p, inplace=True),
+                ]
+                continue
+
+            filters = round(layer * scale)
+            # A Dropout2d module is appended to every block (even with p=0.0), so each block always
+            # occupies four consecutive indices in the Sequential.
+            # NOTE: padding is 1 for 1x1 kernels as well, so those layers enlarge the feature map by
+            # one pixel on every side; this is kept unchanged here.
+            layers += [
+                nn.Conv2d(input_channel, filters, kernel_size=kernel_size, stride=stride, padding=1),
+                nn.BatchNorm2d(filters, eps=1e-05, momentum=0.05, affine=True),
+                nn.ReLU(inplace=True),
+                nn.Dropout2d(p=dropout_p, inplace=False),
+            ]
+            input_channel = filters
+
+        model = nn.Sequential(*layers)
+        for m in model.modules():
+            if isinstance(m, nn.Conv2d):
+                nn.init.xavier_uniform_(m.weight.data, gain=nn.init.calculate_gain("relu"))
+        return model
+
+    @torch.jit.ignore
+    def group_matcher(self, coarse=False):
+        """Return the regex patterns that group parameters into a stem and per-index blocks."""
+        # this treats BN layers as separate groups for bn variants, a lot of effort to fix that
+        return dict(stem=r"^features\.0", blocks=r"^features\.(\d+)")
+
+    @torch.jit.ignore
+    def set_grad_checkpointing(self, enable=True):
+        """Gradient checkpointing is not implemented; only ``enable=False`` is accepted."""
+        assert not enable, "gradient checkpointing not supported"
+
+    @torch.jit.ignore
+    def get_classifier(self):
+        """Return the classification head module."""
+        return self.classifier
+
+    def reset_classifier(self, num_classes: int):
+        """Replace the classification head with a freshly initialised one.
+
+        Args:
+            num_classes: size of the new head. A value of 0 (or less) removes the head, so the
+                model outputs the pooled feature vector instead.
+        """
+        self.num_classes = num_classes
+        self.classifier = nn.Linear(self.num_features, num_classes) if num_classes > 0 else nn.Identity()
+
+    def forward_features(self, x: torch.Tensor) -> torch.Tensor:
+        """Run the convolutional feature extractor and return its (unpooled) feature map."""
+        return self.features(x)
+
+    def forward_head(self, x: torch.Tensor, pre_logits: bool = False):
+        """Pool a feature map and classify it.
+
+        Args:
+            x: output of :meth:`forward_features` (a 4-D feature map), NOT a raw image batch.
+            pre_logits: if True, return the pooled, flattened features without applying the classifier.
+
+        Returns:
+            The classifier output, or the pooled feature vector when ``pre_logits`` is True.
+        """
+        # Global max pooling over the full spatial extent, followed by the dropout of the last layer.
+        x = F.max_pool2d(x, kernel_size=x.size()[2:])
+        x = F.dropout2d(x, self.last_dropout_rate, training=self.training)
+        x = x.view(x.size(0), -1)
+        return x if pre_logits else self.classifier(x)
+
+
+def _gen_simplenet(
+    model_variant: str = "simplenetv1_m2",
+    num_classes: int = 1000,
+    in_chans: int = 3,
+    scale: float = 1.0,
+    network_idx: int = 0,
+    mode: int = 2,
+    pretrained: bool = False,
+    drop_rates: Optional[Dict[int, float]] = None,
+    **kwargs,
+) -> SimpleNet:
+    """Build a SimpleNet through ``build_model_with_cfg`` and adapt its classifier if needed.
+
+    Args:
+        model_variant: variant name handed to ``build_model_with_cfg``.
+        num_classes: number of output classes wanted by the caller. Defaults to 1000.
+        in_chans: number of input channels. Defaults to 3.
+        scale: width multiplier of the architecture. Defaults to 1.0.
+        network_idx: which layer table of ``SimpleNet`` to use. Defaults to 0.
+        mode: stride mode of the architecture. Defaults to 2.
+        pretrained: whether pretrained weights should be loaded. Defaults to False.
+        drop_rates: custom per-layer dropout rates; ``None`` means no custom rates.
+        **kwargs: forwarded unchanged to ``build_model_with_cfg``.
+
+    Returns:
+        SimpleNet: the constructed model.
+    """
+    # `num_classes` is deliberately left out of the constructor arguments: to allow for seamless
+    # finetuning the model is first built (and loaded) with its default head, and the head is
+    # replaced afterwards. Being a named parameter, `num_classes` can never appear in `kwargs`.
+    model_args = dict(
+        in_chans=in_chans,
+        scale=scale,
+        network_idx=network_idx,
+        mode=mode,
+        # Always hand the model its own dict so no default object is shared between calls.
+        drop_rates=dict(drop_rates) if drop_rates else {},
+        **kwargs,
+    )
+    model = build_model_with_cfg(SimpleNet, model_variant, pretrained, **model_args)
+    # if the num_classes is different than imagenet's, it
+    # means its going to be finetuned, so only create a
+    # new classifier after the whole model is loaded!
+    if num_classes != 1000:
+        model.reset_classifier(num_classes)
+    return model
+
+
+@register_model
+def simplenet(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Generic simplenet model builder. By default it returns the `simplenetv1_5m_m2` model,
+    but specifying different arguments such as `network_idx`, `scale` or `mode` will result in
+    the corresponding network variant.
+
+    When pretrained is specified, the combination of settings must resemble a known variant
+    listed in `default_cfgs`; its pretrained weights are then loaded. Otherwise an exception is
+    raised denoting that an unknown model variant was specified.
+
+    Only the keys `num_classes`, `in_chans`, `scale`, `network_idx`, `mode` and `drop_rates`
+    are read from `kwargs`; any other entry is ignored.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights only if the model is a
+            known variant specified in default_cfgs. Defaults to False.
+
+    Raises:
+        ValueError: if pretrained is used with an unknown/custom model variant.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    num_classes = kwargs.get("num_classes", 1000)
+    in_chans = kwargs.get("in_chans", 3)
+    scale = kwargs.get("scale", 1.0)
+    network_idx = kwargs.get("network_idx", 0)
+    mode = kwargs.get("mode", 2)
+    drop_rates = kwargs.get("drop_rates", {})
+    model_variant = "simplenetv1_5m_m2"
+    if pretrained:
+        # check if the model specified is a known variant
+        # (network index -> size tag used in the variant names; unknown indices give None)
+        model_base = {0: 5, 1: 9}.get(network_idx)
+        if math.isclose(scale, 1.0):
+            config = f"{model_base}m_m{mode}"
+        # The "small" checkpoints are scaled versions of network 0 only, so they must not be
+        # selected for any other network index.
+        elif network_idx == 0 and math.isclose(scale, 0.75):
+            config = f"small_m{mode}_075"
+        elif network_idx == 0 and math.isclose(scale, 0.5):
+            config = f"small_m{mode}_05"
+        else:
+            config = f"m{mode}_{scale:.2f}".replace(".", "")
+        model_variant = f"simplenetv1_{config}"
+
+        if model_variant not in default_cfgs:
+            raise ValueError(f"Unknown model variant ('{model_variant}') specified!")
+
+    return _gen_simplenet(model_variant, num_classes, in_chans, scale, network_idx, mode, pretrained, drop_rates)
+
+
+def remove_network_settings(kwargs: Dict[str, Any]) -> Dict[str, Any]:
+    """Drop the entries that the predefined network configurations below set themselves.
+
+    The keys "scale", "network_idx", "mode" and "drop_rate" are filtered out; every other
+    entry is copied into a new dict. The input dict is left untouched.
+
+    Returns:
+        Dict[str,Any]: cleaned kwargs
+    """
+    fixed_keys = ["scale", "network_idx", "mode", "drop_rate"]
+    cleaned: Dict[str, Any] = {}
+    for key, value in kwargs.items():
+        if key in fixed_keys:
+            continue
+        cleaned[key] = value
+    return cleaned
+
+
+# imagenet models
+@register_model
+def simplenetv1_small_m1_05(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Small variant of simplenetv1_5m (scale 0.5, 1.5m parameters) using the m1 stride mode,
+    which makes it the fastest variant available.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_small_m1_05",
+        scale=0.5,
+        network_idx=0,
+        mode=1,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_small_m2_05(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Second small variant of simplenetv1_5m (scale 0.5, 1.5m parameters) using the m2 stride mode,
+    which makes it the second fastest variant available.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_small_m2_05",
+        scale=0.5,
+        network_idx=0,
+        mode=2,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_small_m1_075(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Third small variant of simplenetv1_5m (scale 0.75, 3m parameters) using the m1 stride mode,
+    which makes it the third fastest variant available.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_small_m1_075",
+        scale=0.75,
+        network_idx=0,
+        mode=1,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_small_m2_075(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Fourth small variant of simplenetv1_5m (scale 0.75, 3m parameters) using the m2 stride mode,
+    which makes it the fourth fastest variant available.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_small_m2_075",
+        scale=0.75,
+        network_idx=0,
+        mode=2,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_5m_m1(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Base simplenet model known as simplenetv1_5m (scale 1.0, 5m parameters) using the m1 stride
+    mode, which makes it a fast and performant model.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_5m_m1",
+        scale=1.0,
+        network_idx=0,
+        mode=1,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_5m_m2(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Base simplenet model known as simplenetv1_5m (scale 1.0, 5m parameters) using the m2 stride
+    mode, which makes it a bit more performant than the m1 flavour of the same model at the expense
+    of a bit slower inference.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_5m_m2",
+        scale=1.0,
+        network_idx=0,
+        mode=2,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_9m_m1(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Wider variant of simplenetv1_5m (network index 1, 9m parameters) using the m1 stride mode,
+    which makes it run faster.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_9m_m1",
+        scale=1.0,
+        network_idx=1,
+        mode=1,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+@register_model
+def simplenetv1_9m_m2(pretrained: bool = False, **kwargs: Any) -> SimpleNet:
+    """Wider variant of simplenetv1_5m (network index 1, 9m parameters) using the m2 stride mode,
+    which makes it a bit more performant than the m1 flavour of the same model at the expense of a
+    bit slower inference.
+
+    Any `scale`, `network_idx`, `mode` or `drop_rate` passed in `kwargs` is discarded.
+
+    Args:
+        pretrained (bool, optional): loads the model with pretrained weights. Defaults to False.
+
+    Returns:
+        SimpleNet: a SimpleNet model instance is returned upon successful instantiation.
+    """
+    return _gen_simplenet(
+        "simplenetv1_9m_m2",
+        scale=1.0,
+        network_idx=1,
+        mode=2,
+        pretrained=pretrained,
+        **remove_network_settings(kwargs),
+    )
+
+
+if __name__ == "__main__":
+    # Smoke test: build the default pretrained model and push one random image through it.
+    model = simplenet(num_classes=1000, pretrained=True)
+    model.eval()
+    # nn.Conv2d expects channels-first input, i.e. (batch, channels, height, width);
+    # the model is built with in_chans=3, so the channel axis must be dimension 1.
+    input_dummy = torch.randn(size=(1, 3, 224, 224))
+    with torch.no_grad():
+        out = model(input_dummy)
+    print(f"output: {out.size()}")