# pytorch-image-models/timm/models/helpers.py

import torch
import torch.utils.model_zoo as model_zoo
import os
from collections import OrderedDict


def load_checkpoint(model, checkpoint_path, use_ema=False):
    """Load model weights from a checkpoint file into ``model``.

    The file may contain either a training checkpoint (a dict holding a
    ``'state_dict'`` and optionally a ``'state_dict_ema'`` entry) or a bare
    state dict. Keys carrying a leading ``module.`` prefix (as produced when
    the saved model was wrapped, e.g. by ``torch.nn.DataParallel``) have that
    prefix removed before loading.

    Args:
        model: Module whose ``load_state_dict`` receives the weights.
        checkpoint_path: Path to the checkpoint file.
        use_ema: Prefer the ``'state_dict_ema'`` entry when it is present;
            falls back to ``'state_dict'`` otherwise.

    Raises:
        FileNotFoundError: If ``checkpoint_path`` is empty or not a file.
    """
    if not checkpoint_path or not os.path.isfile(checkpoint_path):
        print("=> Error: No checkpoint found at '{}'".format(checkpoint_path))
        raise FileNotFoundError("No checkpoint found at '{}'".format(checkpoint_path))

    # Deserialize onto the CPU so a checkpoint written on a GPU machine can be
    # read on a host without that device; load_state_dict copies the values
    # into the model's own parameters afterwards.
    checkpoint = torch.load(checkpoint_path, map_location='cpu')

    # Pick the entry to load; stays empty when the file is a bare state dict.
    state_dict_key = ''
    if isinstance(checkpoint, dict):
        if use_ema and 'state_dict_ema' in checkpoint:
            state_dict_key = 'state_dict_ema'
        elif 'state_dict' in checkpoint:
            state_dict_key = 'state_dict'

    if state_dict_key:
        # Match the full 'module.' prefix (including the dot) so that keys
        # which merely start with "module", such as 'module_head.weight',
        # are left untouched.
        prefix = 'module.'
        new_state_dict = OrderedDict(
            (k[len(prefix):] if k.startswith(prefix) else k, v)
            for k, v in checkpoint[state_dict_key].items()
        )
        model.load_state_dict(new_state_dict)
    else:
        model.load_state_dict(checkpoint)
    print("=> Loaded {} from checkpoint '{}'".format(state_dict_key or 'weights', checkpoint_path))


def resume_checkpoint(model, checkpoint_path, start_epoch=None):
    """Restore model weights from a checkpoint and report where to resume.

    When the file holds a dict with a ``'state_dict'`` entry, the weights are
    loaded from it (with any leading ``module.`` key prefix removed), the
    ``'optimizer'`` entry is returned if present, and the stored ``'epoch'``
    is used as the resume epoch unless ``start_epoch`` overrides it. Any other
    file content is treated as a bare state dict and resumes from epoch 0
    unless ``start_epoch`` is given.

    Args:
        model: Module whose ``load_state_dict`` receives the weights.
        checkpoint_path: Path to the checkpoint file.
        start_epoch: Explicit resume epoch; ``None`` means take it from the
            checkpoint (or 0 when the checkpoint does not record one).

    Returns:
        Tuple ``(optimizer_state, start_epoch)``; ``optimizer_state`` is
        ``None`` when the checkpoint has no ``'optimizer'`` entry.

    Raises:
        FileNotFoundError: If ``checkpoint_path`` is empty or not a file.
    """
    # Guard against None/'' the same way load_checkpoint does, so a missing
    # path is reported as FileNotFoundError rather than a TypeError.
    if not checkpoint_path or not os.path.isfile(checkpoint_path):
        print("=> Error: No checkpoint found at '{}'".format(checkpoint_path))
        raise FileNotFoundError("No checkpoint found at '{}'".format(checkpoint_path))

    # Deserialize onto the CPU so the file can be read regardless of the
    # device it was saved from.
    checkpoint = torch.load(checkpoint_path, map_location='cpu')

    optimizer_state = None
    if isinstance(checkpoint, dict) and 'state_dict' in checkpoint:
        # Match the full 'module.' prefix (including the dot) so that keys
        # which merely start with "module" are left untouched.
        prefix = 'module.'
        new_state_dict = OrderedDict(
            (k[len(prefix):] if k.startswith(prefix) else k, v)
            for k, v in checkpoint['state_dict'].items()
        )
        model.load_state_dict(new_state_dict)
        optimizer_state = checkpoint.get('optimizer')
        # A checkpoint without an 'epoch' entry resumes from 0, matching the
        # bare-state-dict branch below, instead of failing after the weights
        # have already been loaded.
        saved_epoch = checkpoint.get('epoch')
        if start_epoch is None:
            start_epoch = 0 if saved_epoch is None else saved_epoch
        print("=> Loaded checkpoint '{}' (epoch {})".format(checkpoint_path, saved_epoch))
    else:
        model.load_state_dict(checkpoint)
        start_epoch = 0 if start_epoch is None else start_epoch
        print("=> Loaded checkpoint '{}'".format(checkpoint_path))
    return optimizer_state, start_epoch


def load_pretrained(model, default_cfg, num_classes=1000, in_chans=3, filter_fn=None):
    """Fetch pretrained weights described by ``default_cfg`` and load them.

    The state dict is obtained from ``default_cfg['url']`` and adapted to the
    requested model configuration before being passed to
    ``model.load_state_dict``:

    * ``in_chans == 1``: the first conv weight (named by
      ``default_cfg['first_conv']``) is summed over its input-channel
      dimension to produce a single-channel kernel.
    * ``num_classes == 1000`` with 1001 pretrained classes: the first
      classifier row/bias entry (the extra background class) is dropped.
    * any other class-count mismatch: the classifier parameters are removed
      and the remaining weights are loaded non-strictly.

    Args:
        model: Module that receives the weights.
        default_cfg: Dict with ``'url'``, ``'classifier'``, ``'num_classes'``
            and (for ``in_chans == 1``) ``'first_conv'`` entries.
        num_classes: Number of classes of the created model.
        in_chans: Number of input channels of the created model; must be
            1 or 3.
        filter_fn: Optional callable applied to the adapted state dict; its
            return value is what gets loaded.

    Returns:
        None. When no URL is configured a warning is printed and the model is
        left untouched.

    Raises:
        AssertionError: If ``in_chans`` is neither 1 nor 3.
    """
    url = default_cfg.get('url')
    if not url:
        print("Warning: pretrained model URL is invalid, using random initialization.")
        return

    # Validate before fetching so a bad argument fails immediately. Raised
    # explicitly (not via `assert`) so the check survives `python -O`; the
    # exception type is kept for backward compatibility.
    if in_chans not in (1, 3):
        raise AssertionError("Invalid in_chans for pretrained weights")

    # Map to CPU so weights saved from another device load on any host.
    state_dict = model_zoo.load_url(url, map_location='cpu')

    if in_chans == 1:
        conv1_name = default_cfg['first_conv']
        print('Converting first conv (%s) from 3 to 1 channel' % conv1_name)
        conv1_key = conv1_name + '.weight'
        state_dict[conv1_key] = state_dict[conv1_key].sum(dim=1, keepdim=True)

    strict = True
    classifier_name = default_cfg['classifier']
    weight_key = classifier_name + '.weight'
    bias_key = classifier_name + '.bias'
    pretrained_classes = default_cfg['num_classes']
    if num_classes == 1000 and pretrained_classes == 1001:
        # special case for imagenet trained models with extra background class in pretrained weights
        state_dict[weight_key] = state_dict[weight_key][1:]
        if bias_key in state_dict:  # classifier may have been built without a bias
            state_dict[bias_key] = state_dict[bias_key][1:]
    elif num_classes != pretrained_classes:
        # completely discard fully connected for all other differences between pretrained and created model
        # pop() tolerates a classifier parameter that is absent from the weights
        state_dict.pop(weight_key, None)
        state_dict.pop(bias_key, None)
        strict = False

    if filter_fn is not None:
        state_dict = filter_fn(state_dict)

    model.load_state_dict(state_dict, strict=strict)
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`import torch`
			`import torch.utils.model_zoo as model_zoo`
			`import os`
			`from collections import OrderedDict`


Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`def load_checkpoint(model, checkpoint_path, use_ema=False):`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`if checkpoint_path and os.path.isfile(checkpoint_path):`
			`checkpoint = torch.load(checkpoint_path)`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`state_dict_key = ''`
			`if isinstance(checkpoint, dict):`
			`state_dict_key = 'state_dict'`
			`if use_ema and 'state_dict_ema' in checkpoint:`
			`state_dict_key = 'state_dict_ema'`
			`if state_dict_key and state_dict_key in checkpoint:`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`new_state_dict = OrderedDict()`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`for k, v in checkpoint[state_dict_key].items():`
			# strip `module.` prefix
			`name = k[7:] if k.startswith('module') else k`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`new_state_dict[name] = v`
			`model.load_state_dict(new_state_dict)`
			`else:`
			`model.load_state_dict(checkpoint)`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`print("=> Loaded {} from checkpoint '{}'".format(state_dict_key or 'weights', checkpoint_path))`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`else:`
			`print("=> Error: No checkpoint found at '{}'".format(checkpoint_path))`
			`raise FileNotFoundError()`


			`def resume_checkpoint(model, checkpoint_path, start_epoch=None):`
			`optimizer_state = None`
			`if os.path.isfile(checkpoint_path):`
			`checkpoint = torch.load(checkpoint_path)`
			`if isinstance(checkpoint, dict) and 'state_dict' in checkpoint:`
			`new_state_dict = OrderedDict()`
			`for k, v in checkpoint['state_dict'].items():`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`name = k[7:] if k.startswith('module') else k`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`new_state_dict[name] = v`
			`model.load_state_dict(new_state_dict)`
			`if 'optimizer' in checkpoint:`
			`optimizer_state = checkpoint['optimizer']`
			`start_epoch = checkpoint['epoch'] if start_epoch is None else start_epoch`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`print("=> Loaded checkpoint '{}' (epoch {})".format(checkpoint_path, checkpoint['epoch']))`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`else:`
			`model.load_state_dict(checkpoint)`
Add per model crop pct, interpolation defaults, tie it all together * create one resolve fn to pull together model defaults + cmd line args * update attribution comments in some models * test update train/validation/inference scripts 6 years ago			`start_epoch = 0 if start_epoch is None else start_epoch`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`print("=> Loaded checkpoint '{}'".format(checkpoint_path))`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`return optimizer_state, start_epoch`
			`else:`
Add exponential moving average for model weights + few other additions and cleanup * ModelEma class added to track an EMA set of weights for the model being trained * EMA handling added to train, validation and clean_checkpoint scripts * Add multi checkpoint or multi-model validation support to validate.py * Add syncbn option (APEX) to train script for experimentation * Cleanup interface of CheckpointSaver while adding ema functionality 5 years ago			`print("=> Error: No checkpoint found at '{}'".format(checkpoint_path))`
Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`raise FileNotFoundError()`


			`def load_pretrained(model, default_cfg, num_classes=1000, in_chans=3, filter_fn=None):`
Add ported Tensorflow EfficientNet B4/B5 weights 5 years ago			`if 'url' not in default_cfg or not default_cfg['url']:`
			`print("Warning: pretrained model URL is invalid, using random initialization.")`
			`return`

Uniform pretrained model handling. * All models have 'default_cfgs' dict * load/resume/pretrained helpers factored out * pretrained load operates on state_dict based on default_cfg * test all models in validate * schedule, optim factor factored out * test time pool wrapper applied based on default_cfg 6 years ago			`state_dict = model_zoo.load_url(default_cfg['url'])`

			`if in_chans == 1:`
			`conv1_name = default_cfg['first_conv']`
			`print('Converting first conv (%s) from 3 to 1 channel' % conv1_name)`
			`conv1_weight = state_dict[conv1_name + '.weight']`
			`state_dict[conv1_name + '.weight'] = conv1_weight.sum(dim=1, keepdim=True)`
			`elif in_chans != 3:`
			`assert False, "Invalid in_chans for pretrained weights"`

			`strict = True`
			`classifier_name = default_cfg['classifier']`
			`if num_classes == 1000 and default_cfg['num_classes'] == 1001:`
			`# special case for imagenet trained models with extra background class in pretrained weights`
			`classifier_weight = state_dict[classifier_name + '.weight']`
			`state_dict[classifier_name + '.weight'] = classifier_weight[1:]`
			`classifier_bias = state_dict[classifier_name + '.bias']`
			`state_dict[classifier_name + '.bias'] = classifier_bias[1:]`
			`elif num_classes != default_cfg['num_classes']:`
			`# completely discard fully connected for all other differences between pretrained and created model`
			`del state_dict[classifier_name + '.weight']`
			`del state_dict[classifier_name + '.bias']`
			`strict = False`

			`if filter_fn is not None:`
			`state_dict = filter_fn(state_dict)`

			`model.load_state_dict(state_dict, strict=strict)`