Consider the situation where I would like to restore all weights till the last layer.
# args has the model name, num classes and other irrelevant stuff
self._model = models.__dict__[args.arch](pretrained = False,
num_classes = args.classes,
aux_logits = False)
if self.args.pretrained:
print("=> using pre-trained model '{}'".format(args.arch))
pretrained_state = model_zoo.load_url(model_names[args.arch])
model_state = self._model.state_dict()
pretrained_state = { k:v for k,v in pretrained_state.iteritems() if k in model_state and v.size() == model_state[k].size() }
model_state.update(pretrained_state)
self._model.load_state_dict(model_state)
Shouldn’t we also be checking if the sizes match before restoring? It looks like we are comparing only the names.