Source code for bob.learn.pytorch.architectures.MCCNNv2

#!/usr/bin/env python
# encoding: utf-8

import torch
import torch.nn as nn
import torch.nn.functional as F

import os
import numpy as np

import pkg_resources 
import bob.extension.download

import bob.io.base

from .utils import MaxFeatureMap
from .utils import group
from .utils import resblock

import logging
logger = logging.getLogger("bob.learn.pytorch")

class MCCNNv2(nn.Module):
    """The class defining MCCNNv2. It differs from MCCNN in that it uses
    shared layers for the layers which are not adapted, which avoids
    replicating the shared layers.

    Attributes
    ----------
    num_channels: int
        The number of channels present in the input
    lcnn_layers: list
        The adaptable layers present in the base LightCNN model
    module_dict: dict
        A dictionary containing module names and :py:class:`torch.nn.Module`
        elements as key, value pairs.
    layer_dict: :py:class:`torch.nn.ModuleDict`
        Pytorch class containing the modules as a dictionary.
    light_cnn_model_file: str
        Absolute path to the pretrained LightCNN model file.
    adapted_layers: str
        The layers to be adapted in training, separated by '-'.
        Example: 'conv1-block1-group1-ffc'; 'ffc' denotes the final fully
        connected layers, which are adapted in all cases.
    url: str
        The path to download the pretrained LightCNN model from.
    """

    def __init__(self, block=resblock, layers=[1, 2, 3, 4], num_channels=4,
                 adapted_layers='conv1-block1-group1-ffc', verbosity_level=2):
        """Init function

        Parameters
        ----------
        block: :py:class:`torch.nn.Module`
            The base block replicated inside the residual layers
        layers: list
            The number of blocks in each of the four residual layers
        num_channels: int
            The number of channels present in the input
        adapted_layers: str
            The layers to be adapted in training, separated by '-'.
            Example: 'conv1-block1-group1-ffc'; 'ffc' denotes the final
            fully connected layers, which are adapted in all cases.
        verbosity_level: int
            Verbosity level.
        """
        super(MCCNNv2, self).__init__()

        self.num_channels = num_channels
        self.lcnn_layers = ['conv1', 'block1', 'group1', 'block2', 'group2',
                            'block3', 'group3', 'block4', 'group4', 'fc']

        layers_present = self.lcnn_layers.copy()
        layers_present.append('ffc')

        # select the layers in the network to adapt
        adapted_layers_list = adapted_layers.split('-')

        assert 'ffc' in adapted_layers_list
        # ensure the layer names are valid
        assert set(adapted_layers_list) <= set(layers_present)

        # shared layers
        self.shared_layers = list(set(layers_present) - set(adapted_layers_list))
        self.domain_specific_layers = list(set(adapted_layers_list) - set(['ffc']))

        logger.setLevel(verbosity_level)

        self.pool1 = nn.MaxPool2d(kernel_size=2, stride=2, ceil_mode=True)
        self.pool2 = nn.MaxPool2d(kernel_size=2, stride=2, ceil_mode=True)
        self.pool3 = nn.MaxPool2d(kernel_size=2, stride=2, ceil_mode=True)
        self.pool4 = nn.MaxPool2d(kernel_size=2, stride=2, ceil_mode=True)

        # newly added FC layers
        self.linear1fc = nn.Linear(256 * num_channels, 10)
        self.linear2fc = nn.Linear(10, 1)

        # add modules; channel 0 acts as the anchor
        module_dict = {}

        for i in range(self.num_channels):
            m_dict = {}
            m_dict['conv1'] = MaxFeatureMap(1, 48, 5, 1, 2)
            m_dict['block1'] = self._make_layer(block, layers[0], 48, 48)
            m_dict['group1'] = group(48, 96, 3, 1, 1)
            m_dict['block2'] = self._make_layer(block, layers[1], 96, 96)
            m_dict['group2'] = group(96, 192, 3, 1, 1)
            m_dict['block3'] = self._make_layer(block, layers[2], 192, 192)
            m_dict['group3'] = group(192, 128, 3, 1, 1)
            m_dict['block4'] = self._make_layer(block, layers[3], 128, 128)
            m_dict['group4'] = group(128, 128, 3, 1, 1)
            m_dict['fc'] = MaxFeatureMap(8 * 8 * 128, 256, type=0)

            # domain specific layers need one copy per channel
            for layer in self.domain_specific_layers:
                layer_name = "ch_{}_".format(i) + layer
                module_dict[layer_name] = m_dict[layer]

        m_dict = {}
        m_dict['conv1'] = MaxFeatureMap(1, 48, 5, 1, 2)
        m_dict['block1'] = self._make_layer(block, layers[0], 48, 48)
        m_dict['group1'] = group(48, 96, 3, 1, 1)
        m_dict['block2'] = self._make_layer(block, layers[1], 96, 96)
        m_dict['group2'] = group(96, 192, 3, 1, 1)
        m_dict['block3'] = self._make_layer(block, layers[2], 192, 192)
        m_dict['group3'] = group(192, 128, 3, 1, 1)
        m_dict['block4'] = self._make_layer(block, layers[3], 128, 128)
        m_dict['group4'] = group(128, 128, 3, 1, 1)
        m_dict['fc'] = MaxFeatureMap(8 * 8 * 128, 256, type=0)

        # shared layers get the ch_0_ prefix to make loading from the
        # pretrained model easier
        for layer in self.shared_layers:
            layer_name = "ch_0_" + layer
            module_dict[layer_name] = m_dict[layer]

        self.layer_dict = nn.ModuleDict(module_dict)

        # check for the pretrained model; download it if it is not present
        light_cnn_model_file = os.path.join(MCCNNv2.get_mccnnv2path(),
                                            "LightCNN_29Layers_checkpoint.pth.tar")

        url = 'http://www.idiap.ch/software/bob/data/bob/bob.learn.pytorch/master/LightCNN_29Layers_checkpoint.pth.tar'

        logger.info("LightCNN model file path: {}".format(light_cnn_model_file))

        if not os.path.exists(light_cnn_model_file):
            bob.io.base.create_directories_safe(os.path.split(light_cnn_model_file)[0])
            logger.info('Downloading the LightCNN model')
            bob.extension.download.download_file(url, light_cnn_model_file)
            logger.info('Downloaded LightCNN model to location: {}'.format(light_cnn_model_file))

        # loading the pretrained model for ch_0
        self.load_state_dict(self.get_model_state_dict(light_cnn_model_file),
                             strict=False)

        # copy over the weights to all other domain specific layers
        # (every channel except the 0th)
        for layer in self.domain_specific_layers:
            for i in range(1, self.num_channels):
                self.layer_dict["ch_{}_".format(i) + layer].load_state_dict(
                    self.layer_dict["ch_0_" + layer].state_dict())

    def _make_layer(self, block, num_blocks, in_channels, out_channels):
        """Makes multiple copies of the same base module

        Parameters
        ----------
        block: :py:class:`torch.nn.Module`
            The base block to replicate
        num_blocks: int
            Number of copies of the block to be made
        in_channels: int
            Number of input channels for a block
        out_channels: int
            Number of output channels for a block
        """
        layers = []
        for i in range(0, num_blocks):
            layers.append(block(in_channels, out_channels))
        return nn.Sequential(*layers)
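
    # Layer-sharing scheme (illustrative): with the default
    # adapted_layers='conv1-block1-group1-ffc' and num_channels=4, the
    # ModuleDict holds one copy of each adapted layer per channel
    # (ch_0_conv1 ... ch_3_conv1), while each shared layer exists exactly
    # once under the ch_0_ prefix (e.g. ch_0_block2) and is reused by every
    # channel in forward().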
    def forward(self, img):
        """Propagates the data through the network

        Parameters
        ----------
        img: :py:class:`torch.Tensor`
            The data to forward through the network. Image of size
            num_channels x 128 x 128.

        Returns
        -------
        output: :py:class:`torch.Tensor`
            score
        """
        embeddings = []

        for i in range(self.num_channels):

            # returns the channel index for domain specific layers, and 0 for
            # shared layers, which are stored under the ch_0_ prefix
            common_layer = lambda x, y: x if self.lcnn_layers[y] in self.domain_specific_layers else 0

            x = img[:, i, :, :].unsqueeze(1)  # the image for the specific channel

            x = self.layer_dict["ch_{}_".format(common_layer(i, 0)) + self.lcnn_layers[0]](x)
            x = self.pool1(x)

            x = self.layer_dict["ch_{}_".format(common_layer(i, 1)) + self.lcnn_layers[1]](x)
            x = self.layer_dict["ch_{}_".format(common_layer(i, 2)) + self.lcnn_layers[2]](x)
            x = self.pool2(x)

            x = self.layer_dict["ch_{}_".format(common_layer(i, 3)) + self.lcnn_layers[3]](x)
            x = self.layer_dict["ch_{}_".format(common_layer(i, 4)) + self.lcnn_layers[4]](x)
            x = self.pool3(x)

            x = self.layer_dict["ch_{}_".format(common_layer(i, 5)) + self.lcnn_layers[5]](x)
            x = self.layer_dict["ch_{}_".format(common_layer(i, 6)) + self.lcnn_layers[6]](x)
            x = self.layer_dict["ch_{}_".format(common_layer(i, 7)) + self.lcnn_layers[7]](x)
            x = self.layer_dict["ch_{}_".format(common_layer(i, 8)) + self.lcnn_layers[8]](x)
            x = self.pool4(x)

            x = x.view(x.size(0), -1)
            fc = self.layer_dict["ch_{}_".format(common_layer(i, 9)) + self.lcnn_layers[9]](x)
            fc = F.dropout(fc, training=self.training)
            embeddings.append(fc)

        merged = torch.cat(embeddings, 1)

        output = self.linear1fc(merged)
        output = nn.Sigmoid()(output)
        output = self.linear2fc(output)
        output = nn.Sigmoid()(output)

        return output
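
    # Routing example (illustrative): with the default adapted_layers,
    # channel i=2 resolves 'conv1' (domain specific) to 'ch_2_conv1' but
    # 'block2' (shared) to 'ch_0_block2', since common_layer returns the
    # channel index only for adapted layers.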
    @staticmethod
    def get_mccnnv2path():
        """Returns the path where the downloaded models are stored."""
        return pkg_resources.resource_filename('bob.learn.pytorch', 'models')
    def get_model_state_dict(self, pretrained_model_path):
        """Loads the pretrained LightCNN model and remaps its weights

        Parameters
        ----------
        pretrained_model_path: str
            Absolute path to the LightCNN model file

        Returns
        -------
        new_state_dict: dict
            Dictionary with the LightCNN weights, with the keys renamed to
            match this model's ``layer_dict``
        """
        checkpoint = torch.load(pretrained_model_path,
                                map_location=lambda storage, loc: storage)
        state_dict = checkpoint['state_dict']

        # create a new OrderedDict whose keys do not contain the `module.`
        # prefix: 'module.<name>' becomes 'layer_dict.ch_0_<name>'
        from collections import OrderedDict
        new_state_dict = OrderedDict()
        for k, v in state_dict.items():
            name = 'layer_dict.ch_0_' + k[7:]  # remove `module.`
            new_state_dict[name] = v

        return new_state_dict
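
# Usage sketch: a minimal forward pass, assuming the LightCNN checkpoint can
# be downloaded from the idiap.ch URL above on first instantiation, and that
# the input is a 4-channel 128x128 image batch as expected by forward().
if __name__ == '__main__':
    model = MCCNNv2(num_channels=4, adapted_layers='conv1-block1-group1-ffc')
    model.eval()
    batch = torch.randn(2, 4, 128, 128)  # (batch, channels, height, width)
    with torch.no_grad():
        scores = model(batch)
    print(scores.shape)  # torch.Size([2, 1]); one score per sample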