Source code for bob.learn.pytorch.architectures.ConditionalGAN

#!/usr/bin/env python
# encoding: utf-8

import torch
import torch.nn as nn


[docs]class ConditionalGAN_generator(nn.Module):
    """ Class implementating the conditional GAN generator

  This network is introduced in the following publication:
  Mehdi Mirza, Simon Osindero: "Conditional Generative Adversarial Nets"

  Attributes
  ----------
  ngpu : int
    The number of available GPU devices
  main : :py:class:`torch.nn.Sequential`
    The sequential container

  """

    def __init__(self, noise_dim, conditional_dim, channels=3, ngpu=1):
        """Init function

    Parameters
    ----------
    noise_dim : int
      The dimension of the noise 
    conditional_dim : int
      The dimension of the conditioning variable 
    channels : int
      The number of channels in the image 
    ngpu : int
      The number of available GPU devices

    """
        super(ConditionalGAN_generator, self).__init__()
        self.ngpu = ngpu
        self.conditional_dim = conditional_dim

        # output dimension
        ngf = 64

        self.main = nn.Sequential(
            # input is Z, going into a convolution
            nn.ConvTranspose2d(
                (noise_dim + conditional_dim), ngf * 8, 4, 1, 0, bias=False
            ),
            nn.BatchNorm2d(ngf * 8),
            nn.ReLU(True),
            # state size. (ngf*8) x 4 x 4
            nn.ConvTranspose2d(ngf * 8, ngf * 4, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ngf * 4),
            nn.ReLU(True),
            # state size. (ngf*4) x 8 x 8
            nn.ConvTranspose2d(ngf * 4, ngf * 2, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ngf * 2),
            nn.ReLU(True),
            # state size. (ngf*2) x 16 x 16
            nn.ConvTranspose2d(ngf * 2, ngf, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ngf),
            nn.ReLU(True),
            # state size. (ngf) x 32 x 32
            nn.ConvTranspose2d(ngf, channels, 4, 2, 1, bias=False),
            nn.Tanh()
            # state size. (nc) x 64 x 64
        )

[docs]    def forward(self, z, y):
        """Forward function

    Parameters
    ----------
    z : :py:class: `torch.autograd.Variable`
      The minibatch of noise.
    y : :py:class: `torch.autograd.Variable`
      The conditional one hot encoded vector for the minibatch.
    
    Returns
    -------
    :py:class:`torch.Tensor`
      the output of the generator (i.e. an image)
    
    """
        generator_input = torch.cat((z, y), 1)
        # if isinstance(generator_input.data, torch.cuda.FloatTensor) and self.ngpu > 1:
        #  output = nn.parallel.data_parallel(self.main, generator_input, range(self.ngpu))
        # else:
        #  output = self.main(generator_input)

        # let's assume that we will never face the case where more than a GPU is used ...
        output = self.main(generator_input)
        return output


[docs]class ConditionalGAN_discriminator(nn.Module):
    """ Class implementating the conditional GAN discriminator

  Attributes
  ----------
  conditional_dim: int
    The dimension of the conditioning variable.
  channels: int
    The number of channels in the input image (default: 3).
  ngpu : int
    The number of available GPU devices
  main : :py:class:`torch.nn.Sequential`
    The sequential container

  """

    def __init__(self, conditional_dim, channels=3, ngpu=1):
        """Init function

    Parameters
    ----------
    conditional_dim: int
      The dimension of the conditioning variable.
    channels: int
      The number of channels in the input image (default: 3).
    ngpu : int
      The number of available GPU devices
   
    """
        super(ConditionalGAN_discriminator, self).__init__()
        self.conditional_dim = conditional_dim
        self.ngpu = ngpu

        # input dimension
        ndf = 64
        self.main = nn.Sequential(
            # input is (nc) x 64 x 64
            nn.Conv2d((channels + conditional_dim), ndf, 4, 2, 1, bias=False),
            nn.LeakyReLU(0.2, inplace=True),
            # state size. (ndf) x 32 x 32
            nn.Conv2d(ndf, ndf * 2, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ndf * 2),
            nn.LeakyReLU(0.2, inplace=True),
            # state size. (ndf*2) x 16 x 16
            nn.Conv2d(ndf * 2, ndf * 4, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ndf * 4),
            nn.LeakyReLU(0.2, inplace=True),
            # state size. (ndf*4) x 8 x 8
            nn.Conv2d(ndf * 4, ndf * 8, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ndf * 8),
            nn.LeakyReLU(0.2, inplace=True),
            # state size. (ndf*8) x 4 x 4
            nn.Conv2d(ndf * 8, 1, 4, 1, 0, bias=False),
            nn.Sigmoid(),
        )

[docs]    def forward(self, images, y):
        """Forward function

    Parameters
    ----------
    images : :py:class: `torch.autograd.Variable`
      The minibatch of input images.
    y : :py:class: `torch.autograd.Variable`
      The corresponding conditional feature maps.
    
    Returns
    -------
    :py:class:`torch.Tensor`
      the output of the discriminator
    """
        input_discriminator = torch.cat((images, y), 1)
        # if isinstance(input_discriminator.data, torch.cuda.FloatTensor) and self.ngpu > 1:
        #  output = nn.parallel.data_parallel(self.main, input_discriminator, range(self.ngpu))
        # else:
        #  output = self.main(input_discriminator)

        # let's assume that we will never face the case where more than a GPU is used ...
        output = self.main(input_discriminator)
        return output.view(-1, 1).squeeze(1)