-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrbmsemisuplearn.py
111 lines (95 loc) · 4.55 KB
/
rbmsemisuplearn.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
from rbmpygivenx import rbmpygivenx
import numpy as np
from rbmgenerative import rbmgenerative
from rbmdiscriminative import rbmdiscriminative
import sys
sys.path.insert(0, './util/')
from samplematrix import samplematrix
# rbmsemisuplearn semisupervised learning function
# Combines unsupervised training objective with either
# hybrid, discriminative or generative training using the formula:
#
# L = L_type + L_unsup*opts.semisup_beta
#
# for a description of the semi-supervised training objective see ref [2]
# INPUTS:
# rbm : a rbm struct
# x : the initial state of the hidden units
# ey : one hot encoded labels if classRBM otherwise empty
# opts : opts struct. opts.train_type determines if CD or PCD should
#        be used for generative training. opts.cdn determines the
#        number of gibbs steps.
#        opts.hybrid_alpha determines the weighting of hybrid and
#        generative training.
# chains_comb : PCD chains for opts.semisup_type and semisupervised train
#               func
# chainsy_type : PCD chains for the training func det. by opts.semisup_type
#
# OUTPUTS
# A grads struct with the fields:
# grads.dw : w weights chainge normalized by minibatch size
# grads.db : bias of visible layer weight change norm by minibatch size
# (db is zero for the discriminative RBM)
# grads.dc : bias of hidden layer weight change norm by minibatch size
# grads.du : class label layer weight change norm by minibatch size
# grads.dd : class label hidden bias weight change norm by minibatch size
# curr_err : not used returns 0
# chains_comb : updated PCD chains
# chainsy_type : updated PCD chains
#
#
#
# References
# [1] H. Larochelle and Y. Bengio, "Classification using discriminative
#     restricted Boltzmann machines," in Proc. 25th Int. Conf. on Machine
#     Learning (ICML), 2008.
# [2] H. Larochelle, M. Mandel, R. Pascanu and Y. Bengio, "Learning
#     algorithms for the classification restricted Boltzmann machine,"
#     Journal of Machine Learning Research, 2012.
#
# NOTATION
# data : all data given as [n_samples x #vis]
# v : all data given as [n_samples x #vis]
# ey : all data given as [n_samples x #n_classes]
# W : vis - hid weights [ #hid x #vis ]
# U : label - hid weights [ #hid x #n_classes ]
# b : bias of visible layer [ #vis x 1]
# c : bias of hidden layer [ #hid x 1]
# d : bias of label layer [ #n_classes x 1]
#
# See also RBMGENERATIVE, RBMDISCRIMINATIVE RBMHYBRID
#
# Copyright Søren Sønderby June 2014
# TODO(review): chains are split/re-stacked below; verify that the correct
# chain rows are routed to the semisup vs. type objectives.
def rbmsemisuplearn(rbm, x, ey, opts, chains_comb, chainsy_comb):
    """Compute gradients for semi-supervised RBM training.

    Combines an unsupervised generative objective (on opts.x_semisup_batch,
    with labels sampled from p(y | x)) with the supervised objective chosen
    by opts.semisup_type (generative, discriminative or hybrid):

        L = L_type + opts.semisup_beta * L_unsup

    Parameters
    ----------
    rbm          : rbm struct (weights W, U and biases b, c, d)
    x            : labeled minibatch [n_samples x #vis]
    ey           : one-hot encoded labels [n_samples x #n_classes]
    opts         : options struct; fields used here: traintype, batchsize,
                   semisup_type, semisup_beta, x_semisup_batch
    chains_comb  : stacked PCD visible chains (semisup rows first, then the
                   rows for the opts.semisup_type objective); unused for CD
    chainsy_comb : stacked PCD label chains, same row layout

    Returns
    -------
    grads        : dict with fields dw, db, dc, du, dd — the combined,
                   minibatch-normalized weight/bias gradients
    curr_err     : always 0 (not used)
    chains_comb  : updated stacked PCD chains (single array for PCD)
    chainsy_comb : updated stacked PCD label chains
    """
    if opts.traintype == 'PCD':
        # The first opts.batchsize rows are the semi-supervised chains, the
        # remaining rows belong to the supervised training-type objective.
        # BUGFIX: the original sliced from opts.batchsize+2, silently
        # dropping two chain rows on every update (a leftover from 1-based
        # MATLAB indexing); the remainder must start at opts.batchsize.
        chains_semisup = chains_comb[0:opts.batchsize, :]
        chains_type = chains_comb[opts.batchsize:, :]
        chainsy_semisup = chainsy_comb[0:opts.batchsize, :]
        chainsy_type = chainsy_comb[opts.batchsize:, :]
    else:
        # CD training keeps no persistent chains.
        chains_semisup = []
        chains_type = []
        chainsy_semisup = []
        chainsy_type = []

    # Unsupervised part: sample labels from p(y | x) for the unlabeled batch
    # and take a generative gradient step with those sampled labels.
    ey_semisup, _ = rbmpygivenx(rbm, x, 'train')
    ey_semisup = samplematrix(ey_semisup)
    grads_semisup, _, chains_semisup, chainsy_semisup = rbmgenerative(
        rbm, opts.x_semisup_batch, ey_semisup, opts,
        chains_semisup, chainsy_semisup)

    # Supervised part: @rbmhybrid, @rbmgenerative or @rbmdiscriminative,
    # selected by opts.semisup_type. Here we do have real labels.
    grads_type, _, chains_type, chainsy_type = opts.semisup_type(
        rbm, x, ey, opts, chains_type, chainsy_type)

    if opts.traintype == 'PCD':
        # BUGFIX: re-stack the chains into a single array so the row slicing
        # above works on the next minibatch. The original returned a Python
        # list, which cannot be indexed with [a:b, :].
        chains_comb = np.concatenate([chains_semisup, chains_type], axis=0)
        chainsy_comb = np.concatenate([chainsy_semisup, chainsy_type], axis=0)
    else:
        # Chains are unused for CD; preserve the original placeholder shape.
        chains_comb = [chains_semisup, chains_type]
        chainsy_comb = [chainsy_semisup, chainsy_type]

    beta = opts.semisup_beta
    grads = {
        'dw': grads_type['dw'] + beta * grads_semisup['dw'],
        # db/dc of the two objectives may come back with different array
        # shapes (e.g. column vs. flat vectors), so coerce the generative
        # gradient to the type gradient's shape before adding.
        'db': grads_type['db'] + beta * np.reshape(grads_semisup['db'],
                                                   grads_type['db'].shape),
        'dc': grads_type['dc'] + beta * np.reshape(grads_semisup['dc'],
                                                   grads_type['dc'].shape),
        'du': grads_type['du'] + beta * grads_semisup['du'],
        'dd': grads_type['dd'] + beta * grads_semisup['dd'],
    }
    curr_err = 0  # error is not tracked for semi-supervised updates
    return grads, curr_err, chains_comb, chainsy_comb