package tv.floe.metronome.deeplearning.neuralnetwork.layer;
import org.apache.mahout.math.DenseMatrix;
import org.apache.mahout.math.Matrix;
import tv.floe.metronome.math.MatrixUtils;
/**
*
* DEPRECATED - NOT USED
*
*
* By assigning a softmax activation function, a generalization of the logistic function,
* on the output layer of the neural network (or a softmax component in a component-based
* neural network) for categorical target variables, the outputs can be interpreted
* as posterior probabilities.
* This is very useful in classification as it gives a certainty measure on classifications.
*
* @author josh
*
*/
@Deprecated
public class OutputLayer {

    // Vestigial: this class does not implement java.io.Serializable, so this id
    // is never consulted by serialization machinery; retained for compatibility.
    private static final long serialVersionUID = -7065564817460914364L;

    /** Number of input units feeding this layer. */
    public int numInputNeurons;

    /** Number of output units (i.e. number of label classes). */
    public int numOutputNeurons;

    /** Cached training examples, one example per row. */
    public Matrix inputTrainingData = null;

    /** Cached outcome labels, one label row per example (one-hot per MatrixUtils.ensureValidOutcomeMatrix). */
    public Matrix outputTrainingLabels = null;

    /** Connection weights, shape (numInputNeurons x numOutputNeurons), zero-initialized. */
    public Matrix connectionWeights;

    /** Bias terms held as a single row vector, shape (1 x numOutputNeurons), zero-initialized. */
    public Matrix biasTerms;

    /**
     * Builds an output layer with zeroed weights and biases.
     *
     * @param input  training examples (one per row); may be null and supplied later via train()
     * @param labels outcome labels (one row per example); may be null and supplied later via train()
     * @param nIn    number of input units
     * @param nOut   number of output units / label classes
     */
    public OutputLayer(Matrix input, Matrix labels, int nIn, int nOut) {
        this.inputTrainingData = input;
        this.outputTrainingLabels = labels;
        this.numInputNeurons = nIn;
        this.numOutputNeurons = nOut;

        this.connectionWeights = new DenseMatrix(nIn, nOut);
        this.connectionWeights.assign(0.0);

        // BUG FIX: previously allocated as (nOut x 1). Every consumer reads the
        // biases via biasTerms.viewRow(0) — on an (nOut x 1) matrix that view
        // holds a single element instead of all nOut biases — and the update in
        // train() adds the (1 x nOut) row of column means to it, a cardinality
        // mismatch for nOut > 1. Allocating as a (1 x nOut) row vector makes
        // viewRow(0) yield the full bias vector and the update dimension-consistent
        // (this also matches the original "Matrix.zeros(nOut)" intent).
        this.biasTerms = new DenseMatrix(1, nOut);
        this.biasTerms.assign(0.0);
    }

    /**
     * Convenience constructor for when labels are supplied later through
     * {@link #train(Matrix, Matrix, double)}.
     *
     * @param input training examples (one per row)
     * @param nIn   number of input units
     * @param nOut  number of output units / label classes
     */
    public OutputLayer(Matrix input, int nIn, int nOut) {
        this(input, null, nIn, nOut);
    }

    /**
     * Trains one step on the cached input/label matrices.
     *
     * @param learningRate step size for the gradient update
     */
    public void train(double learningRate) {
        train(inputTrainingData, outputTrainingLabels, learningRate);
    }

    /**
     * Trains one step on the given inputs against the cached labels.
     *
     * @param x            training examples (one per row)
     * @param learningRate step size for the gradient update
     */
    public void train(Matrix x, double learningRate) {
        train(x, outputTrainingLabels, learningRate);
    }

    /**
     * Objective function: the negative log likelihood of the cached training
     * data under the current weights/biases (softmax cross-entropy, averaged
     * over columns and negated).
     *
     * @return the negative log likelihood of the model
     */
    public double negativeLogLikelihood() {
        // p(label | input) = softmax(X * W + b), with the bias row broadcast
        // across all example rows.
        Matrix mult = this.inputTrainingData.times(connectionWeights);
        Matrix multPlusBias = MatrixUtils.addRowVector(mult, this.biasTerms.viewRow(0));
        Matrix sigAct = MatrixUtils.softmax(multPlusBias);

        // Cross-entropy: y .* log(p) + (1 - y) .* log(1 - p)
        Matrix eleMul = MatrixUtils.elementWiseMultiplication(this.outputTrainingLabels, MatrixUtils.log(sigAct));
        Matrix oneMinusLabels = MatrixUtils.oneMinus(this.outputTrainingLabels);
        Matrix logOneMinusSigAct = MatrixUtils.log(MatrixUtils.oneMinus(sigAct));
        Matrix labelsMulSigAct = MatrixUtils.elementWiseMultiplication(oneMinusLabels, logOneMinusSigAct);

        Matrix sum = eleMul.plus(labelsMulSigAct);
        Matrix colSumsMatrix = MatrixUtils.columnSums(sum);
        double matrixMean = MatrixUtils.mean(colSumsMatrix);
        return -matrixMean;
    }

    /**
     * Trains one gradient step on the given inputs and labels.
     *
     * The passed-in matrices are cached on this instance for subsequent calls
     * to the shorter train() overloads.
     *
     * @param input  the inputs to train on (one example per row)
     * @param labels the labels to train on (one row per example)
     * @param lr     the learning rate
     * @throws IllegalArgumentException if input and labels have differing row counts
     */
    public void train(Matrix input, Matrix labels, double lr) {
        MatrixUtils.ensureValidOutcomeMatrix(labels);
        // Validate BEFORE mutating cached state so a bad call cannot leave this
        // instance with mismatched input/label fields (previously the fields
        // were assigned first and the exception left the object half-updated).
        if (input.numRows() != labels.numRows()) {
            throw new IllegalArgumentException("Can't train on the 2 given inputs and labels");
        }
        this.inputTrainingData = input;
        this.outputTrainingLabels = labels;

        // Forward pass: p(label | input) = softmax(X * W + b)
        Matrix p_LabelsGivenInput = input.times(this.connectionWeights);
        p_LabelsGivenInput = MatrixUtils.softmax(MatrixUtils.addRowVector(p_LabelsGivenInput, this.biasTerms.viewRow(0)));

        // Gradient of softmax cross-entropy w.r.t. the pre-activation: y - p
        Matrix dy = labels.minus(p_LabelsGivenInput);

        // W += lr * X^T * dy
        Matrix baseConnectionUpdate = input.transpose().times(dy);
        this.connectionWeights = this.connectionWeights.plus(baseConnectionUpdate.times(lr));

        // b += lr * columnMeans(dy); both sides are (1 x numOutputNeurons) now
        // that biasTerms is allocated as a row vector.
        this.biasTerms = this.biasTerms.plus(MatrixUtils.columnMeans(dy).times(lr));
    }

    /**
     * Classifies the given input.
     *
     * Each output row is the softmax probability distribution over labels for
     * the corresponding input row.
     *
     * @param input examples to classify, one per row
     * @return a probability distribution for each row
     */
    public Matrix predict(Matrix input) {
        Matrix prediction = input.times(this.connectionWeights);
        prediction = MatrixUtils.softmax(MatrixUtils.addRowVector(prediction, this.biasTerms.viewRow(0)));
        return prediction;
    }
}