Source Code of tv.floe.metronome.deeplearning.neuralnetwork.core.learning.AdagradLearningRate

package tv.floe.metronome.deeplearning.neuralnetwork.core.learning;


import java.io.DataInput;
import java.io.DataInputStream;
import java.io.DataOutput;
import java.io.DataOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.ObjectInputStream;
import java.io.OutputStream;


import org.apache.mahout.math.DenseMatrix;
import org.apache.mahout.math.Matrix;
import org.apache.mahout.math.MatrixWritable;


import tv.floe.metronome.math.MatrixUtils;


/**
 * 
 * Vectorized Learning Rate used per Connection Weight
 * 
 * @author josh
 *
 */
public class AdagradLearningRate {


  private double masterStepSize = 1e-3; // default for masterStepSize (this is the numerator)
  public Matrix historicalGradient;
  public Matrix adjustedGradient;
  public double fudgeFactor = 0.000001;
  public Matrix gradient;
  public int rows;
  public int cols;
  private int numIterations = 0;
  private double lrDecay = 0.95;
  private boolean decayLr;
  private double minLearningRate = 1e-4;


//  public double autoCorrect = 0.95;  


  public AdagradLearningRate( int rows, int cols, double gamma) {


    this.rows = rows;
    this.cols = cols;


    this.adjustedGradient = new DenseMatrix(rows, cols);
    this.adjustedGradient.assign( 0.0 );


    this.historicalGradient = new DenseMatrix(rows, cols);
    this.historicalGradient.assign( 0.0 );


    this.masterStepSize = gamma;
    this.decayLr = false;


    // gonna default init this for serde purposes
    this.gradient = new DenseMatrix(rows, cols);
    this.gradient.assign( 0.0 );


  }


  public AdagradLearningRate( int rows, int cols) {


    this( rows, cols, 0.01 );


  }






  public Matrix getLearningRates(Matrix gradient) {
        Matrix gradientSquared = MatrixUtils.pow(gradient,2);
    this.gradient = gradient.clone();
        this.historicalGradient = this.historicalGradient.plus(gradientSquared);
    double currentLearningRate = this.masterStepSize;
    if(decayLr && numIterations > 0) {
      this.masterStepSize *= lrDecay;
      if(masterStepSize < minLearningRate)
        masterStepSize = minLearningRate;
    }


    numIterations++;
    
    
    this.adjustedGradient = MatrixUtils.div(this.gradient,MatrixUtils.sqrt(gradientSquared.plus(fudgeFactor)));
        this.adjustedGradient = this.adjustedGradient.times(masterStepSize);
    //ensure no zeros
//    this.adjustedGradient.addi(1e-6);
    this.adjustedGradient = this.adjustedGradient.plus( 1e-6 );
    
    
    return adjustedGradient;
  }
  
  public AdagradLearningRate clone() {
    
    AdagradLearningRate ret = new AdagradLearningRate( this.rows, this.cols );
    ret.adjustedGradient.assign( this.adjustedGradient );
    //ret.autoCorrect = this.autoCorrect;
    ret.decayLr = this.decayLr;
    ret.fudgeFactor = this.fudgeFactor;
    if ( null == this.gradient ) {
      ret.gradient = null;
    } else {
      ret.gradient.assign( this.gradient );
    }
    ret.historicalGradient.assign( this.historicalGradient );
    ret.masterStepSize = this.masterStepSize;
    
    return ret;
    
  }
  
  public  double getMasterStepSize() {
    return masterStepSize;
  }


  public  void setMasterStepSize(double masterStepSize) {
    this.masterStepSize = masterStepSize;
  }


  public synchronized boolean isDecayLr() {
    return decayLr;
  }


  public synchronized void setDecayLr(boolean decayLr) {
    this.decayLr = decayLr;
  }
  
  
  /**
   * Serializes this to the output stream.
   * @param os the output stream to write to
   */
  public void write(OutputStream os) {
    try {


        DataOutput d = new DataOutputStream(os);
        
      d.writeDouble( masterStepSize );
      
      MatrixWritable.writeMatrix( d, historicalGradient );
      MatrixWritable.writeMatrix( d, adjustedGradient );
      
      d.writeDouble( fudgeFactor );
      
      MatrixWritable.writeMatrix( d, gradient );
      
      d.writeInt( rows );
      d.writeInt( cols );
      d.writeInt( numIterations );
      
      d.writeDouble( lrDecay );
      d.writeBoolean(  decayLr );
      d.writeDouble( minLearningRate );
        
        
        
    } catch (IOException e) {
      throw new RuntimeException(e);
    }


  }  
  
  /**
   * Load (using {@link ObjectInputStream}
   * @param is the input stream to load from (usually a file)
   */
  public void load(InputStream is) {
    try {


      DataInput di = new DataInputStream(is);
      
      masterStepSize = di.readDouble();
      
      historicalGradient = MatrixWritable.readMatrix( di );
      adjustedGradient = MatrixWritable.readMatrix( di );
      
      fudgeFactor = di.readDouble();
      
      gradient = MatrixWritable.readMatrix( di );
      
      rows = di.readInt();
      cols = di.readInt();
      numIterations = di.readInt();
      
      lrDecay = di.readDouble();
      decayLr = di.readBoolean();
      minLearningRate = di.readDouble();      
      
    } catch (Exception e) {
      throw new RuntimeException(e);
    }


  }  
  
  


}
Source Code of tv.floe.metronome.deeplearning.neuralnetwork.core.learning.AdagradLearningRate

Related Classes of tv.floe.metronome.deeplearning.neuralnetwork.core.learning.AdagradLearningRate