@agibsonccc
Created August 27, 2014 02:07
package org.deeplearning4j.nn.api;

import java.io.Serializable;
import java.util.Map;

import org.apache.commons.math3.distribution.RealDistribution;
import org.apache.commons.math3.random.RandomGenerator;

import org.deeplearning4j.berkeley.Pair;
import org.deeplearning4j.linalg.api.ndarray.INDArray;
import org.deeplearning4j.nn.Output;
import org.deeplearning4j.nn.WeightInit;
import org.deeplearning4j.nn.gradient.NeuralNetworkGradient;
import org.deeplearning4j.nn.learning.AdaGrad;
import org.deeplearning4j.optimize.NeuralNetEpochListener;
/**
 * A single-layer neural network, typically one with the objective
 * function of reconstructing its input; also called a feature detector
 * @author Adam Gibson
 */
public interface NeuralNetwork extends Serializable, Cloneable, NeuralNetEpochListener, Output {
    /**
     * Optimization algorithm to use
     * @author Adam Gibson
     */
    public static enum OptimizationAlgorithm {
        GRADIENT_DESCENT, CONJUGATE_GRADIENT, HESSIAN_FREE
    }
    /**
     * Which loss function to use
     * @author Adam Gibson
     */
    public static enum LossFunction {
        SQUARED_LOSS, RECONSTRUCTION_CROSSENTROPY, NEGATIVELOGLIKELIHOOD, MSE, RMSE_XENT
    }
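    // Hypothetical usage sketch (not part of the interface): selecting an
    // optimization algorithm and loss function on some implementation `net`
    // via the setters declared below:
    //   net.setOptimizationAlgorithm(OptimizationAlgorithm.CONJUGATE_GRADIENT);
    //   net.setLossFunction(LossFunction.RECONSTRUCTION_CROSSENTROPY);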
    /**
     * Clears the input from the neural net
     */
    public void clearInput();

    /**
     * Whether to cache the input at training time
     * @return true if the input should be cached at training time, otherwise false
     */
    public boolean cacheInput();
    /**
     * Backprop with the output being the reconstruction
     * @param lr the learning rate to use
     * @param epochs the max number of epochs to run
     * @param extraParams implementation-specific params
     */
    public void backProp(float lr, int epochs, Object[] extraParams);
    /**
     * The loss function for this network
     * @return the loss function for this network
     */
    public LossFunction getLossFunction();
    public void setLossFunction(LossFunction lossFunction);
    /**
     * The optimization algorithm.
     * SGD and CG are currently supported
     * @return the optimization algorithm for this network
     */
    public OptimizationAlgorithm getOptimizationAlgorithm();
    public void setOptimizationAlgorithm(OptimizationAlgorithm optimizationAlgorithm);
    /**
     * Whether to normalize gradients by the number of input rows
     */
    public boolean normalizeByInputRows();

    // Layer dimensions: number of visible (input) and hidden units
    public int getnVisible();
    public void setnVisible(int nVisible);
    public int getnHidden();
    public void setnHidden(int nHidden);

    // Parameters: weight matrix, hidden bias, and visible bias
    public INDArray getW();
    public void setW(INDArray w);
    public INDArray gethBias();
    public void sethBias(INDArray hBias);
    public INDArray getvBias();
    public void setvBias(INDArray vBias);

    // Random number generator used for sampling
    public RandomGenerator getRng();
    public void setRng(RandomGenerator rng);

    // The current input to the network
    public INDArray getInput();
    public void setInput(INDArray input);

    // Weight initialization scheme
    public WeightInit getWeightInit();
    public void setWeightInit(WeightInit weightInit);

    // Loss values with respect to the current input
    public float squaredLoss();
    public float negativeLogLikelihood();

    // Sparsity target and the distribution used for weight initialization
    public float getSparsity();
    public void setSparsity(float sparsity);
    public void setDist(RealDistribution dist);
    public RealDistribution getDist();
    /**
     * Transform the given input, i.e., propagate it through the network
     * and return the resulting activation
     * @param input the input to transform
     * @return the transformed input
     */
    public INDArray transform(INDArray input);

    // Mean of the hidden bias
    public INDArray hBiasMean();
    // AdaGrad state for the weight matrix
    public AdaGrad getAdaGrad();
    public void setAdaGrad(AdaGrad adaGrad);

    // Whether to apply regularization
    public void setUseRegularization(boolean useRegularization);
    public boolean isUseRegularization();

    // AdaGrad state for the hidden and visible biases
    public AdaGrad gethBiasAdaGrad();
    public void setHbiasAdaGrad(AdaGrad adaGrad);
    public AdaGrad getVBiasAdaGrad();
    public void setVBiasAdaGrad(AdaGrad adaGrad);

    // Gradient for this network; params are implementation specific
    public NeuralNetworkGradient getGradient(Object[] params);
    public void setConstrainGradientToUnitNorm(boolean constrainGradientToUnitNorm);
    /**
     * Whether to constrain the gradient to unit norm or not
     * @return true if the gradient is constrained to unit norm, false otherwise
     */
    public boolean isConstrainGradientToUnitNorm();
    /**
     * L2 regularization coefficient
     * @return the L2 regularization coefficient
     */
    public float getL2();
    public void setL2(float l2);
    /**
     * Mean squared error. Used for regression tasks
     * @return the mean squared error with respect to the output
     * of the network
     */
    public float mse();
    /**
     * Root mean squared error on the reconstruction
     * @return the RMSE of the reconstruction with respect to the input
     */
    public float mseRecon();
    // Momentum for gradient updates
    public float getMomentum();
    public void setMomentum(float momentum);

    // How often (in iterations) to render debugging output
    public void setRenderEpochs(int renderEpochs);
    public int getRenderIterations();

    // A transposed copy of this network, and a deep copy
    public NeuralNetwork transpose();
    public NeuralNetwork clone();

    // Fan-in, used to scale weight initialization
    public float fanIn();
    public void setFanIn(float fanIn);
    /**
     * Sample the hidden mean and a sample
     * given the visible input
     * @param v the visible input
     * @return a pair of (mean, sample)
     */
    public Pair<INDArray, INDArray> sampleHiddenGivenVisible(INDArray v);

    public boolean isUseAdaGrad();

    // Dropout probability to apply during training
    public void setDropOut(float dropOut);
    public float dropOut();
    /**
     * Sample the visible mean and a sample
     * given the hidden input
     * @param h the hidden input
     * @return a pair of (mean, sample)
     */
    public Pair<INDArray, INDArray> sampleVisibleGivenHidden(INDArray h);
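    // Sketch: one Gibbs sampling step composed from the two methods above,
    // assuming `net` is some implementation and `v` a batch of visible units:
    //   Pair<INDArray, INDArray> h = net.sampleHiddenGivenVisible(v);
    //   Pair<INDArray, INDArray> vPrime = net.sampleVisibleGivenHidden(h.getSecond());
    //   // h.getFirst() is the mean activation; h.getSecond() is the sample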
    // Reset the AdaGrad history with the given learning rate
    public void resetAdaGrad(float lr);
    public void iterationDone(int epoch);
    public float l2RegularizedCoefficient();

    // Whether biases are concatenated (implementation specific)
    public void setConcatBiases(boolean concatBiases);
    public boolean isConcatBiases();
    /**
     * Error on reconstruction
     * @return the reconstruction cross entropy for the current input
     */
    public float getReConstructionCrossEntropy();
    /**
     * Run one iteration
     * @param input the input to iterate on
     * @param lr the learning rate to use
     * @param params the extra params for the neural network (k, corruption level, max epochs, ...)
     */
    public void iterate(INDArray input, float lr, Object[] params);
    /**
     * Trains via an optimization algorithm such as SGD or Conjugate Gradient
     * @param input the input to train on
     * @param lr the learning rate to use
     * @param params the params (k, corruption level, max epochs, ...)
     */
    public void fit(INDArray input, float lr, Object[] params);
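    // Sketch: a single training call, assuming an RBM-like implementation
    // where params[0] is the contrastive-divergence k (an assumption; the
    // meaning of params is implementation specific):
    //   net.fit(input, 1e-2f, new Object[]{1});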
    /**
     * Performs a network merge in the form of
     * a += (b - a) / n
     * where a is a parameter matrix on this network,
     * b is the corresponding matrix on the incoming network,
     * and n is the batch size
     * @param network the network to merge with
     * @param batchSize the batch size (number of training examples)
     * to average by
     */
    public void merge(NeuralNetwork network, int batchSize);
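    // The merge update per parameter matrix, written with assumed elementwise
    // INDArray ops (addi = in-place add, sub = subtract, div = divide):
    //   a.addi(b.sub(a).div(batchSize));  // a += (b - a) / n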
    /**
     * Whether to apply sparsity or not
     * @return true if sparsity is applied, false otherwise
     */
    public boolean isApplySparsity();
    /**
     * Reset AdaGrad after n iterations
     * @return the number of iterations after which AdaGrad is reset
     */
    public int getResetAdaGradIterations();

    /**
     * Reset AdaGrad after n iterations
     * @param resetAdaGradEpochs the number of iterations after which to reset AdaGrad
     */
    public void setResetAdaGradIterations(int resetAdaGradEpochs);
    /**
     * Getter for the momentum schedule
     * @return a map from iteration number to the momentum to use from that iteration on
     */
    public Map<Integer, Float> getMomentumAfter();

    /**
     * Setter for the momentum schedule
     * @param momentumAfter a map from iteration number to the momentum to use from that iteration on
     */
    public void setMomentumAfter(Map<Integer, Float> momentumAfter);
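    // Sketch: a momentum schedule that starts at 0.5 and rises to 0.9 after
    // iteration 20 (keys are iteration numbers; exact lookup semantics are
    // implementation specific):
    //   Map<Integer, Float> schedule = new HashMap<>();
    //   schedule.put(0, 0.5f);
    //   schedule.put(20, 0.9f);
    //   net.setMomentumAfter(schedule);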
}
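
A minimal end-to-end sketch of driving a hypothetical implementation of this
interface (the concrete class, learning rate, and params below are assumptions,
not part of the gist):

    NeuralNetwork net = ...; // e.g. an RBM or denoising-autoencoder implementation
    net.setLossFunction(NeuralNetwork.LossFunction.RECONSTRUCTION_CROSSENTROPY);
    net.setOptimizationAlgorithm(NeuralNetwork.OptimizationAlgorithm.CONJUGATE_GRADIENT);
    net.fit(input, 1e-2f, new Object[]{1}); // assumed: params[0] is the CD k
    INDArray reconstruction = net.transform(input);
    float error = net.getReConstructionCrossEntropy();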