chen0040
diff --git a/README.md b/README.md
Lines changed: 1 addition & 1 deletion
diff --git a/pom.xml b/pom.xml
Lines changed: 1 addition & 1 deletion
diff --git a/src/main/java/com/github/chen0040/mlp/ann/MLP.java b/src/main/java/com/github/chen0040/mlp/ann/MLP.java
Lines changed: 5 additions & 3 deletions
diff --git a/src/main/java/com/github/chen0040/mlp/ann/MLPLayer.java b/src/main/java/com/github/chen0040/mlp/ann/MLPLayer.java
Lines changed: 13 additions & 10 deletions
diff --git a/src/main/java/com/github/chen0040/mlp/ann/MLPNet.java b/src/main/java/com/github/chen0040/mlp/ann/MLPNet.java
Lines changed: 8 additions & 20 deletions
diff --git a/src/main/java/com/github/chen0040/mlp/ann/MLPNeuron.java b/src/main/java/com/github/chen0040/mlp/ann/MLPNeuron.java
Lines changed: 11 additions & 18 deletions
diff --git a/src/main/java/com/github/chen0040/mlp/ann/regression/MLPRegression.java b/src/main/java/com/github/chen0040/mlp/ann/regression/MLPRegression.java
Lines changed: 7 additions & 1 deletion
diff --git a/src/main/java/com/github/chen0040/mlp/functions/BiPolarLogSig.java b/src/main/java/com/github/chen0040/mlp/functions/BiPolarLogSig.java
Lines changed: 0 additions & 14 deletions
diff --git a/src/main/java/com/github/chen0040/mlp/functions/IdentityFunction.java b/src/main/java/com/github/chen0040/mlp/functions/IdentityFunction.java
Lines changed: 0 additions & 16 deletions
diff --git a/src/main/java/com/github/chen0040/mlp/functions/LogSig.java b/src/main/java/com/github/chen0040/mlp/functions/LogSig.java
Lines changed: 7 additions & 0 deletions
@@ -9,7 +9,7 @@ Add the following dependency to your POM file:
 <dependency>
   <groupId>com.github.chen0040</groupId>
   <artifactId>java-ann-mlp</artifactId>
-  <version>1.0.1</version>
+  <version>1.0.2</version>
 </dependency>
 ```
 
 
@@ -6,7 +6,7 @@
 
     <groupId>com.github.chen0040</groupId>
     <artifactId>java-ann-mlp</artifactId>
-    <version>1.0.2</version>
+    <version>1.0.3</version>
 
     <licenses>
         <license>
 
@@ -1,7 +1,9 @@
 package com.github.chen0040.mlp.ann;
 import com.github.chen0040.data.frame.DataFrame;
 import com.github.chen0040.data.frame.DataRow;
+import com.github.chen0040.data.utils.Scaler;
 import com.github.chen0040.data.utils.transforms.Standardization;
+import com.github.chen0040.mlp.functions.RangeScaler;
 
 import java.util.ArrayList;
 import java.util.List;
@@ -12,7 +14,7 @@
  */
 public abstract class MLP extends MLPNet {
     private Standardization inputNormalization;
-    private Standardization outputNormalization;
+    private RangeScaler outputNormalization;
 
     private boolean normalizeOutputs;
 
@@ -22,7 +24,7 @@ public void copy(MLPNet rhs) throws CloneNotSupportedException {
 
         MLP rhs2 = (MLP)rhs;
         inputNormalization = rhs2.inputNormalization == null ? null : (Standardization)rhs2.inputNormalization.clone();
-        outputNormalization = rhs2.outputNormalization == null ? null : (Standardization)rhs2.outputNormalization.clone();
+        outputNormalization = rhs2.outputNormalization == null ? null : (RangeScaler) rhs2.outputNormalization.clone();
         normalizeOutputs = rhs2.normalizeOutputs;
     }
 
@@ -54,7 +56,7 @@ public void train(DataFrame batch, int training_epoches)
                     targets.add(target);
                 }
             }
-            outputNormalization = new Standardization(targets);
+            outputNormalization = new RangeScaler(targets);
         }
 
 
 
@@ -6,14 +6,13 @@
 import com.github.chen0040.mlp.functions.TransferFunction;
 
 import java.util.ArrayList;
-import java.util.Random;
+import java.util.List;
 
 
 //default network assumes input and output are in the range of [0, 1]
 public class MLPLayer implements Cloneable {
-	private static Random rand = new Random();
 	private TransferFunction transfer = new LogSig();
-    private ArrayList<MLPNeuron> neurons;
+    private List<MLPNeuron> neurons;
 
     public void copy(MLPLayer rhs){
         transfer = rhs.transfer == null ? null : (TransferFunction) ((AbstractTransferFunction)rhs.transfer).clone();
@@ -69,7 +68,7 @@ public void setTransfer(TransferFunction transfer) {
         this.transfer = transfer;
     }
 
-    public ArrayList<MLPNeuron> getNeurons() {
+    public List<MLPNeuron> getNeurons() {
         return neurons;
     }
 
@@ -90,7 +89,7 @@ public double[] forward_propagate(double[] input)
         return output;
 	}
 
-	protected void adjust_weights(double[] input, double learningRate, double momentum)
+	protected void adjust_weights(double[] input, double learningRate)
 	{
         for(int j=0; j< neurons.size(); j++)
         {
@@ -99,13 +98,12 @@ protected void adjust_weights(double[] input, double learningRate, double moment
             for(int i=0; i < dimension; ++i) {
 
                 double sink_error = neuron.error;
-                double dWeight = neuron.getWeightDelta(i);
+
                 double weight = neuron.getWeight(i);
 
                 double dw = learningRate * sink_error * input[i];
-                weight += (dw + momentum * dWeight);
-                dWeight = dw;
-                neuron.setWeightDelta(i, dWeight);
+                weight += dw;
+                neuron.setWeightDelta(i, dw);
                 neuron.setWeight(i, weight);
             }
         }
@@ -130,7 +128,10 @@ public double[] back_propagate(double[] error)
         {
             MLPNeuron neuron= neurons.get(i);
             double y = neuron.output;
-            neuron.error = y * (1-y) * error[i];
+            double[] values = neuron.values;
+            double hx = neuron.getValue(values);
+
+            neuron.error = transfer.gradient(hx, y) * error[i];
         }
 
         int k = dimension();
@@ -149,4 +150,6 @@ public double[] back_propagate(double[] error)
 
         return propagated_error;
 	}
+
+
 }
@@ -13,7 +13,7 @@
 //default network assumes input and output are in the range of [0, 1]
 public class MLPNet implements  Cloneable {
 	protected MLPLayer inputLayer =null;
-	protected MLPLayer outputLayer =null;
+	public MLPLayer outputLayer =null;
 
 	protected List<MLPLayer> hiddenLayers;
 
@@ -23,9 +23,6 @@ public class MLPNet implements  Cloneable {
 	@Setter
 	protected double learningRate =0.25; //learning rate
 
-	@Getter
-	@Setter
-	protected double momentum =0.9; //momentum term for \Delta w[i][j]
 
 	public void copy(MLPNet rhs) throws CloneNotSupportedException {
 		inputLayer = rhs.inputLayer == null ? null : (MLPLayer)rhs.inputLayer.clone();
@@ -37,7 +34,6 @@ public void copy(MLPNet rhs) throws CloneNotSupportedException {
 		}
 
 		learningRate = rhs.learningRate;
-		momentum = rhs.momentum;
 	}
 
 	public MLPLayer createInputLayer(int dimension){
@@ -55,7 +51,7 @@ public MLPLayer createOutputLayer(int dimension){
 
 	public MLPNet()
 	{
-		hiddenLayers = new ArrayList<MLPLayer>();
+		hiddenLayers = new ArrayList<>();
 	}
 
 
@@ -81,8 +77,10 @@ public double train(double[] input, double[] target)
 			propagated_output = hiddenLayers.get(i).forward_propagate(propagated_output);
 		}
 		propagated_output = outputLayer.forward_propagate(propagated_output);
-		
+
+
 		double error = get_target_error(target);
+
 
 		//backward propagate
 		double[] propagated_error = outputLayer.back_propagate(minus(target, propagated_output));
@@ -93,10 +91,10 @@ public double train(double[] input, double[] target)
 		//adjust weights
 		double[] input2 = inputLayer.output();
 		for(int i = 0; i < hiddenLayers.size(); ++i){
-			hiddenLayers.get(i).adjust_weights(input2, getLearningRate(), getMomentum());
+			hiddenLayers.get(i).adjust_weights(input2, getLearningRate());
 			input2 = hiddenLayers.get(i).output();
 		}
-		outputLayer.adjust_weights(input2, getLearningRate(), getMomentum());
+		outputLayer.adjust_weights(input2, getLearningRate());
 
 
 		return error; 
@@ -109,6 +107,7 @@ public double[] minus(double[] a, double[] b){
 		}
 		return c;
 	}
+
 
 	protected double get_target_error(double[] target)
 	{
@@ -124,17 +123,6 @@ protected double get_target_error(double[] target)
 		return t_error;
 	}
 
-	public double test(double[] input, double[] target)
-	{
-		double[] propagated_output = inputLayer.setOutput(input);
-		for(int i=0; i < hiddenLayers.size(); ++i) {
-			propagated_output = hiddenLayers.get(i).forward_propagate(propagated_output);
-		}
-		propagated_output = outputLayer.forward_propagate(propagated_output);
-		
-		return get_target_error(target);
-	}
-	
 	public double[] transform(double[] input)
 	{
 		double[] propagated_output = inputLayer.setOutput(input);
 
@@ -6,11 +6,13 @@
 
 
 public class MLPNeuron implements Cloneable {
-	public double bias_weight = 0;
-	public double bias = 0;
+	double bias_weight = 0;
+	private double bias = 0;
 
-	public double output = 0;
-	public double error = 0;
+	double output = 0;
+	double error = 0;
+
+	double[] values = null;
 
 	private static Random rand = new Random();
 
@@ -48,22 +50,12 @@ public double getWeight(int index){
         if(weights.containsKey(index)){
             return weights.get(index);
         }else{
-            double weight = rand.nextDouble() - 0.5;
+            double weight = (rand.nextDouble() - 0.5) / 10;
             weights.put(index, weight);
             return weight;
         }
     }
 
-    public double getWeightDelta(int index){
-        if(weightDeltas.containsKey(index)){
-            return weightDeltas.get(index);
-        }else{
-            double dweight = rand.nextDouble() - 0.5;
-            weightDeltas.put(index, dweight);
-            return dweight;
-        }
-    }
-
     public void setWeightDelta(int index, double val){
         weightDeltas.put(index, val);
     }
@@ -77,12 +69,13 @@ public MLPNeuron()
 		bias_weight =rand.nextDouble()-0.5;
 		bias =-1;
 
-        weights = new HashMap<Integer, Double>();
-        weightDeltas = new HashMap<Integer, Double>();
+        weights = new HashMap<>();
+        weightDeltas = new HashMap<>();
 	}
 
-	public double getValue(double[] x)
+	double getValue(double[] x)
 	{
+	   values = x;
 		double sum=0;
 
 		for(int i=0; i < x.length; i++)
 
@@ -2,6 +2,8 @@
 
 import com.github.chen0040.data.frame.DataFrame;
 import com.github.chen0040.data.frame.DataRow;
+import com.github.chen0040.mlp.functions.LogSig;
+import com.github.chen0040.mlp.functions.TransferFunction;
 import lombok.Getter;
 import lombok.Setter;
 
@@ -70,14 +72,18 @@ public void fit(DataFrame batch) {
         mlp = new MLPWithNumericOutput();
         mlp.setNormalizeOutputs(true);
 
+        TransferFunction transferFunction = new LogSig();
+
+
         int dimension = batch.row(0).toArray().length;
 
         mlp.setLearningRate(learningRate);
         mlp.createInputLayer(dimension);
         for (int hiddenLayerNeuronCount : hiddenLayers){
-            mlp.addHiddenLayer(hiddenLayerNeuronCount);
+            mlp.addHiddenLayer(hiddenLayerNeuronCount, transferFunction);
         }
         mlp.createOutputLayer(1);
+        mlp.outputLayer.setTransfer(transferFunction);
 
         mlp.train(batch, epoches);
     }
 
@@ -10,6 +10,13 @@ public double calculate(double x)
 		return 1/(Math.exp(-x)+1);
 	}
 
+
+	@Override public double gradient(double hx, double y) {
+		y = calculate(hx);
+		return y * (1-y);
+	}
+
+
 	@Override
 	public Object clone(){
 		return new LogSig();
Original file line number	Diff line number	Diff line change
`@@ -6,14 +6,13 @@`
`6`	`6`	`import com.github.chen0040.mlp.functions.TransferFunction;`
`7`	`7`
`8`	`8`	`import java.util.ArrayList;`
`9`		`-import java.util.Random;`
	`9`	`+import java.util.List;`
`10`	`10`
`11`	`11`
`12`	`12`	`//default network assumes input and output are in the range of [0, 1]`
`13`	`13`	`public class MLPLayer implements Cloneable {`
`14`		`- private static Random rand = new Random();`
`15`	`14`	`private TransferFunction transfer = new LogSig();`
`16`		`- private ArrayList<MLPNeuron> neurons;`
	`15`	`+ private List<MLPNeuron> neurons;`
`17`	`16`
`18`	`17`	`public void copy(MLPLayer rhs){`
`19`	`18`	`transfer = rhs.transfer == null ? null : (TransferFunction) ((AbstractTransferFunction)rhs.transfer).clone();`
`@@ -69,7 +68,7 @@ public void setTransfer(TransferFunction transfer) {`
`69`	`68`	`this.transfer = transfer;`
`70`	`69`	`}`
`71`	`70`
`72`		`- public ArrayList<MLPNeuron> getNeurons() {`
	`71`	`+ public List<MLPNeuron> getNeurons() {`
`73`	`72`	`return neurons;`
`74`	`73`	`}`
`75`	`74`
`@@ -90,7 +89,7 @@ public double[] forward_propagate(double[] input)`
`90`	`89`	`return output;`
`91`	`90`	`}`
`92`	`91`
`93`		`- protected void adjust_weights(double[] input, double learningRate, double momentum)`
	`92`	`+ protected void adjust_weights(double[] input, double learningRate)`
`94`	`93`	`{`
`95`	`94`	`for(int j=0; j< neurons.size(); j++)`
`96`	`95`	`{`
`@@ -99,13 +98,12 @@ protected void adjust_weights(double[] input, double learningRate, double moment`
`99`	`98`	`for(int i=0; i < dimension; ++i) {`
`100`	`99`
`101`	`100`	`double sink_error = neuron.error;`
`102`		`- double dWeight = neuron.getWeightDelta(i);`
	`101`	`+`
`103`	`102`	`double weight = neuron.getWeight(i);`
`104`	`103`
`105`	`104`	`double dw = learningRate * sink_error * input[i];`
`106`		`- weight += (dw + momentum * dWeight);`
`107`		`- dWeight = dw;`
`108`		`- neuron.setWeightDelta(i, dWeight);`
	`105`	`+ weight += dw;`
	`106`	`+ neuron.setWeightDelta(i, dw);`
`109`	`107`	`neuron.setWeight(i, weight);`
`110`	`108`	`}`
`111`	`109`	`}`
`@@ -130,7 +128,10 @@ public double[] back_propagate(double[] error)`
`130`	`128`	`{`
`131`	`129`	`MLPNeuron neuron= neurons.get(i);`
`132`	`130`	`double y = neuron.output;`
`133`		`- neuron.error = y * (1-y) * error[i];`
	`131`	`+ double[] values = neuron.values;`
	`132`	`+ double hx = neuron.getValue(values);`
	`133`	`+`
	`134`	`+ neuron.error = transfer.gradient(hx, y) * error[i];`
`134`	`135`	`}`
`135`	`136`
`136`	`137`	`int k = dimension();`
`@@ -149,4 +150,6 @@ public double[] back_propagate(double[] error)`
`149`	`150`
`150`	`151`	`return propagated_error;`
`151`	`152`	`}`
	`153`	`+`
	`154`	`+`
`152`	`155`	`}`