Use standardization as the default output scaling instead of the range scaler

chen0040 · chen0040 · commit 25ea87a1f279 · 2017-06-11T14:20:08.000+08:00
diff --git a/pom.xml b/pom.xml
@@ -501,7 +501,7 @@
         <dependency>
             <groupId>com.github.chen0040</groupId>
             <artifactId>java-data-frame</artifactId>
-            <version>1.0.9</version>
+            <version>1.0.11</version>
         </dependency>
 
 
diff --git a/src/main/java/com/github/chen0040/mlp/ann/MLP.java b/src/main/java/com/github/chen0040/mlp/ann/MLP.java
@@ -5,6 +5,8 @@
 import com.github.chen0040.mlp.enums.LearningMethod;
 import com.github.chen0040.mlp.enums.WeightUpdateMode;
 import com.github.chen0040.mlp.functions.RangeScaler;
+import lombok.Getter;
+import lombok.Setter;
 
 import java.util.ArrayList;
 import java.util.List;
@@ -13,14 +15,14 @@
 /**
  * Created by xschen on 21/8/15.
  */
+@Getter
+@Setter
 public abstract class MLP extends MLPNet {
     private Standardization inputNormalization;
-    private RangeScaler outputNormalization;
+    private Standardization outputNormalization = new Standardization();
 
     private boolean adaptiveLearningRateEnabled = false;
 
-
-
     private boolean normalizeOutputs;
 
     public MLP(){
@@ -55,7 +57,7 @@ public void train(DataFrame batch, int training_epoches)
                     targets.add(target);
                 }
             }
-            outputNormalization = new RangeScaler(targets);
+            outputNormalization.fit(targets);
         }
 
         double[][][] dE_dwji_prev = null;
diff --git a/src/main/java/com/github/chen0040/mlp/ann/regression/MLPRegression.java b/src/main/java/com/github/chen0040/mlp/ann/regression/MLPRegression.java
@@ -2,9 +2,11 @@
 
 import com.github.chen0040.data.frame.DataFrame;
 import com.github.chen0040.data.frame.DataRow;
+import com.github.chen0040.data.utils.transforms.Standardization;
 import com.github.chen0040.mlp.enums.LearningMethod;
 import com.github.chen0040.mlp.enums.WeightUpdateMode;
 import com.github.chen0040.mlp.functions.Identity;
+import com.github.chen0040.mlp.functions.RangeScaler;
 import com.github.chen0040.mlp.functions.Sigmoid;
 import com.github.chen0040.mlp.functions.TransferFunction;
 import lombok.Getter;
@@ -61,6 +63,10 @@ public void enabledAdaptiveLearningRate(boolean enabled){
     @Setter
     private double learningRate = 0.2;
 
+    @Getter
+    @Setter
+    private Standardization outputNormalization = new Standardization();
+
     public MLPRegression(){
         epoches = 1000;
 
@@ -89,6 +95,7 @@ public void fit(DataFrame batch) {
 
         mlp = new MLPWithNumericOutput();
         mlp.setNormalizeOutputs(true);
+        mlp.setOutputNormalization(outputNormalization);
         mlp.setMiniBatchSize(miniBatchSize);
         mlp.setLearningMethod(learningMethod);
         mlp.setWeightUpdateMode(weightUpdateMode);
diff --git a/src/main/java/com/github/chen0040/mlp/functions/RangeScaler.java b/src/main/java/com/github/chen0040/mlp/functions/RangeScaler.java
@@ -1,6 +1,7 @@
 package com.github.chen0040.mlp.functions;
 
 
+import com.github.chen0040.data.utils.transforms.Standardization;
 import lombok.Getter;
 import lombok.Setter;
 
@@ -14,13 +15,14 @@
  */
 @Getter
 @Setter
-public class RangeScaler implements Cloneable {
+public class RangeScaler extends Standardization {
 
    private final Map<Integer, Double> minValue = new HashMap<>();
    private final Map<Integer, Double> maxValue = new HashMap<>();
 
 
-   public RangeScaler(List<double[]> targets) {
+   @Override
+   public void fit(List<double[]> targets) {
       for(int i = 0; i < targets.size(); ++i){
          double[] values = targets.get(i);
          for(int j=0; j < values.length; ++j) {
@@ -42,6 +44,7 @@ public Object clone() throws CloneNotSupportedException {
    }
 
 
+   @Override
    public double[] standardize(double[] target) {
       double[] result = new double[target.length];
       for(int i=0; i < result.length; ++i){
@@ -51,6 +54,7 @@ public double[] standardize(double[] target) {
    }
 
 
+   @Override
    public double[] revert(double[] target) {
       double[] result = new double[target.length];
       for(int i=0; i < result.length; ++i){
diff --git a/src/test/java/com/github/chen0040/mlp/ann/regression/MLPRegressionUnitTest.java b/src/test/java/com/github/chen0040/mlp/ann/regression/MLPRegressionUnitTest.java
@@ -5,9 +5,11 @@
 import com.github.chen0040.data.frame.DataQuery;
 import com.github.chen0040.data.frame.Sampler;
 import com.github.chen0040.data.utils.TupleTwo;
+import com.github.chen0040.data.utils.transforms.Standardization;
 import com.github.chen0040.mlp.enums.LearningMethod;
 import com.github.chen0040.mlp.enums.WeightUpdateMode;
 import com.github.chen0040.mlp.functions.Identity;
+import com.github.chen0040.mlp.functions.RangeScaler;
 import com.github.chen0040.mlp.functions.ReLU;
 import com.github.chen0040.mlp.functions.Sigmoid;
 import com.github.chen0040.mlp.utils.FileUtils;
@@ -40,18 +42,33 @@ public static double randn(){
       return r * Math.sin(theta);
    }
 
+  
+
    @Test
-   public void testSimple() {
-      InputStream inputStream = FileUtils.getResource("heart_scale");
+   public void test_simple_regression() {
+      DataQuery.DataFrameQueryBuilder schema = DataQuery.blank()
+              .newInput("x1")
+              .newInput("x2")
+              .newOutput("y")
+              .end();
+
+      // y = 4 + 0.5 * x1 + 0.2 * x2
+      Sampler.DataSampleBuilder sampler = new Sampler()
+              .forColumn("x1").generate((name, index) -> randn() * 0.3 + index / 100.0)
+              .forColumn("x2").generate((name, index) -> randn() * 0.3 + index * index / 10000.0)
+              .forColumn("y").generate((name, index) -> 4 + 0.5 * index / 100.0 + 0.2 * index * index / 10000.0 + randn() * 0.3)
+              .end();
 
-      DataFrame dataFrame = DataQuery.libsvm().from(inputStream).build();
+      DataFrame data = schema.build();
 
-      System.out.println(dataFrame.head(10));
+      data = sampler.sample(data, 200);
 
-      TupleTwo<DataFrame, DataFrame> miniFrames = dataFrame.shuffle().split(0.9);
+      TupleTwo<DataFrame, DataFrame> frames = data.shuffle().split(0.9);
 
-      DataFrame trainingData = miniFrames._1();
-      DataFrame crossValidationData = miniFrames._2();
+      DataFrame trainingData = frames._1();
+      System.out.println(trainingData.head(10));
+
+      DataFrame crossValidationData = frames._2();
 
       MLPRegression regression = new MLPRegression();
       regression.setHiddenLayers(8);
@@ -68,7 +85,7 @@ public void testSimple() {
    }
 
    @Test
-   public void test_simple_regression() {
+   public void test_simple_regression_scaled_output() {
       DataQuery.DataFrameQueryBuilder schema = DataQuery.blank()
               .newInput("x1")
               .newInput("x2")
@@ -95,6 +112,7 @@ public void test_simple_regression() {
 
       MLPRegression regression = new MLPRegression();
       regression.setHiddenLayers(8);
+      regression.setOutputNormalization(new RangeScaler());
       regression.setEpoches(1000);
       regression.fit(trainingData);
 
@@ -135,6 +153,7 @@ public void test_simple_regression_weight_constraint() {
 
       MLPRegression regression = new MLPRegression();
       regression.setHiddenLayers(8);
+      regression.setOutputNormalization(new RangeScaler());
       regression.setEpoches(1000);
       regression.setWeightConstraint(80);
       regression.fit(trainingData);
@@ -218,6 +237,7 @@ public void test_simple_regression_mini_batch_gradient_descend() {
       MLPRegression regression = new MLPRegression();
       regression.setWeightUpdateMode(WeightUpdateMode.MiniBatchGradientDescend);
       regression.setMiniBatchSize(20);
+      regression.setOutputNormalization(new RangeScaler());
       regression.setHiddenLayers(8);
       regression.setEpoches(1000);
       regression.fit(trainingData);
@@ -261,6 +281,7 @@ public void test_simple_regression_mini_batch_gradient_descend_L2_regularization
       regression.setWeightUpdateMode(WeightUpdateMode.MiniBatchGradientDescend);
       regression.setMiniBatchSize(20);
       regression.setHiddenLayers(8);
+      regression.setOutputNormalization(new RangeScaler());
       regression.setL2Penalty(0.001);
       regression.setEpoches(1000);
       regression.fit(trainingData);
@@ -305,6 +326,7 @@ public void test_simple_regression_mini_batch_gradient_descend_adaptive_learning
       regression.enabledAdaptiveLearningRate(true);
       regression.setMiniBatchSize(20);
       regression.setHiddenLayers(8);
+      regression.setOutputNormalization(new RangeScaler());
       regression.setEpoches(1000);
       regression.fit(trainingData);