0001
0002
0003
0004
0005
0006
0007
0008
0009
0010
0011
0012
0013
0014
0015
0016
0017
0018 package org.apache.spark.examples.ml;
0019
0020 import org.apache.spark.sql.SparkSession;
0021
0022
0023 import org.apache.spark.ml.feature.RobustScaler;
0024 import org.apache.spark.ml.feature.RobustScalerModel;
0025 import org.apache.spark.sql.Dataset;
0026 import org.apache.spark.sql.Row;
0027
0028
0029 public class JavaRobustScalerExample {
0030 public static void main(String[] args) {
0031 SparkSession spark = SparkSession
0032 .builder()
0033 .appName("JavaRobustScalerExample")
0034 .getOrCreate();
0035
0036
0037 Dataset<Row> dataFrame =
0038 spark.read().format("libsvm").load("data/mllib/sample_libsvm_data.txt");
0039
0040 RobustScaler scaler = new RobustScaler()
0041 .setInputCol("features")
0042 .setOutputCol("scaledFeatures")
0043 .setWithScaling(true)
0044 .setWithCentering(false)
0045 .setLower(0.25)
0046 .setUpper(0.75);
0047
0048
0049 RobustScalerModel scalerModel = scaler.fit(dataFrame);
0050
0051
0052 Dataset<Row> scaledData = scalerModel.transform(dataFrame);
0053 scaledData.show();
0054
0055 spark.stop();
0056 }
0057 }