0001
0002
0003
0004
0005
0006
0007
0008
0009
0010
0011
0012
0013
0014
0015
0016
0017
0018 """
0019 Logistic Regression With LBFGS Example.
0020 """
0021 from __future__ import print_function
0022
0023 from pyspark import SparkContext
0024
0025 from pyspark.mllib.classification import LogisticRegressionWithLBFGS, LogisticRegressionModel
0026 from pyspark.mllib.regression import LabeledPoint
0027
0028
if __name__ == "__main__":
    # Example driver: train a logistic regression model with L-BFGS on a
    # text data set, report its error on the training data, then save the
    # model and load it back.

    sc = SparkContext(appName="PythonLogisticRegressionWithLBFGSExample")

    # Everything that uses the context runs inside try/finally so that the
    # SparkContext is always stopped, even when a step below fails.
    try:
        # Load and parse the data.
        def parsePoint(line):
            """Convert one line of space-separated numbers into a LabeledPoint.

            The first number on the line is passed as the label and the
            remaining numbers as the features.
            """
            # split() with no argument tolerates repeated or trailing
            # whitespace; split(' ') would produce empty strings there,
            # which float() rejects.
            values = [float(x) for x in line.split()]
            return LabeledPoint(values[0], values[1:])

        data = sc.textFile("data/mllib/sample_svm_data.txt")
        # The parsed RDD is consumed by training, by the prediction map and
        # by count() below; cache it so the file is not re-read and
        # re-parsed for each of those passes.
        parsedData = data.map(parsePoint).cache()

        # Build the model.
        model = LogisticRegressionWithLBFGS.train(parsedData)

        # Evaluate the model on the training data: pair each true label with
        # the predicted label and measure the fraction that disagree.
        labelsAndPreds = parsedData.map(lambda p: (p.label, model.predict(p.features)))
        numWrong = labelsAndPreds.filter(lambda lp: lp[0] != lp[1]).count()
        trainErr = numWrong / float(parsedData.count())
        print("Training Error = " + str(trainErr))

        # Save the model and load it back.
        model.save(sc, "target/tmp/pythonLogisticRegressionWithLBFGSModel")
        sameModel = LogisticRegressionModel.load(sc,
                                                 "target/tmp/pythonLogisticRegressionWithLBFGSModel")
    finally:
        sc.stop()
0054