Skip to content

Commit 2ed613a

Browse files
committed
change libsvm read format
1 parent 9ba1d4a commit 2ed613a

12 files changed

+12
-20
lines changed

examples/src/main/java/org/apache/spark/examples/ml/JavaGradientBoostedTreeClassifierExample.java

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -42,8 +42,7 @@ public static void main(String[] args) {
4242

4343
// $example on$
4444
// Load and parse the data file, converting it to a DataFrame.
45-
RDD<LabeledPoint> rdd = MLUtils.loadLibSVMFile(jsc.sc(), "data/mllib/sample_libsvm_data.txt");
46-
DataFrame data = sqlContext.createDataFrame(rdd, LabeledPoint.class);
45+
DataFrame data = sqlContext.read().format("libsvm").load("data/mllib/sample_libsvm_data.txt");
4746

4847
// Index labels, adding metadata to the label column.
4948
// Fit on whole dataset to include all labels in index.

examples/src/main/java/org/apache/spark/examples/ml/JavaGradientBoostedTreeRegressorExample.java

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -43,8 +43,7 @@ public static void main(String[] args) {
4343

4444
// $example on$
4545
// Load and parse the data file, converting it to a DataFrame.
46-
RDD<LabeledPoint> rdd = MLUtils.loadLibSVMFile(jsc.sc(), "data/mllib/sample_libsvm_data.txt");
47-
DataFrame data = sqlContext.createDataFrame(rdd, LabeledPoint.class);
46+
DataFrame data = sqlContext.read().format("libsvm").load("data/mllib/sample_libsvm_data.txt");
4847

4948
// Automatically identify categorical features, and index them.
5049
// Set maxCategories so features with > 4 distinct values are treated as continuous.

examples/src/main/java/org/apache/spark/examples/ml/JavaRandomForestClassifierExample.java

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -42,8 +42,7 @@ public static void main(String[] args) {
4242

4343
// $example on$
4444
// Load and parse the data file, converting it to a DataFrame.
45-
RDD<LabeledPoint> rdd = MLUtils.loadLibSVMFile(jsc.sc(), "data/mllib/sample_libsvm_data.txt");
46-
DataFrame data = sqlContext.createDataFrame(rdd, LabeledPoint.class);
45+
DataFrame data = sqlContext.read().format("libsvm").load("data/mllib/sample_libsvm_data.txt");
4746

4847
// Index labels, adding metadata to the label column.
4948
// Fit on whole dataset to include all labels in index.

examples/src/main/java/org/apache/spark/examples/ml/JavaRandomForestRegressorExample.java

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -43,8 +43,7 @@ public static void main(String[] args) {
4343

4444
// $example on$
4545
// Load and parse the data file, converting it to a DataFrame.
46-
RDD<LabeledPoint> rdd = MLUtils.loadLibSVMFile(jsc.sc(), "data/mllib/sample_libsvm_data.txt");
47-
DataFrame data = sqlContext.createDataFrame(rdd, LabeledPoint.class);
46+
DataFrame data = sqlContext.read().format("libsvm").load("data/mllib/sample_libsvm_data.txt");
4847

4948
// Automatically identify categorical features, and index them.
5049
// Set maxCategories so features with > 4 distinct values are treated as continuous.

examples/src/main/python/ml/gradient_boosted_tree_classifier_example.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@
3737

3838
# $example on$
3939
# Load and parse the data file, converting it to a DataFrame.
40-
data = MLUtils.loadLibSVMFile(sc, "data/mllib/sample_libsvm_data.txt").toDF()
40+
data = sqlContext.read.format("libsvm").load("data/mllib/sample_libsvm_data.txt")
4141

4242
# Index labels, adding metadata to the label column.
4343
# Fit on whole dataset to include all labels in index.

examples/src/main/python/ml/gradient_boosted_tree_regressor_example.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@
3737

3838
# $example on$
3939
# Load and parse the data file, converting it to a DataFrame.
40-
data = MLUtils.loadLibSVMFile(sc, "data/mllib/sample_libsvm_data.txt").toDF()
40+
data = sqlContext.read.format("libsvm").load("data/mllib/sample_libsvm_data.txt")
4141

4242
# Automatically identify categorical features, and index them.
4343
# Set maxCategories so features with > 4 distinct values are treated as continuous.

examples/src/main/python/ml/random_forest_classifier_example.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@
3737

3838
# $example on$
3939
# Load and parse the data file, converting it to a DataFrame.
40-
data = MLUtils.loadLibSVMFile(sc, "data/mllib/sample_libsvm_data.txt").toDF()
40+
data = sqlContext.read.format("libsvm").load("data/mllib/sample_libsvm_data.txt")
4141

4242
# Index labels, adding metadata to the label column.
4343
# Fit on whole dataset to include all labels in index.

examples/src/main/python/ml/random_forest_regressor_example.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@
3737

3838
# $example on$
3939
# Load and parse the data file, converting it to a DataFrame.
40-
data = MLUtils.loadLibSVMFile(sc, "data/mllib/sample_libsvm_data.txt").toDF()
40+
data = sqlContext.read.format("libsvm").load("data/mllib/sample_libsvm_data.txt")
4141

4242
# Automatically identify categorical features, and index them.
4343
# Set maxCategories so features with > 4 distinct values are treated as continuous.

examples/src/main/scala/org/apache/spark/examples/ml/GradientBoostedTreeClassifierExample.scala

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -33,11 +33,10 @@ object GradientBoostedTreeClassifierExample {
3333
val conf = new SparkConf().setAppName("GradientBoostedTreeClassifierExample")
3434
val sc = new SparkContext(conf)
3535
val sqlContext = new SQLContext(sc)
36-
import sqlContext.implicits._
3736

3837
// $example on$
3938
// Load and parse the data file, converting it to a DataFrame.
40-
val data = MLUtils.loadLibSVMFile(sc, "data/mllib/sample_libsvm_data.txt").toDF()
39+
val data = sqlContext.read.format("libsvm").load("data/mllib/sample_libsvm_data.txt")
4140

4241
// Index labels, adding metadata to the label column.
4342
// Fit on whole dataset to include all labels in index.

examples/src/main/scala/org/apache/spark/examples/ml/GradientBoostedTreeRegressorExample.scala

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -33,11 +33,10 @@ object GradientBoostedTreeRegressorExample {
3333
val conf = new SparkConf().setAppName("GradientBoostedTreeRegressorExample")
3434
val sc = new SparkContext(conf)
3535
val sqlContext = new SQLContext(sc)
36-
import sqlContext.implicits._
3736

3837
// $example on$
3938
// Load and parse the data file, converting it to a DataFrame.
40-
val data = MLUtils.loadLibSVMFile(sc, "data/mllib/sample_libsvm_data.txt").toDF()
39+
val data = sqlContext.read.format("libsvm").load("data/mllib/sample_libsvm_data.txt")
4140

4241
// Automatically identify categorical features, and index them.
4342
// Set maxCategories so features with > 4 distinct values are treated as continuous.

0 commit comments

Comments
 (0)