신은섭(Shin Eun Seop)

Add Utill class to load and save CSV
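
The two helpers are meant to be called statically from the driver code. A minimal usage sketch follows; the driver class name and the SparkSession setup are illustrative assumptions, only the Utill calls and the sample paths come from this change:

import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SparkSession;

// Hypothetical driver, not part of this commit.
public class UtillUsage {
    public static void main(String[] args) {
        // Local SparkSession for the sketch (an assumption; the real jobs set up Spark themselves).
        SparkSession spark = SparkSession.builder()
                .master("local[*]")
                .appName("Cesco")
                .getOrCreate();

        // Load the sample CSV with a header row and an inferred schema.
        Dataset<Row> dataset = Utill.loadCSVDataSet("./train_sample.csv", spark);

        // ... aggregation steps would go here ...

        // Write the result back out as a single CSV part file under ./agg_data.
        Utill.saveCSVDataSet(dataset, "./agg_data");

        spark.stop();
    }
}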

@@ -22,7 +22,7 @@ public class Aggregation {
// Aggregation
Aggregation agg = new Aggregation();
Dataset<Row> dataset = agg.loadCSVDataSet("./train_sample.csv", spark);
Dataset<Row> dataset = Utill.loadCSVDataSet("./train_sample.csv", spark);
dataset = agg.changeTimestempToLong(dataset);
dataset = agg.averageValidClickCount(dataset);
dataset = agg.clickTimeDelta(dataset);
@@ -31,16 +31,7 @@ public class Aggregation {
//test
dataset.where("ip == '5348' and app == '19'").show(10);
agg.saveCSVDataSet(dataset, "./agg_data");
}
private Dataset<Row> loadCSVDataSet(String path, SparkSession spark){
// Read CSV into a Dataset
return spark.read().format("csv")
.option("inferSchema", "true")
.option("header", "true")
.load(path);
Utill.saveCSVDataSet(dataset, "./agg_data");
}
private Dataset<Row> changeTimestempToLong(Dataset<Row> dataset){
@@ -87,12 +78,4 @@ public class Aggregation {
return newDF;
}
private void saveCSVDataSet(Dataset<Row> dataset, String path){
// Write the Dataset out as CSV
dataset.repartition(1)
.write().format("csv")
.option("inferSchema", "true")
.option("header", "true")
.save(path);
}
}
......
@@ -24,14 +24,15 @@ import java.util.*;
public class MapExample {
static SparkConf conf = new SparkConf().setMaster("local[*]").setAppName("Cesco");
static JavaSparkContext sc = new JavaSparkContext(conf);
static SQLContext sqlContext = new SQLContext(sc);
public static void main(String[] args) throws Exception {
// Automatically identify categorical features, and index them.
// Set maxCategories so features with > 4 distinct values are treated as continuous.
Aggregation agg = new Aggregation();
agg.
Dataset<Row> resultds = sqlContext.createDataFrame(result);
System.out.println("schema start");
......
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SparkSession;
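/**
 * Static CSV helpers shared by the Spark jobs: loadCSVDataSet reads a CSV file
 * into a Dataset<Row> (header row, inferred schema) and saveCSVDataSet writes a
 * Dataset<Row> back out as a single CSV file.
 */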
public class Utill {
public static Dataset<Row> loadCSVDataSet(String path, SparkSession spark){
// Read a CSV file into a Dataset<Row>, using the first row as the header and inferring the schema
return spark.read().format("csv")
.option("inferSchema", "true")
.option("header", "true")
.load(path);
}
public static void saveCSVDataSet(Dataset<Row> dataset, String path){
// Write the Dataset out as CSV; repartition(1) collapses it to a single partition so one part file is produced
dataset.repartition(1)
.write().format("csv")
.option("inferSchema", "true")
.option("header", "true")
.save(path);
}
}