Skip to content

Commit

Permalink
Create DataAnalyzer.py
Browse files Browse the repository at this point in the history
  • Loading branch information
KOSASIH authored Jul 25, 2024
1 parent 042452c commit 5ae26d7
Showing 1 changed file with 26 additions and 0 deletions.
26 changes: 26 additions & 0 deletions sidra_chain_integration/project/sidra_nexus/src/DataAnalyzer.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
package com.sidra.nexus;

import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SparkSession;

/**
 * Small helper that loads a CSV file through Spark SQL and prints a
 * per-value row count for one column.
 *
 * <p>The instance owns a {@link SparkSession}; call {@link #close()} (or use
 * try-with-resources) when finished so the underlying Spark context is
 * stopped.
 */
public class DataAnalyzer implements AutoCloseable {
    /** Master URL used only when none has been configured externally. */
    private static final String DEFAULT_MASTER = "local[2]";

    /** Column grouped on by {@link #analyzeData(String)}. */
    private static final String DEFAULT_GROUP_COLUMN = "column1";

    private final SparkSession sparkSession;

    /**
     * Creates the analyzer and obtains a Spark session named "Data Analyzer".
     *
     * <p>The session is obtained through the public builder API rather than
     * the SparkSession constructor, which is internal to Spark. The master
     * defaults to {@code local[2]} but is left alone if {@code spark.master}
     * was already supplied (e.g. by spark-submit or a system property).
     */
    public DataAnalyzer() {
        SparkConf conf = new SparkConf()
                .setAppName("Data Analyzer")
                .setIfMissing("spark.master", DEFAULT_MASTER);
        // getOrCreate() reuses an active session if one exists instead of
        // failing on a second SparkContext in the same JVM.
        sparkSession = SparkSession.builder().config(conf).getOrCreate();
    }

    /**
     * Loads the CSV at {@code filePath} (first line treated as a header) and
     * prints the row count per distinct value of {@code column1}.
     *
     * @param filePath path or URI of the CSV file to read
     * @throws IllegalArgumentException if {@code filePath} is null or empty
     */
    public void analyzeData(String filePath) {
        analyzeData(filePath, DEFAULT_GROUP_COLUMN);
    }

    /**
     * Loads the CSV at {@code filePath} (first line treated as a header) and
     * prints the row count per distinct value of {@code groupColumn}.
     *
     * @param filePath    path or URI of the CSV file to read
     * @param groupColumn name of the header column to group by
     * @throws IllegalArgumentException if either argument is null or empty
     */
    public void analyzeData(String filePath, String groupColumn) {
        if (filePath == null || filePath.isEmpty()) {
            throw new IllegalArgumentException("filePath must not be null or empty");
        }
        if (groupColumn == null || groupColumn.isEmpty()) {
            throw new IllegalArgumentException("groupColumn must not be null or empty");
        }

        // Load data from a file
        Dataset<Row> data = sparkSession.read()
                .format("csv")
                .option("header", "true")
                .load(filePath);

        // Perform data analysis
        data.groupBy(groupColumn).count().show();
    }

    /**
     * Stops the Spark session held by this analyzer.
     *
     * <p>NOTE: if the session was shared (reused via {@code getOrCreate()}),
     * this stops it for the other users as well.
     */
    @Override
    public void close() {
        sparkSession.stop();
    }
}

0 comments on commit 5ae26d7

Please sign in to comment.