-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathapplication_main.py
More file actions
30 lines (18 loc) · 824 Bytes
/
application_main.py
File metadata and controls
30 lines (18 loc) · 824 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import sys
from lib import DataManipulation, DataReader, Utils
from pyspark.sql.functions import *
if __name__=='__main__' :
if len(sys.argv)<2:
print("Pleasespecifytheenvironment")
sys.exit(-1)
job_run_env = sys.argv[1]
print("Creating SparkSession")
spark = Utils.get_spark_session(job_run_env)
print("Created SparkSession")
orders_df = DataReader.read_orders(spark, job_run_env)
orders_filtered = DataManipulation.filter_closed_orders(orders_df)
customers_df = DataReader.read_customers(spark, job_run_env)
joined_df = DataManipulation.join_orders_customers(orders_filtered, customers_df)
aggregated_results = DataManipulation.count_orders_state(joined_df)
aggregated_results.show()
print("end of main")