-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathapplication_main.py
More file actions
34 lines (20 loc) · 826 Bytes
/
application_main.py
File metadata and controls
34 lines (20 loc) · 826 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
import sys
from lib import DataManipulation, DataReader, Utils
from pyspark.sql.functions import *
from lib.logger import Log4j
if __name__ == '__main__':
if len(sys.argv) < 2:
print("Please specify the environment")
sys.exit(-1)
job_run_env = sys.argv[1]
print("Creating Spark Session")
spark = Utils.get_spark_session(job_run_env)
logger = Log4j(spark)
logger.warn("Created Spark Session")
orders_df = DataReader.read_orders(spark,job_run_env)
orders_filtered = DataManipulation.filter_closed_orders(orders_df)
customers_df = DataReader.read_customers(spark,job_run_env)
joined_df =DataManipulation.join_orders_customers(orders_filtered,customers_df)
aggregated_results = DataManipulation.count_orders_state(joined_df)
aggregated_results.show(50)
logger.info("end of main")