# Deal or No Deal
**Results interpretation and visualization**

In [7]:
import pyspark.sql.functions as F
from pyspark.sql import SparkSession

# Create the Spark session used by every cell below, or reuse the one
# that is already active in this kernel (getOrCreate).
# NOTE(review): the app name and the "spark.some.config.option" entry look
# like placeholder values from a quick-start example — confirm whether they
# are intentional.
spark = (
    SparkSession.builder
    .appName("Python Spark SQL basic example")
    .config("spark.some.config.option", "some-value")
    .getOrCreate()
)


In [8]:
# Load the two result sets from their parquet files into Spark DataFrames.
# Both paths are relative, so they resolve against the session's default
# filesystem / working directory.

sdf_trial_highest_results = (
    spark.read
    .format("parquet")
    .load("trial_highest_results.parquet")
)
sdf_trial_results = (
    spark.read
    .format("parquet")
    .load("trial_results.parquet")
)

In [9]:
# Collapse the highest-results frame into a single row of descriptive
# statistics: the modal 'highest_round' plus max / min / mean / median of
# 'offer'.

# Rows whose highest_round equals 0 are dropped before aggregating.
# NOTE(review): presumably round 0 marks trials without a usable offer —
# confirm against the code that produced the parquet file.
nonzero_round_rows = sdf_trial_highest_results.where(F.col('highest_round') != 0)

# One aggregate expression per output column, in display order.
summary_exprs = [
    F.mode('highest_round').alias('most_frequent_highest_round'),
    F.max('offer').alias('highest_offer'),
    F.min('offer').alias('lowest_offer'),
    F.mean('offer').alias('average_offer'),
    F.median('offer').alias('median_offer'),
]

sdf_trial_highest_results_agg = nonzero_round_rows.agg(*summary_exprs)
sdf_trial_highest_results_agg.show()

+---------------------------+-------------+------------+------------------+------------+
|most_frequent_highest_round|highest_offer|lowest_offer|     average_offer|median_offer|
+---------------------------+-------------+------------+------------------+------------+
|                          5|    1000000.0|        0.01|227577.70843222225|  230958.155|
+---------------------------+-------------+------------+------------------+------------+

