In [0]:
# Load the IPL 2021 match list from DBFS, treating the first CSV row as column names.
df = spark.read.csv(
    "dbfs:/FileStore/tables/ipl_2021_matches.csv",
    header=True,
)

In [0]:
# Print the column names and types, then preview the first five rows
# without shortening long cell values.
df.printSchema()
df.show(n=5, truncate=False)

root
 |-- year: string (nullable = true)
 |-- series_type: string (nullable = true)
 |-- series_name: string (nullable = true)
 |-- match_no: string (nullable = true)
 |-- match_type: string (nullable = true)
 |-- match_name: string (nullable = true)
 |-- match_href: string (nullable = true)
 |-- match_team1: string (nullable = true)
 |-- match_team2: string (nullable = true)
 |-- match_datetime_start: string (nullable = true)
 |-- match_date_end: string (nullable = true)
 |-- match_venue: string (nullable = true)

+----+-----------+--------------------------+--------+----------+--------------------------------------------------------+---------------------------------------------------------------------------------------------+-----------+-----------+--------------------+--------------+-----------+
|year|series_type|series_name               |match_no|match_type|match_name                                              |match_href                                                          

In [0]:
# List the DataFrame's column names in schema order.
df.schema.names


Out[4]: ['year',
 'series_type',
 'series_name',
 'match_no',
 'match_type',
 'match_name',
 'match_href',
 'match_team1',
 'match_team2',
 'match_datetime_start',
 'match_date_end',
 'match_venue']

In [0]:
# Show every distinct match_type value, untruncated.
(
    df
    .select("match_type")
    .distinct()
    .show(truncate=False)
)


+----------+
|match_type|
+----------+
|League    |
+----------+



In [0]:
# Show up to 50 distinct match_name values, untruncated.
(
    df
    .select("match_name")
    .distinct()
    .show(n=50, truncate=False)
)

+----------------------------------------------------------------+
|match_name                                                      |
+----------------------------------------------------------------+
|DELHI CAPITALS vs SUNRISERS HYDERABAD, 33rd Match               |
|ROYAL CHALLENGERS BENGALURU vs CHENNAI SUPER KINGS, 35th Match  |
|SUNRISERS HYDERABAD vs MUMBAI INDIANS, 31st Match               |
|SUNRISERS HYDERABAD vs DELHI CAPITALS, 20th Match               |
|PUNJAB KINGS vs SUNRISERS HYDERABAD, 14th Match                 |
|MUMBAI INDIANS vs PUNJAB KINGS, 42nd Match                      |
|PUNJAB KINGS vs DELHI CAPITALS, 29th Match                      |
|DELHI CAPITALS vs MUMBAI INDIANS, 13th Match                    |
|DELHI CAPITALS vs ROYAL CHALLENGERS BENGALURU, 22nd Match       |
|SUNRISERS HYDERABAD vs ROYAL CHALLENGERS BENGALURU, 6th Match   |
|PUNJAB KINGS vs ROYAL CHALLENGERS BENGALURU, 26th Match         |
|SUNRISERS HYDERABAD vs KOLKATA KNIGHT RIDERS, 3rd Match      

In [0]:
# Collect the distinct (match_type, match_name) pairs that mention a Super Over
# in the match name or a Qualifier in the match type.
#
# Spark SQL's LIKE is case-sensitive, and the match_name values in this dataset
# are largely upper-case, so both columns are lower-cased before matching to
# avoid silently missing rows that differ from the pattern only in letter case.
tie_breakers = (
    df.select("match_type", "match_name")
    .where(
        "lower(match_name) LIKE '%super over%' "
        "OR lower(match_type) LIKE '%qualifier%'"
    )
    .distinct()
)

In [0]:
# Display the filtered rows (default limit of 20), untruncated.
tie_breakers.show(n=20, truncate=False)

+----------+----------+
|match_type|match_name|
+----------+----------+
+----------+----------+



In [0]:
# Persist the DataFrame as a Delta dataset, replacing whatever is already at the path.
df.write.save(
    "/mnt/delta/ipl_2021_matches",
    format="delta",
    mode="overwrite",
)


In [0]:
# Register a table over the Delta files at the given location; a no-op if the table already exists.
spark.sql(
    sqlQuery="CREATE TABLE IF NOT EXISTS ipl_2021_matches USING DELTA LOCATION '/mnt/delta/ipl_2021_matches'"
)

Out[16]: DataFrame[]

In [0]:
# Read the Delta dataset back from its storage path.
delta_df = spark.read.load(
    "/mnt/delta/ipl_2021_matches",
    format="delta",
)

In [0]:
# Preview the reloaded data with the default display settings
# (first 20 rows, long values truncated).
delta_df.show(n=20, truncate=True)

+----+-----------+--------------------+--------+----------+--------------------+--------------------+-----------+-----------+--------------------+--------------+-----------+
|year|series_type|         series_name|match_no|match_type|          match_name|          match_href|match_team1|match_team2|match_datetime_start|match_date_end|match_venue|
+----+-----------+--------------------+--------+----------+--------------------+--------------------+-----------+-----------+--------------------+--------------+-----------+
|2021|        T20|Indian Premier Le...|    null|    League|MUMBAI INDIANS vs...|https://www.cricb...|       null|       null|                null|          null|       null|
|2021|        T20|Indian Premier Le...|    null|    League|CHENNAI SUPER KIN...|https://www.cricb...|       null|       null|                null|          null|       null|
|2021|        T20|Indian Premier Le...|    null|    League|SUNRISERS HYDERAB...|https://www.cricb...|       null|       null|     