In [None]:
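The `split()` function in PySpark splits a column of strings into an array of substrings around matches of a delimiter pattern. The pattern is interpreted as a Java regular expression, so delimiters such as `.` or `|` must be escaped.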

In [1]:
from pyspark.sql import SparkSession
from pyspark.sql.functions import split

# Start (or reuse) a Spark session in local mode with one worker thread
session_builder = SparkSession.builder.master("local[1]").appName('SparkByExamples.com')
spark = session_builder.getOrCreate()

# Sample rows: one full name per record
data = [("John Doe",), ("Alice Johnson",), ("Bob Smith",)]
df = spark.createDataFrame(data, ["full_name"])

# Tokenise full_name on a single space once, then pick out each piece:
# element 0 becomes first_name, element 1 becomes last_name
name_parts = split(df["full_name"], " ")
df = (
    df.withColumn("first_name", name_parts.getItem(0))
      .withColumn("last_name", name_parts.getItem(1))
)

# Display the resulting DataFrame
df.show()

+-------------+----------+---------+
|    full_name|first_name|last_name|
+-------------+----------+---------+
|     John Doe|      John|      Doe|
|Alice Johnson|     Alice|  Johnson|
|    Bob Smith|       Bob|    Smith|
+-------------+----------+---------+



In [2]:
# Splitting a comma-delimited column into an array (exploded into rows in the next cell)
from pyspark.sql.functions import explode

# Sample rows: each record holds one comma-separated string
data = [("apple,banana,grape",), ("car,bike,truck",)]
df = spark.createDataFrame(data, ["items"])

# Break the string apart at every comma, producing an array column
items_array = split(df["items"], ",")
df = df.withColumn("items_array", items_array)

# Print the DataFrame without truncating cell contents
df.show(truncate=False)

+------------------+----------------------+
|items             |items_array           |
+------------------+----------------------+
|apple,banana,grape|[apple, banana, grape]|
|car,bike,truck    |[car, bike, truck]    |
+------------------+----------------------+



In [3]:
# Emit one output row per element of items_array; the element lands in "item"
exploded_item = explode(df["items_array"])
df_exploded = df.withColumn("item", exploded_item)

# Default show() truncates long cell values in the printed table
df_exploded.show()

+------------------+--------------------+------+
|             items|         items_array|  item|
+------------------+--------------------+------+
|apple,banana,grape|[apple, banana, g...| apple|
|apple,banana,grape|[apple, banana, g...|banana|
|apple,banana,grape|[apple, banana, g...| grape|
|    car,bike,truck|  [car, bike, truck]|   car|
|    car,bike,truck|  [car, bike, truck]|  bike|
|    car,bike,truck|  [car, bike, truck]| truck|
+------------------+--------------------+------+

