In [2]:
from pyspark.sql import SparkSession
from pyspark.sql.functions import col

def main() -> None:
    """Run a minimal PySpark smoke test on a local session.

    Builds a local Spark session with three worker threads, creates a small
    (Name, Age) DataFrame, derives an ``AgePlusFive`` column, and prints both
    DataFrames to stdout.

    The session is always stopped before returning, including when one of the
    DataFrame operations raises; the exception then propagates to the caller.
    """
    # Create a Spark session
    spark = (
        SparkSession.builder
        .appName("PySpark Test")
        .master("local[3]")
        .getOrCreate()
    )

    print("✅ Spark session created successfully.")

    # try/finally so that a failure in any step below does not leave the
    # session running (a leaked session would be picked up again by the next
    # getOrCreate() call in the same process).
    try:
        # Sample data
        data = [("Alice", 25), ("Bob", 30), ("Charlie", 35)]
        columns = ["Name", "Age"]

        # Create DataFrame
        df = spark.createDataFrame(data, columns)
        print("✅ DataFrame created.")
        df.show()

        # Add 5 years to age
        df_transformed = df.withColumn("AgePlusFive", col("Age") + 5)
        print("✅ Transformed DataFrame:")
        df_transformed.show()
    finally:
        # Stop Spark session
        spark.stop()
        print("✅ Spark session stopped.")

# Run the smoke test only when this file is executed as a script (or as a
# notebook cell, where __name__ is also "__main__"), not when it is imported.
if __name__ == "__main__":
    main()


✅ Spark session created successfully.
✅ DataFrame created.
+-------+---+
|   Name|Age|
+-------+---+
|  Alice| 25|
|    Bob| 30|
|Charlie| 35|
+-------+---+

✅ Transformed DataFrame:
+-------+---+-----------+
|   Name|Age|AgePlusFive|
+-------+---+-----------+
|  Alice| 25|         30|
|    Bob| 30|         35|
|Charlie| 35|         40|
+-------+---+-----------+

✅ Spark session stopped.
