In [0]:
data = [
    ("Alice", 30, "Full-time", "Female", 60000),
    ("Bob", 25, "Part-time", "Male", 30000),
    ("Charlie", 35, "Contract", "Male", 70000)
]

# Create DataFrame
columns = ["name", "age", "emp_type", "gender", "salary"]
df = spark.createDataFrame(data, columns)

In [0]:
df.show()

+-------+---+---------+------+------+
|   name|age| emp_type|gender|salary|
+-------+---+---------+------+------+
|  Alice| 30|Full-time|Female| 60000|
|    Bob| 25|Part-time|  Male| 30000|
|Charlie| 35| Contract|  Male| 70000|
+-------+---+---------+------+------+



In [0]:
%fs
ls FileStore/tables/

path,name,size,modificationTime
dbfs:/FileStore/tables/bad_record_data/,bad_record_data/,0,0
dbfs:/FileStore/tables/bad_records_data/,bad_records_data/,0,0
dbfs:/FileStore/tables/corrupted_data-1.csv,corrupted_data-1.csv,556,1720882253000
dbfs:/FileStore/tables/corrupted_data.csv,corrupted_data.csv,551,1720881464000
dbfs:/FileStore/tables/corrupted_extraOrMissing_comma.json,corrupted_extraOrMissing_comma.json,905,1720957350000
dbfs:/FileStore/tables/flight_data_hive.csv,flight_data_hive.csv,7286,1720872140000


In [0]:
df.write.csv(path = r"/FileStore/tables/my_saved_file.csv", header = True, mode = "overwrite")

In [0]:
%fs
ls FileStore/tables/

path,name,size,modificationTime
dbfs:/FileStore/tables/_SUCCESS,_SUCCESS,0,1721026988000
dbfs:/FileStore/tables/_committed_6631259619680670224,_committed_6631259619680670224,737,1721026987000
dbfs:/FileStore/tables/_committed_7263832663890301440,_committed_7263832663890301440,479,1721026660000
dbfs:/FileStore/tables/_started_6631259619680670224,_started_6631259619680670224,0,1721026986000
dbfs:/FileStore/tables/_started_7263832663890301440,_started_7263832663890301440,0,1721026659000
dbfs:/FileStore/tables/bad_record_data/,bad_record_data/,0,0
dbfs:/FileStore/tables/bad_records_data/,bad_records_data/,0,0
dbfs:/FileStore/tables/my_saved_file.csv/,my_saved_file.csv/,0,0
dbfs:/FileStore/tables/part-00000-tid-6631259619680670224-44fe7390-efd7-47e9-ba4d-f9e4bebe7752-16-1-c000.csv,part-00000-tid-6631259619680670224-44fe7390-efd7-47e9-ba4d-f9e4bebe7752-16-1-c000.csv,32,1721026987000
dbfs:/FileStore/tables/part-00002-tid-6631259619680670224-44fe7390-efd7-47e9-ba4d-f9e4bebe7752-18-1-c000.csv,part-00002-tid-6631259619680670224-44fe7390-efd7-47e9-ba4d-f9e4bebe7752-18-1-c000.csv,64,1721026987000


In [0]:
df = spark.read.csv(path = r"/FileStore/tables/my_saved_file.csv",header = True, inferSchema = True)

In [0]:
df.show()

+-------+---+---------+------+------+
|   name|age| emp_type|gender|salary|
+-------+---+---------+------+------+
|  Alice| 30|Full-time|Female| 60000|
|Charlie| 35| Contract|  Male| 70000|
|    Bob| 25|Part-time|  Male| 30000|
+-------+---+---------+------+------+



#### Working with append Mode

In [0]:
df.write.csv(path = r"/FileStore/tables/my_saved_file.csv", header = True, mode = "append")

In [0]:
df = spark.read.csv(path = r"/FileStore/tables/my_saved_file.csv",header = True, inferSchema = True)
df.show()

+-------+---+---------+------+------+
|   name|age| emp_type|gender|salary|
+-------+---+---------+------+------+
|  Alice| 30|Full-time|Female| 60000|
|  Alice| 30|Full-time|Female| 60000|
|Charlie| 35| Contract|  Male| 70000|
|Charlie| 35| Contract|  Male| 70000|
|    Bob| 25|Part-time|  Male| 30000|
|    Bob| 25|Part-time|  Male| 30000|
+-------+---+---------+------+------+



#### Working with mode : errorIfExist

In [0]:
df.write.csv(path = r"/FileStore/tables/my_saved_file.csv", header = True, mode = "errorifexists")

[0;31m---------------------------------------------------------------------------[0m
[0;31mAnalysisException[0m                         Traceback (most recent call last)
File [0;32m<command-2578010127403162>:1[0m
[0;32m----> 1[0m [43mdf[49m[38;5;241;43m.[39;49m[43mwrite[49m[38;5;241;43m.[39;49m[43mcsv[49m[43m([49m[43mpath[49m[43m [49m[38;5;241;43m=[39;49m[43m [49m[38;5;124;43mr[39;49m[38;5;124;43m"[39;49m[38;5;124;43m/FileStore/tables/my_saved_file.csv[39;49m[38;5;124;43m"[39;49m[43m,[49m[43m [49m[43mheader[49m[43m [49m[38;5;241;43m=[39;49m[43m [49m[38;5;28;43;01mTrue[39;49;00m[43m,[49m[43m [49m[43mmode[49m[43m [49m[38;5;241;43m=[39;49m[43m [49m[38;5;124;43m"[39;49m[38;5;124;43merrorIfExist[39;49m[38;5;124;43m"[39;49m[43m)[49m

File [0;32m/databricks/spark/python/pyspark/instrumentation_utils.py:48[0m, in [0;36m_wrap_function.<locals>.wrapper[0;34m(*args, **kwargs)[0m
[1;32m     46[0m start [38;5;241m=[39m t

#### Working with mode : ignore

In [0]:
df.write.csv(path = "/FileStore/tables/mysaved_file.cdv",
             header = True, 
             mode = "ignore")

In [0]:
df = spark.read.csv(path = "/FileStore/tables/my_saved_file.csv",
                    header = True,
                    inferSchema = True)
df.show()

+-------+---+---------+------+------+
|   name|age| emp_type|gender|salary|
+-------+---+---------+------+------+
|  Alice| 30|Full-time|Female| 60000|
|  Alice| 30|Full-time|Female| 60000|
|Charlie| 35| Contract|  Male| 70000|
|Charlie| 35| Contract|  Male| 70000|
|    Bob| 25|Part-time|  Male| 30000|
|    Bob| 25|Part-time|  Male| 30000|
+-------+---+---------+------+------+

