In [0]:
# ============================================
# SETUP: Set Working Catalog and Schema
# ============================================

# Point the session at the dev catalog first, then at its bronze schema
# (the layer used for raw ingested data). The catalog is switched before
# the schema so the schema name resolves inside that catalog.
for context_stmt in ("USE CATALOG smart_claims_dev", "USE SCHEMA bronze"):
    spark.sql(context_stmt)

# Echo the resulting session context so a wrong target is visible
# before any later cell reads or writes tables.
active_catalog = spark.catalog.currentCatalog()
active_database = spark.catalog.currentDatabase()
print(f"Current Catalog: {active_catalog}")
print(f"Current Database: {active_database}")


In [0]:
from pyspark.sql import SparkSession

# Location of the claims extract inside the managed Volume
claims_csv_path = "/Volumes/smart_claims_dev/landing/raw_files/sql_server/claims.csv"

# Load the CSV into a DataFrame, treating the first line as column names.
# No schema is supplied and no inference option is set, so the reader's
# default column typing applies.
claims_df = (
    spark.read
    .format("csv")
    .option("header", True)
    .load(claims_csv_path)
)

# Print the first five rows as a quick sanity check
claims_df.show(n=5)


In [0]:
# Peek at the Bronze table as it exists BEFORE this notebook's write step.
# The table is only created further down (saveAsTable), so on a fresh
# schema / first run it does not exist yet; guard the query so that
# "Restart & Run All" does not fail here with a table-not-found error.
if spark.catalog.tableExists("claims_raw"):
    spark.sql("SELECT * FROM claims_raw LIMIT 5").show()
else:
    print("Table claims_raw does not exist yet; it is created by the write step below.")


In [0]:
# ============================================
# WRITE: Save Claims Data to Bronze Delta Table
# ============================================

# Table name. It is unqualified, so it resolves against the session's
# current catalog and schema (smart_claims_dev.bronze once the setup
# cell at the top of the notebook has run).
bronze_table = "claims_raw"

# Write the DataFrame read from the CSV to a Delta table.
# - mode("overwrite") replaces the existing table contents on every run.
# - mergeSchema=true permits the table schema to evolve with the incoming data.
# NOTE(review): if the intent is to fully replace the schema on each reload
# (e.g. dropped/renamed/retyped columns), Delta's "overwriteSchema" option is
# the one designed for that -- confirm which behavior is wanted.
(
    claims_df.write
    .format("delta")
    .mode("overwrite")
    .option("mergeSchema", "true")
    .saveAsTable(bronze_table)
)

# The status emoji was stored as mojibake ("âœ…" = UTF-8 bytes of U+2705
# mis-decoded as cp1252); restored to the intended check mark.
print(f"✅ Successfully created Bronze table: {bronze_table}")


In [0]:
# Read back a handful of rows from the Bronze table to confirm the write
written_preview_df = spark.sql("SELECT * FROM claims_raw LIMIT 5")
written_preview_df.show()