# Medallion Architecture (Bronze → Silver → Gold) for an End-to-End Healthcare AI Pipeline

In [0]:
# Read the source table default.diabetic_data into a Spark DataFrame.
# `df` is the frame the next cell writes out as the Bronze Delta table.
df = spark.table("default.diabetic_data")

# Render the DataFrame in the notebook for a quick visual check.
df.display()


In [0]:
# Persist `df` as the Delta table bronze_patient_readmission.
# - format("delta"): store the table in Delta format.
# - mode("overwrite"): replace whatever the table currently holds.
# The table name carries no schema prefix, so it resolves against the
# session's current schema.
bronze_writer = df.write.format("delta").mode("overwrite")
bronze_writer.saveAsTable("bronze_patient_readmission")


In [0]:
# Total number of rows in bronze_patient_readmission.
bronze_row_count = spark.sql("SELECT COUNT(*) FROM bronze_patient_readmission")
bronze_row_count.display()


In [0]:
# Row count per distinct value of the `readmitted` column.
readmission_counts = spark.sql("SELECT readmitted, COUNT(*) AS patient_count FROM bronze_patient_readmission GROUP BY readmitted")
readmission_counts.display()

In [0]:
# BRONZE INGESTION
# Copy the source table default.diabetic_data into the Delta table
# default.bronze_patient_readmission, replacing its current contents.
# NOTE(review): this appears to repeat the load-and-write done by the earlier
# cells (same source table; same target name apart from the explicit
# `default.` schema) - confirm whether both are needed.
df_raw = spark.table("default.diabetic_data")

(
    df_raw.write
    .format("delta")
    .mode("overwrite")
    .saveAsTable("default.bronze_patient_readmission")
)

In [0]:
# Total number of rows in the schema-qualified Bronze table.
bronze_count_query = """
SELECT COUNT(*) 
FROM default.bronze_patient_readmission
"""
spark.sql(bronze_count_query).display()

In [0]:
%sql
-- List tables; no schema is named, so the session's current schema is used.
SHOW TABLES;

In [0]:
%sql
-- Show table-level metadata for gold_patient_features.
-- NOTE(review): no cell visible before this point creates this table;
-- presumably it is built elsewhere - confirm it exists before running.
DESCRIBE DETAIL gold_patient_features;

In [0]:

%sql
-- Preview up to 10 rows of three columns from gold_patient_features.
-- There is no ORDER BY, so which 10 rows come back is not guaranteed.
SELECT utilization_score,
       treatment_changed,
       readmit_30d
  FROM gold_patient_features
 LIMIT 10;