In [None]:
# Databricks notebook source ## test#

import pandas as pd
from pyspark.sql import SparkSession

# Reuse the active SparkSession when one exists (as on Databricks); otherwise
# create one so the script also runs locally or in non-Databricks environments.
spark = SparkSession.builder.appName("Orders Ingest").getOrCreate()

# Absolute workspace path of the input CSV file.
input_csv_path = "/Workspace/Shared/data/orders.csv"

# Unity Catalog catalog and schema that will hold the ingested table.
# Change these two values to target a different catalog or schema.
catalog_name = "main_catalog"
schema_name = "bronze_orders_schema"


def _quote_identifier(name):
    """Return *name* as a backtick-delimited Spark SQL identifier.

    Embedded backticks are doubled, so names containing hyphens, spaces, dots
    or reserved words are passed to Spark as a single identifier instead of
    breaking (or altering) the statement they are interpolated into.
    """
    return "`" + name.replace("`", "``") + "`"


quoted_catalog = _quote_identifier(catalog_name)
quoted_schema = _quote_identifier(schema_name)

# Create the catalog and schema if they don't exist, and make them the
# session's current catalog/schema.
spark.sql(f"CREATE CATALOG IF NOT EXISTS {quoted_catalog}")
spark.sql(f"USE CATALOG {quoted_catalog}")
spark.sql(f"CREATE SCHEMA IF NOT EXISTS {quoted_schema}")
spark.sql(f"USE SCHEMA {quoted_schema}")

# Human-readable three-level table name (used for reporting below).
output_table_name = f"{catalog_name}.{schema_name}.orders_raw"

# Same table, with each name part delimited so it is safe to hand to Spark.
quoted_table_name = f"{quoted_catalog}.{quoted_schema}.{_quote_identifier('orders_raw')}"

# Read the CSV file using pandas.
# NOTE(review): pandas loads the whole file on the driver and infers column
# dtypes while parsing; confirm both are acceptable for a raw/bronze table.
pdf = pd.read_csv(input_csv_path)

# Convert pandas DataFrame to Spark DataFrame
df = spark.createDataFrame(pdf)

# Write the data to a Unity Catalog Delta table, replacing any existing
# contents of the table ("overwrite" mode).
# Ensure you have appropriate permissions to write to the specified catalog and schema.
df.write.format("delta").mode("overwrite").saveAsTable(quoted_table_name)

print(f"Successfully ingested orders data to Unity Catalog table: {output_table_name}")
