### Load `crm_cust_info` table to bronze

In [0]:
%run ./config

In [0]:
%sql
-- Bronze load for the CRM customer file: rebuild etl.bronze.crm_cust_info from
-- scratch and ingest the landing CSV as-is. Every column is declared STRING, so
-- no casting or cleansing happens in this cell.

-- Remove any previous copy of the table before it is recreated.
-- NOTE(review): presumably this also resets COPY INTO's record of already
-- loaded files so the CSV is ingested again on every run - confirm before
-- removing the DROP in favour of CREATE OR REPLACE alone.
DROP TABLE IF EXISTS etl.bronze.crm_cust_info;

CREATE OR REPLACE TABLE etl.bronze.crm_cust_info(
  cst_id STRING,
  cst_key STRING,
  cst_firstname STRING,
  cst_lastname STRING,
  cst_marital_status STRING,
  cst_gndr STRING,
  cst_create_date STRING
);

-- String literals are single-quoted so they remain literals even if the
-- session treats double-quoted text as identifiers.
-- 'header' = 'true': the first line of the file is read as the header row.
COPY INTO etl.bronze.crm_cust_info
FROM 'abfss://landing@storagee2eproject.dfs.core.windows.net/crm/cust_info.csv'
FILEFORMAT = CSV
FORMAT_OPTIONS ('header' = 'true');

num_affected_rows,num_inserted_rows,num_skipped_corrupt_files
18494,18494,0


### Azure Data Lake Connection Setup

#### Description
This notebook sets up Spark configurations to securely connect Databricks with an Azure Data Lake Storage (ADLS) account.
It establishes the necessary credentials and Spark settings required for reading from and writing to the storage account.

#### Key Actions
- Sets up Spark configuration parameters (e.g., account keys or service principal credentials).
- Enables access to containers and folders within the Azure Data Lake.

#### Usage
1. Update the configuration section with the appropriate storage account name, container name, and credentials.
2. Run this notebook before executing any data pipelines or notebooks that interact with Azure Data Lake.
3. This configuration remains active for the duration of the current Spark session.

### Load `crm_prd_info` table to bronze

In [0]:
%sql
-- Bronze load for the CRM product file: rebuild etl.bronze.crm_prd_info from
-- scratch and ingest the landing CSV as-is. Every column is declared STRING, so
-- costs and dates are stored as raw text in this layer.

-- Remove any previous copy of the table before it is recreated.
-- NOTE(review): presumably this also resets COPY INTO's record of already
-- loaded files so the CSV is ingested again on every run - confirm before
-- removing the DROP in favour of CREATE OR REPLACE alone.
DROP TABLE IF EXISTS etl.bronze.crm_prd_info;

CREATE OR REPLACE TABLE etl.bronze.crm_prd_info(
  prd_id STRING,
  prd_key STRING,
  prd_nm STRING,
  prd_cost STRING,
  prd_line STRING,
  prd_start_dt STRING,
  prd_end_dt STRING
);

-- String literals are single-quoted so they remain literals even if the
-- session treats double-quoted text as identifiers.
-- 'header' = 'true': the first line of the file is read as the header row.
COPY INTO etl.bronze.crm_prd_info
FROM 'abfss://landing@storagee2eproject.dfs.core.windows.net/crm/prd_info.csv'
FILEFORMAT = CSV
FORMAT_OPTIONS ('header' = 'true');

num_affected_rows,num_inserted_rows,num_skipped_corrupt_files
397,397,0


### Load `crm_sales_details` table to bronze

In [0]:
%sql
-- Bronze load for the CRM sales file: rebuild etl.bronze.crm_sales_details
-- from scratch and ingest the landing CSV as-is. Every column is declared
-- STRING, so dates, quantities and amounts are stored as raw text in this layer.

-- Remove any previous copy of the table before it is recreated.
-- NOTE(review): presumably this also resets COPY INTO's record of already
-- loaded files so the CSV is ingested again on every run - confirm before
-- removing the DROP in favour of CREATE OR REPLACE alone.
DROP TABLE IF EXISTS etl.bronze.crm_sales_details;

CREATE OR REPLACE TABLE etl.bronze.crm_sales_details(
  sls_ord_num STRING,
  sls_prd_key STRING,
  sls_cust_id STRING,
  sls_order_dt STRING,
  sls_ship_dt STRING,
  sls_due_dt STRING,
  sls_sales STRING,
  sls_quantity STRING,
  sls_price STRING
);

-- String literals are single-quoted so they remain literals even if the
-- session treats double-quoted text as identifiers.
-- 'header' = 'true': the first line of the file is read as the header row.
COPY INTO etl.bronze.crm_sales_details
FROM 'abfss://landing@storagee2eproject.dfs.core.windows.net/crm/sales_details.csv'
FILEFORMAT = CSV
FORMAT_OPTIONS ('header' = 'true');

num_affected_rows,num_inserted_rows,num_skipped_corrupt_files
60398,60398,0


### Load `erp_cust_az12` table to bronze

In [0]:
%sql
-- Bronze load for the ERP CUST_AZ12 file: rebuild etl.bronze.erp_cust_az12 from
-- scratch and ingest the landing CSV as-is. Every column is declared STRING, so
-- no casting or cleansing happens in this cell.
--
-- The table name is written in lower case to match the crm_* bronze tables;
-- table identifiers are case-insensitive, so this resolves to the same table.
-- The file name inside the abfss path keeps its original casing.

-- Remove any previous copy of the table before it is recreated.
-- NOTE(review): presumably this also resets COPY INTO's record of already
-- loaded files so the CSV is ingested again on every run - confirm before
-- removing the DROP in favour of CREATE OR REPLACE alone.
DROP TABLE IF EXISTS etl.bronze.erp_cust_az12;

CREATE OR REPLACE TABLE etl.bronze.erp_cust_az12(
  CID STRING,
  BDATE STRING,
  GEN STRING
);

-- String literals are single-quoted so they remain literals even if the
-- session treats double-quoted text as identifiers.
-- 'header' = 'true': the first line of the file is read as the header row.
COPY INTO etl.bronze.erp_cust_az12
FROM 'abfss://landing@storagee2eproject.dfs.core.windows.net/erp/CUST_AZ12.csv'
FILEFORMAT = CSV
FORMAT_OPTIONS ('header' = 'true');

num_affected_rows,num_inserted_rows,num_skipped_corrupt_files
18484,18484,0


### Load `erp_loc_a101` table to bronze

In [0]:
%sql
-- Bronze load for the ERP LOC_A101 file: rebuild etl.bronze.erp_loc_a101 from
-- scratch and ingest the landing CSV as-is. Both columns are declared STRING,
-- so no casting or cleansing happens in this cell.
--
-- The table name is written in lower case to match the crm_* bronze tables;
-- table identifiers are case-insensitive, so this resolves to the same table.
-- The file name inside the abfss path keeps its original casing.

-- Remove any previous copy of the table before it is recreated.
-- NOTE(review): presumably this also resets COPY INTO's record of already
-- loaded files so the CSV is ingested again on every run - confirm before
-- removing the DROP in favour of CREATE OR REPLACE alone.
DROP TABLE IF EXISTS etl.bronze.erp_loc_a101;

CREATE OR REPLACE TABLE etl.bronze.erp_loc_a101(
  CID STRING,
  CNTRY STRING
);

-- String literals are single-quoted so they remain literals even if the
-- session treats double-quoted text as identifiers.
-- 'header' = 'true': the first line of the file is read as the header row.
COPY INTO etl.bronze.erp_loc_a101
FROM 'abfss://landing@storagee2eproject.dfs.core.windows.net/erp/LOC_A101.csv'
FILEFORMAT = CSV
FORMAT_OPTIONS ('header' = 'true');

num_affected_rows,num_inserted_rows,num_skipped_corrupt_files
18484,18484,0


### Load `erp_px_cat_g1v2` table to bronze

In [0]:
%sql
-- Bronze load for the ERP PX_CAT_G1V2 file: rebuild etl.bronze.erp_px_cat_g1v2
-- from scratch and ingest the landing CSV as-is. Every column is declared
-- STRING, so no casting or cleansing happens in this cell.
--
-- The table name is written in lower case to match the crm_* bronze tables;
-- table identifiers are case-insensitive, so this resolves to the same table.
-- The file name inside the abfss path keeps its original casing.

-- Remove any previous copy of the table before it is recreated.
-- NOTE(review): presumably this also resets COPY INTO's record of already
-- loaded files so the CSV is ingested again on every run - confirm before
-- removing the DROP in favour of CREATE OR REPLACE alone.
DROP TABLE IF EXISTS etl.bronze.erp_px_cat_g1v2;

CREATE OR REPLACE TABLE etl.bronze.erp_px_cat_g1v2(
  ID STRING,
  CAT STRING,
  SUBCAT STRING,
  MAINTENANCE STRING
);

-- String literals are single-quoted so they remain literals even if the
-- session treats double-quoted text as identifiers.
-- 'header' = 'true': the first line of the file is read as the header row.
COPY INTO etl.bronze.erp_px_cat_g1v2
FROM 'abfss://landing@storagee2eproject.dfs.core.windows.net/erp/PX_CAT_G1V2.csv'
FILEFORMAT = CSV
FORMAT_OPTIONS ('header' = 'true');

num_affected_rows,num_inserted_rows,num_skipped_corrupt_files
37,37,0
