### Create a database

In [0]:
%sql
-- Create the demo database only when it is not already present.
CREATE DATABASE IF NOT EXISTS my_db;

### Switch to the newly created database

In [0]:
%sql
-- Make my_db the current database for the statements that follow.
USE DATABASE my_db;

### Create a table within the database

In [0]:
%sql
-- Remove any previous copy of the table so this cell can be re-run from scratch.
DROP TABLE IF EXISTS my_test_table;

-- Two-column customer table used by the rest of the notebook.
CREATE TABLE my_test_table (
  customer_id   INT,
  customer_name STRING
);

### Insert data into the table

In [0]:
%sql
-- Append two customer rows.
-- NOTE: 0001 and 0002 are plain integer literals; customer_id is an INT,
-- so the leading zeros are not kept.
INSERT INTO my_test_table
VALUES
  (0001, "vikky"),
  (0002, "sam");

-- Read the table back to check the inserted rows.
SELECT * FROM my_test_table;

In [0]:
# The previous cells insert data into a table with SQL and query it back in Databricks.
# This cell repeats those steps through the Python API and shows a few additional
# operations you can perform on Spark tables and DataFrames.
from pyspark.sql.functions import upper

# 1. Create the table (if it does not exist yet).
#    The columns match the definition used by the earlier SQL cell
#    (customer_id, customer_name). When the table already exists this statement
#    is a no-op, so the DataFrame code below must use the existing column names.
spark.sql("""
CREATE TABLE IF NOT EXISTS my_test_table (
  customer_id INT,
  customer_name STRING
)
""")

# 2. Insert data into the table.
#    INSERT INTO appends: rows already present in the table are kept and
#    these two rows are added on top of them.
spark.sql("""
INSERT INTO my_test_table VALUES
  (1, 'vikky'),
  (2, 'sam')
""")

# 3. Query the table using SQL.
df_sql = spark.sql("SELECT * FROM my_test_table")
display(df_sql)

# 4. Query the table using the DataFrame API.
df = spark.table("my_test_table")
display(df)

# 5. Filter rows where the customer name is 'vikky'.
filtered_df = df.filter(df.customer_name == 'vikky')
display(filtered_df)

# 6. Add a new column holding the upper-cased customer name.
df_with_upper = df.withColumn("name_upper", upper(df.customer_name))
display(df_with_upper)

# 7. Count the number of rows.
row_count = df.count()
print(f"Row count: {row_count}")

# 8. Cleanup is intentionally NOT performed here: the cells that follow still
#    read my_test_table, and dropping it at this point makes them fail.
#    Run the statement below only once the table is no longer needed.
# spark.sql("DROP TABLE IF EXISTS my_test_table")

In [0]:
# Read the whole table back through Spark SQL and render the result.
df_sql = spark.sql(
    "SELECT * FROM my_test_table"
)
display(df_sql)

### Convert the table into a DataFrame

In [0]:
# Load the table into a DataFrame with spark.table and render it.
# NOTE(review): `col` is not used in this cell; the import is kept in case
# other cells rely on it.
from pyspark.sql.functions import col

sql2df = spark.table("my_test_table")
display(sql2df)

### Catalog
Unity Catalog in Databricks

Unity Catalog is a unified governance solution for all data and AI assets, including files, tables, and machine learning models in your Databricks workspace. It provides a centralized governance model that standardizes data governance across all data assets.

Let's explore some basic operations with Unity Catalog.

1. Create a Catalog
A catalog is the highest level of organization in Unity Catalog. It contains schemas (databases), which in turn contain tables and views.


In [0]:
%sql
-- 1. Create the catalog (only if it is missing) and make it the current one.
CREATE CATALOG IF NOT EXISTS my_catalog;
USE CATALOG my_catalog;

-- 2. Create a schema (database) within the catalog and switch to it.
--    Schemas are used to organize tables and views within a catalog.
CREATE SCHEMA IF NOT EXISTS my_schema;
USE SCHEMA my_schema;

-- 3. Create a table within the schema. Tables are used to store structured data.
--    Dropping any previous copy first lets this cell be re-run from scratch.
DROP TABLE IF EXISTS my_test;
CREATE TABLE IF NOT EXISTS my_test (
  name   STRING,
  salary INT,
  gender STRING
);

-- 4. Insert data into the table, then read it back.
INSERT INTO my_test
VALUES
  ("vikky", 10000, "male"),
  ("sam",   20000, "female"),
  ("hema",  30000, "female");

SELECT * FROM my_test;

-- 5. Create a view within the schema. Views are used to present a subset of
--    data from a table or another view. The statement is currently disabled:
-- CREATE OR REPLACE VIEW my_view AS SELECT * FROM my_test WHERE gender = "female";

-- 6. Query the table (the view query is disabled together with the view).
SELECT * FROM my_test;
-- SELECT * FROM my_view;



In [0]:

# 7. Interact with the table using Python.
# Query it by its three-part name (catalog.schema.table) into a DataFrame
# and render the result.
df = spark.sql(
    'select * from my_catalog.my_schema.my_test'
)
display(df)

In [0]:
%sh
# Print the shell's current working directory.
pwd