## Set up

### Imports

In [None]:
import logging
import pandas as pd

from scripts import get_session, load_data_to_db, load_config, setup_logging, clean_data

### Config

In [None]:
# Load the project configuration, then hand the configured log path to
# setup_logging. Any failure is logged and re-raised unchanged.
try:
    config = load_config()
    log_path = config["paths"]["log_path"]
    setup_logging(log_path)
    logging.info("Starting the data analysis project.")
except Exception as exc:
    logging.error(f"Failed to load config or setup logging: {exc}")
    raise

### Create session

In [None]:
# Create the database session via the project helper. On failure the error is
# logged and the original exception is re-raised.
try:
    session = get_session()
    logging.info("Database session created successfully.")
except Exception as exc:
    failure_message = f"Failed to create database session: {exc}"
    logging.error(failure_message)
    raise

### Fetch data

In [None]:
# Read the raw catalog and replace every missing value with an empty string
# (presumably so the string concatenation below never yields NaN).
netflix_df = pd.read_csv("../../data/raw/netflix_catalog.csv")
netflix_df.fillna("", inplace=True)

# Build one space-separated "text" column from the descriptive fields,
# joining them left to right in the order listed here.
text_columns = ["title", "cast", "country", "listed_in", "description"]
combined_text = netflix_df[text_columns[0]]
for column_name in text_columns[1:]:
    combined_text = combined_text + " " + netflix_df[column_name]
netflix_df["text"] = combined_text

# Run the project's cleaning step and preview the first rows of the result.
cleaned_data = clean_data(netflix_df)
print(cleaned_data.head())

### Load data to database

In [None]:
# Pass the cleaned catalog to the project's loader, targeting the
# "netflix_catalog" table.
load_data_to_db(
    cleaned_data,
    table_name="netflix_catalog",
)