# Exploratory Data Analysis for Financial Data at Nova Financial Solutions
## 1. Import Libraries and Utility Functions

In [None]:
import sys
import os
import pandas as pd

# Make the project's `src` directory importable from this notebook.
# The notebook is expected to be run from the notebooks folder, so the
# project root is one level above the current working directory.
notebook_dir = os.getcwd()  # current working directory (notebooks folder)
project_dir = os.path.abspath(os.path.join(notebook_dir, os.pardir))  # one level up
scripts_dir = os.path.join(project_dir, 'src')  # where the helper modules imported below are expected to live
# Guard the append so re-running this cell does not pile up duplicate entries.
if scripts_dir not in sys.path:
    sys.path.append(scripts_dir)


In [None]:
from IPython.display import display
from load_data import load_data

In [None]:
import importlib
import eda_data
# Re-execute the eda_data module so edits made to it are picked up without
# restarting the interpreter session. The from-import below must come after
# the reload so the imported names bind to the freshly loaded definitions.
importlib.reload(eda_data)
from eda_data import (data_overview, descriptive_statistics, text_analysis, time_series_analysis, publisher_analysis)

## 2. Importing Financial News and Stock Price Integration Data

In [None]:
# Read the raw analyst-ratings CSV into the working DataFrame.
# The path is relative to the current working directory.
raw_ratings_csv = '../data/raw/raw_analyst_ratings.csv'
df = load_data(raw_ratings_csv)

## 3. Data Overview

In [None]:
# Build the overview of the loaded DataFrame with the eda_data helper and
# print it. NOTE(review): the structure of the returned object is defined in
# eda_data.data_overview and is not visible from this notebook.
overview = data_overview(df)
print(overview)

In [None]:
# Drop the unnamed column.
# NOTE(review): 'Unnamed: 0' is presumably the index column left over from an
# earlier CSV export - confirm against the raw file.
# DataFrame.drop returns a new frame by default; with inplace=True it returns
# None, so combining inplace=True with reassignment would rebind df to None.
# errors='ignore' keeps the cell safe to re-run once the column is gone.
df = df.drop(columns=['Unnamed: 0'], errors='ignore')

## 1. Descriptive Statistics

In [None]:
# Compute the descriptive statistics once; the cells below index the result
# by key ('headline_length', 'active_publishers', 'date_counts', 'time_counts').
ds = descriptive_statistics(df)

In [None]:
# Headline length description: the 'headline_length' entry of ds.
# NOTE(review): presumably summary statistics of headline length - confirm in
# eda_data.descriptive_statistics.
print("Headline Length",ds['headline_length'])

In [None]:
# Active publishers description: the 'active_publishers' entry of ds.
# NOTE(review): presumably article counts per publisher - confirm in
# eda_data.descriptive_statistics.
print("active_publishers",ds['active_publishers'])

In [None]:
# Frequency per day: the 'date_counts' entry of ds.
print("date_counts",ds['date_counts'])

In [None]:
# Frequency per hour: the 'time_counts' entry of ds.
print("time_counts", ds['time_counts'])

## 2. Text Analysis

In [None]:
# Run the text analysis helper on the DataFrame and print what it returns.
# NOTE(review): the return structure is defined in eda_data.text_analysis and
# is not visible from this notebook.
txt_analysis = text_analysis(df)
print(txt_analysis)

## 3. Time Series Analysis

In [None]:
# Time series analysis: the helper's result is unpacked into two objects,
# which are then displayed in order.
fig1, fig2 = time_series_analysis(df)
for figure in (fig1, fig2):
    display(figure)

## 4. Publisher Analysis


In [None]:
# Publisher analysis: build the result with the eda_data helper and display it.
# NOTE: this rebinds fig1, so the time-series object assigned to fig1 in the
# previous section is no longer reachable under that name.
fig1 = publisher_analysis(df)
display(fig1)