# Exploratory Data Analysis (EDA) - Spending Data
This notebook analyzes the synthetic financial data generated for the project.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Load the raw transactions and parse the 'Date' column into datetimes
# in one chained expression, so the cell is safe to re-run.
df = (
    pd.read_csv('../data/raw/transactions.csv')
    .assign(Date=lambda raw: pd.to_datetime(raw['Date']))
)
# Preview the first rows as the cell's output.
df.head()

## 1. Category Distribution
Visualizing which categories have the most expense transactions.

In [None]:
# Keep only the rows flagged as expenses; the anomaly plot further down
# reads `spending_df` as well, so the name is kept as-is.
is_expense = df['Is_Expense'].eq(True)
spending_df = df[is_expense]

# value_counts() sorts by frequency, so the busiest category is drawn first.
category_order = spending_df['Category'].value_counts().index

fig, ax = plt.subplots(figsize=(10, 6))
sns.countplot(data=spending_df, y='Category', order=category_order, ax=ax)
ax.set_title('Transaction Count by Category')
plt.show()

## 2. Anomaly Detection Visualization
Plotting expense amounts by category to reveal the outliers (anomalies) that we injected; anomalous transactions are highlighted in red.

In [None]:
# `spending_df` is the expense-only frame built in the category-distribution
# cell above; that cell must have been run first.
# Colour each point by its anomaly flag: regular rows blue, anomalies red.
anomaly_colors = {False: 'blue', True: 'red'}

fig, ax = plt.subplots(figsize=(10, 6))
sns.scatterplot(
    data=spending_df,
    x='Category',
    y='Amount',
    hue='Is_Anomaly',
    palette=anomaly_colors,
    ax=ax,
)
ax.set_title('Spending Anomalies')
plt.show()