In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import sys
# Put the parent directory on the module search path so the `src` package
# imported below can be resolved.
# NOTE(review): assumes the notebook is run from a directory directly under
# the project root — confirm.
sys.path.append('..')

from src.data.collector import DataCollector
from src.data.processor import DataProcessor

# Render matplotlib figures inline, directly below the cell that draws them.
%matplotlib inline
# Use seaborn's 'darkgrid' style for the plots drawn in this notebook.
sns.set_style('darkgrid')


In [None]:
# Download parameters, gathered in one place so the instrument or the time
# window can be changed without hunting through the call below.
SYMBOL = 'AAPL'
INTERVAL = '5m'
PERIOD = '7d'

# Fetch the price history without persisting it (save=False).
collector = DataCollector()
df = collector.fetch_historical_data(SYMBOL, interval=INTERVAL, period=PERIOD, save=False)

# Fail fast with a clear message: every later cell reads `df`, and an empty
# (or missing) result would otherwise only show up as blank charts or an
# unrelated AttributeError further down.
if df is None or df.empty:
    raise ValueError(
        f"No data returned for {SYMBOL} (interval={INTERVAL}, period={PERIOD})"
    )

print(f"Data shape: {df.shape}")
# Last expression of the cell: rich display of the first rows.
df.head()

In [None]:
# Per-column summary statistics of the fetched frame (pandas' default
# `describe()` output), shown as the cell's rich display.
df.describe()

In [None]:
# Line chart of the 'Close' column against the frame's index.
fig, ax = plt.subplots(figsize=(14, 6))
ax.plot(df.index, df['Close'], label='Close Price')
ax.set(title='AAPL Price Chart', xlabel='Date', ylabel='Price ($)')
ax.legend()
plt.show()

In [None]:
# Bar chart of the 'Volume' column against the frame's index.
#
# Matplotlib draws bars 0.8 data units wide by default, and on a date axis one
# data unit is one day. With intraday samples that makes each bar span most of
# a day and pile on top of its neighbours, so the width is sized to 80% of the
# typical gap between consecutive samples instead.
# NOTE(review): assumes a datetime-like index; any other index keeps the
# matplotlib default width.
bar_width = 0.8
if len(df.index) > 1 and pd.api.types.is_datetime64_any_dtype(df.index):
    # Median rather than mean, so occasional long gaps between samples do not
    # inflate the bar width.
    typical_step = df.index.to_series().diff().median()
    if pd.notna(typical_step) and typical_step > pd.Timedelta(0):
        # Express the spacing in days, the unit matplotlib uses for dates.
        bar_width = 0.8 * (typical_step / pd.Timedelta(days=1))

fig, ax = plt.subplots(figsize=(14, 6))
ax.bar(df.index, df['Volume'], width=bar_width, alpha=0.7)
ax.set_title('Trading Volume')
ax.set_xlabel('Date')
ax.set_ylabel('Volume')
plt.show()

In [None]:
# Period-over-period percentage change of the close, stored on the frame as
# the 'Returns' column.
close_prices = df['Close']
df['Returns'] = close_prices.pct_change()

# Histogram of the returns in 50 bins, drawn on an explicitly created axes.
fig, ax = plt.subplots(figsize=(10, 6))
df['Returns'].hist(bins=50, ax=ax)
ax.set(title='Returns Distribution', xlabel='Returns', ylabel='Frequency')
plt.show()

In [None]:
# Number of null entries in each column, printed under a heading.
null_counts = df.isnull().sum()
print("Missing values:", null_counts, sep="\n")

In [None]:
# Pairwise correlation between the numeric columns of the frame.
numeric_cols = df.select_dtypes(include=[np.number]).columns
correlation = df.loc[:, numeric_cols].corr()

# Annotated heatmap; center=0 pins the midpoint of the 'coolwarm' palette to
# zero correlation.
fig, ax = plt.subplots(figsize=(10, 8))
sns.heatmap(correlation, annot=True, cmap='coolwarm', center=0, ax=ax)
ax.set_title('Feature Correlation Matrix')
plt.show()