# Exploratory Data Analysis (AQI Predictor)

## Goal
- Analyze seasonality and long-term trends in the Air Quality Index (AQI).
- Check feature correlations.
- Visualize distribution of AQI levels.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import hopsworks
import os
from dotenv import load_dotenv

# Load variables from a .env file into the process environment (python-dotenv).
load_dotenv()

# Log in to Hopsworks and open the project's feature store.
project = hopsworks.login()
fs = project.get_feature_store()

# Read version 1 of the 'aqi_readings' feature group into a DataFrame.
aqi_fg = fs.get_feature_group(name='aqi_readings', version=1)
df = aqi_fg.read()

# Parse the 'date' column as datetimes, then order the rows chronologically.
df = df.assign(date=pd.to_datetime(df['date'])).sort_values(by='date')

# Preview the first rows (rendered as the cell's output).
df.head()

In [None]:
# Trend Analysis: line plot of the 'aqi' column against 'date'.
fig, ax = plt.subplots(figsize=(15, 6))
ax.plot(df['date'], df['aqi'])
ax.set_title('AQI Trend over Time')
ax.set_xlabel('Date')
ax.set_ylabel('AQI')
plt.show()

In [None]:
# Correlation Matrix: annotated heatmap of pairwise column correlations.
#
# numeric_only=True is passed explicitly: since pandas 2.0, DataFrame.corr()
# defaults to numeric_only=False and no longer silently drops non-numeric
# columns, so any column that cannot be converted to float (e.g. strings)
# makes the call raise. Restricting to numeric columns restores the pre-2.0
# behavior and keeps the parsed 'date' column out of the matrix.
# NOTE: the numeric_only parameter requires pandas >= 1.5.
corr_matrix = df.corr(numeric_only=True)

plt.figure(figsize=(12, 10))
sns.heatmap(corr_matrix, annot=True, cmap='coolwarm')
plt.title('Feature Correlation Matrix')
plt.show()