# Housing Insights & Risk Dashboard  
## Data Engineering & Forecasting Notebook  
### Models: ARIMA, Prophet, LSTM
#### Author: Yuri Spizhovyi
#### Environment: Google Colab + Python + Pandas + Statsmodels + TensorFlow
#### Objective:
- Load datasets (HPI, rent, demographics, macro, metrics)
- Explore trends, seasonality, missingness
- Define feature engineering strategy
- Prepare feature tables for ARIMA, Prophet, LSTM

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Notebook-wide display settings, applied once before any output is produced.
# Passing None removes the column cap, so wide DataFrames print every column.
pd.set_option("display.max_columns", None)
# Apply the "seaborn-v0_8" matplotlib style sheet to all subsequent figures.
plt.style.use("seaborn-v0_8")

In [None]:
# Load the five raw CSV extracts and print a quick preview of each one.
# The directory is kept in a single constant so it can be changed in one place.
RAW_DATA_DIR = "/data/raw"

df_hpi = pd.read_csv(f"{RAW_DATA_DIR}/house_price_index.csv")
df_rent = pd.read_csv(f"{RAW_DATA_DIR}/rent_index.csv")
df_demo = pd.read_csv(f"{RAW_DATA_DIR}/demographics.csv")
df_macro = pd.read_csv(f"{RAW_DATA_DIR}/macro_economic_data.csv")
df_metrics = pd.read_csv(f"{RAW_DATA_DIR}/metrics.csv")

# Name -> DataFrame lookup so every dataset can be inspected in one loop.
dfs = {
    "house_price_index": df_hpi,
    "rent_index": df_rent,
    "demographics": df_demo,
    "macro_economic": df_macro,
    "metrics": df_metrics,
}

for name, df in dfs.items():
    print(f"\n===== {name.upper()} =====")
    print(df.head())
    # DataFrame.info() writes its summary to stdout itself and returns None,
    # so it is called directly; wrapping it in print() would append a stray
    # "None" line after every summary.
    df.info()