# Feature Importance

## Purpose
This notebook identifies the most important features influencing house prices.

## Key Objectives
- Extract feature importances from the trained model.
- Visualize the impact of different features.


In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import pickle

# Load the trained model from disk. The context manager closes the file
# handle as soon as unpickling finishes instead of leaving it open.
# NOTE(review): unpickling can execute arbitrary code; only load model files
# that come from a trusted source.
with open("scripts/random_forest.pkl", "rb") as model_file:
    model = pickle.load(model_file)

# Load the training features; the column labels are used as feature names.
X_train = pd.read_csv("data/X_train.csv")
feature_names = X_train.columns


In [None]:
# Read the per-feature importance scores exposed by the trained model
importance = model.feature_importances_

# Pair each feature name with its score and order the rows from the highest
# importance to the lowest
feature_importance_df = pd.DataFrame(
    {"Feature": feature_names, "Importance": importance}
).sort_values(by="Importance", ascending=False)

# Bar chart with one bar per feature, drawn in the sorted order
plt.figure(figsize=(10, 6))
sns.barplot(data=feature_importance_df, x="Importance", y="Feature")
plt.title("Feature Importance - Housing Price Prediction")
plt.show()
