In [2]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression
from sklearn.metrics import r2_score, mean_squared_error, accuracy_score, precision_score, recall_score
from sklearn.tree import DecisionTreeClassifier, plot_tree
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, LabelEncoder
from sklearn.cluster import KMeans

In [3]:
# Q8: fit a multiple linear regression of SalePrice on four house features and
# report the coefficients, fit quality, and the most influential feature.
# The file name lives in one variable so the "not found" message below always
# names the file that was actually requested.
house_csv_q8 = 'trainHouse.csv'
try:
    df_house = pd.read_csv(house_csv_q8)
    features_q8 = ['OverallQual', 'GrLivArea', 'GarageCars', 'YearBuilt']
    # Keep only the modelling columns; drop rows missing a value in any of them.
    df_q8 = df_house[features_q8 + ['SalePrice']].dropna()
    X_q8 = df_q8[features_q8]
    y_q8 = df_q8['SalePrice']

    model_q8 = LinearRegression()
    model_q8.fit(X_q8, y_q8)

    print(f"Intercept: ${model_q8.intercept_:,.2f}")
    print("\nCoefficients:")
    for feat, coef in zip(features_q8, model_q8.coef_):
        print(f"  {feat}: ${coef:,.2f}")

    # coef_ follows the column order of X_q8, i.e. the order of features_q8,
    # so the positional indices below must stay in sync with that list.
    print("\nINTERPRETATION:")
    print(f"  OverallQual: Each point increase adds ${model_q8.coef_[0]:,.2f}")
    print(f"  GrLivArea: Each sq ft adds ${model_q8.coef_[1]:,.2f}")
    print(f"  GarageCars: Each car space adds ${model_q8.coef_[2]:,.2f}")
    print(f"  YearBuilt: Each year newer adds ${model_q8.coef_[3]:,.2f}")

    # NOTE: predictions are made on the same rows the model was fitted on, so
    # R² and RMSE here are in-sample figures, not held-out performance.
    y_pred_q8 = model_q8.predict(X_q8)
    r2_q8 = r2_score(y_q8, y_pred_q8)
    rmse_q8 = np.sqrt(mean_squared_error(y_q8, y_pred_q8))
    print(f"\nR²: {r2_q8:.4f}")
    print(f"RMSE: ${rmse_q8:,.2f}")

    # Raw coefficients are in different units (per point, per sq ft, per year),
    # so each is scaled by its feature's standard deviation before comparing
    # magnitudes.
    max_impact_idx = np.argmax(np.abs(model_q8.coef_ * X_q8.std().values))
    print(f"\nMost impactful feature: {features_q8[max_impact_idx]}")
except FileNotFoundError:
    # Report the file that was actually requested (the original message named
    # a different file than the one being read).
    print(f"House prices dataset ({house_csv_q8}) not found. Please download from Kaggle.")
except Exception as e:
    # Include the exception type: str(KeyError) is only the quoted key, which
    # on its own does not say what went wrong (e.g. a missing column).
    print(f"Error ({type(e).__name__}): {e}")

Intercept: $-791,736.19

Coefficients:
  OverallQual: $22,922.74
  GrLivArea: $56.47
  GarageCars: $16,116.10
  YearBuilt: $364.63

INTERPRETATION:
  OverallQual: Each point increase adds $22,922.74
  GrLivArea: Each sq ft adds $56.47
  GarageCars: Each car space adds $16,116.10
  YearBuilt: Each year newer adds $364.63

R²: 0.7499
RMSE: $39,712.91

Most impactful feature: OverallQual
