In [None]:
# Import required libraries

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score

In [None]:
# Read the training CSV from the notebook's working directory into a DataFrame
data = pd.read_csv(filepath_or_buffer="train.csv")

# Preview the first five rows as a quick sanity check on the load
data.head(5)

In [None]:
# Keep only the three predictor columns and the target column used by the model
selected_columns = ['GrLivArea', 'BedroomAbvGr', 'FullBath', 'SalePrice']

# Select the columns and drop incomplete rows in one chained, non-inplace
# expression. Calling dropna(inplace=True) on the result of a column selection
# can raise SettingWithCopyWarning on pandas versions without copy-on-write;
# chaining builds a fresh frame instead of mutating a derived one.
data = data[selected_columns].dropna()

# Preview the cleaned frame
data.head()

In [None]:
# Heatmap of the pairwise correlations between the selected columns
corr_matrix = data.corr()

fig, ax = plt.subplots(figsize=(6, 4))
sns.heatmap(corr_matrix, annot=True, cmap="coolwarm", ax=ax)
ax.set_title("Feature Correlation Matrix")
plt.show()

In [None]:
# Split the frame into the predictor matrix (X) and the target vector (y)
feature_columns = ['GrLivArea', 'BedroomAbvGr', 'FullBath']
target_column = 'SalePrice'

X = data[feature_columns]
y = data[target_column]

In [None]:
# Hold out 20% of the rows for evaluation; the fixed seed makes the split repeatable
split_options = {"test_size": 0.2, "random_state": 42}
X_train, X_test, y_train, y_test = train_test_split(X, y, **split_options)

In [None]:
# Fit an ordinary least-squares linear regression on the training split.
# fit() returns the estimator itself, so construction and fitting can be chained.
model = LinearRegression().fit(X_train, y_train)

# Leave the fitted estimator as the cell's last expression so its repr is displayed
model

In [None]:
# Predict sale prices for the held-out test features
y_pred = model.predict(X=X_test)

In [None]:
# Score the test-set predictions against the true prices
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

# Report each metric on its own line
for label, value in (("Mean Squared Error (MSE):", mse), ("R2 Score:", r2)):
    print(label, value)

In [None]:
# Scatter of true vs. predicted prices on the test split
fig, ax = plt.subplots(figsize=(6, 4))
ax.scatter(y_test, y_pred)
ax.set_xlabel("Actual Prices")
ax.set_ylabel("Predicted Prices")
ax.set_title("Actual vs Predicted House Prices")
plt.show()

In [None]:
# Show the fitted parameters: the intercept first, then the coefficient array
fitted_parameters = (
    ("Intercept:", model.intercept_),
    ("Coefficients:", model.coef_),
)
for label, value in fitted_parameters:
    print(label, value)

In [None]:
# Print the fitted model as a readable equation.
# Coefficients are paired with feature names in the order the model was trained on.
print("\nRegression Equation:")

equation_parts = ["SalePrice =", model.intercept_]
for coefficient, feature in zip(model.coef_, ("GrLivArea", "BedroomAbvGr", "FullBath")):
    equation_parts += ["+", coefficient, f"* {feature}"]

print(*equation_parts)

In [None]:
# In this project, a Linear Regression model was implemented to predict house sale prices (SalePrice) using:
# - Square footage (GrLivArea)
# - Number of bedrooms (BedroomAbvGr)
# - Number of full bathrooms (FullBath)

# The model achieved an R² score of approximately 0.63, indicating moderate predictive power.
#Square footage was found to be the most influential feature.

#This demonstrates that linear regression can effectively model housing prices using structural features.