In [None]:
!unzip house-prices-advanced-regression-techniques.zip -d data

Archive:  house-prices-advanced-regression-techniques.zip
  inflating: data/data_description.txt  
  inflating: data/sample_submission.csv  
  inflating: data/test.csv           
  inflating: data/train.csv          


In [None]:
# Import Required Libraries
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score

In [None]:
# 📥 Read the training CSV into a DataFrame and preview its first five rows
df = pd.read_csv(filepath_or_buffer='data/train.csv')
df.head(n=5)

Unnamed: 0,Id,MSSubClass,MSZoning,LotFrontage,LotArea,Street,Alley,LotShape,LandContour,Utilities,...,PoolArea,PoolQC,Fence,MiscFeature,MiscVal,MoSold,YrSold,SaleType,SaleCondition,SalePrice
0,1,60,RL,65.0,8450,Pave,,Reg,Lvl,AllPub,...,0,,,,0,2,2008,WD,Normal,208500
1,2,20,RL,80.0,9600,Pave,,Reg,Lvl,AllPub,...,0,,,,0,5,2007,WD,Normal,181500
2,3,60,RL,68.0,11250,Pave,,IR1,Lvl,AllPub,...,0,,,,0,9,2008,WD,Normal,223500
3,4,70,RL,60.0,9550,Pave,,IR1,Lvl,AllPub,...,0,,,,0,2,2006,WD,Abnorml,140000
4,5,60,RL,84.0,14260,Pave,,IR1,Lvl,AllPub,...,0,,,,0,12,2008,WD,Normal,250000


In [None]:

# ✅ Pick the predictor columns (X) and the column to be predicted (y)
feature_columns = ['GrLivArea', 'BedroomAbvGr', 'FullBath']
X = df[feature_columns]
y = df['SalePrice']

In [None]:
# 📊 Hold out 20% of the rows for testing; the fixed random_state makes the
# split repeatable from run to run
split_parts = train_test_split(X, y, test_size=0.2, random_state=42)
X_train, X_test, y_train, y_test = split_parts

In [None]:
# 🚀 Fit a linear regression on the training split
model = LinearRegression()
# Kept as a bare trailing expression so the cell still displays the estimator.
model.fit(X=X_train, y=y_train)

In [None]:
# 🔮 Run the fitted model over the held-out test features
y_pred = model.predict(X=X_test)

In [None]:
# 📏 Compare the test-set predictions against the true values
mse = mean_squared_error(y_true=y_test, y_pred=y_pred)
r2 = r2_score(y_true=y_test, y_pred=y_pred)

# A single print with a newline separator emits the same three lines.
print(
    "📊 Model Evaluation:",
    f"Mean Squared Error (MSE): {mse:.2f}",
    f"R² Score: {r2:.4f}",
    sep="\n",
)

📊 Model Evaluation:
Mean Squared Error (MSE): 2806426667.25
R² Score: 0.6341


In [None]:
# 📌 Show the fitted intercept and the weight learned for each feature
# Pair every feature column with its coefficient, in column order.
weights_by_feature = zip(X.columns, model.coef_)

print("\n📌 Model Coefficients:")
print(f"Intercept: {model.intercept_:.2f}")
for column_name, weight in weights_by_feature:
    print(f"{column_name}: {weight:.2f}")


📌 Model Coefficients:
Intercept: 52261.75
GrLivArea: 104.03
BedroomAbvGr: -26655.17
FullBath: 30014.32


In [None]:
# 🏡 Predict the price of one hypothetical house
# Keys are listed in the same order as the feature columns used for training.
house_features = {
    'GrLivArea': 2000,   # 2000 sq ft
    'BedroomAbvGr': 3,   # 3 bedrooms
    'FullBath': 2,       # 2 bathrooms
}
# A one-element list of records builds a single-row DataFrame.
new_house = pd.DataFrame([house_features])
# predict() returns an array; take its only element.
predicted_price = model.predict(new_house)[0]

In [None]:
# 💱 Convert the predicted USD price to INR
# Hard-coded snapshot of the USD→INR exchange rate: it does not update itself,
# so refresh the value before relying on the INR figure.
usd_to_inr = 85.83
predicted_price_inr = predicted_price * usd_to_inr

# The header has no placeholders, so it is a plain string rather than an f-string.
print("\n💰 Predicted Price for New House:")
print(f"USD: ${predicted_price:,.2f}")
print(f"INR: ₹{predicted_price_inr:,.2f}")


💰 Predicted Price for New House:
USD: $240,377.51
INR: ₹20,631,602.10
