### Week 12: AI in Data Science – Case Studies (House Price Prediction)

In [1]:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score
import matplotlib.pyplot as plt
import warnings

warnings.filterwarnings("ignore")


### Load Dataset

In [2]:
# Load your project dataset
df = pd.read_csv(r"C:\Users\123\Documents\Semester 7\Data-Science-AI-Course\Data\Raw\house_prices.csv")

# Strip spaces from column names
df.columns = df.columns.str.strip()

# Check columns
print("Columns in CSV:", df.columns.tolist())


Columns in CSV: ['Id', 'MSSubClass', 'MSZoning', 'LotFrontage', 'LotArea', 'Street', 'Alley', 'LotShape', 'LandContour', 'Utilities', 'LotConfig', 'LandSlope', 'Neighborhood', 'Condition1', 'Condition2', 'BldgType', 'HouseStyle', 'OverallQual', 'OverallCond', 'YearBuilt', 'YearRemodAdd', 'RoofStyle', 'RoofMatl', 'Exterior1st', 'Exterior2nd', 'MasVnrType', 'MasVnrArea', 'ExterQual', 'ExterCond', 'Foundation', 'BsmtQual', 'BsmtCond', 'BsmtExposure', 'BsmtFinType1', 'BsmtFinSF1', 'BsmtFinType2', 'BsmtFinSF2', 'BsmtUnfSF', 'TotalBsmtSF', 'Heating', 'HeatingQC', 'CentralAir', 'Electrical', '1stFlrSF', '2ndFlrSF', 'LowQualFinSF', 'GrLivArea', 'BsmtFullBath', 'BsmtHalfBath', 'FullBath', 'HalfBath', 'BedroomAbvGr', 'KitchenAbvGr', 'KitchenQual', 'TotRmsAbvGrd', 'Functional', 'Fireplaces', 'FireplaceQu', 'GarageType', 'GarageYrBlt', 'GarageFinish', 'GarageCars', 'GarageArea', 'GarageQual', 'GarageCond', 'PavedDrive', 'WoodDeckSF', 'OpenPorchSF', 'EnclosedPorch', '3SsnPorch', 'ScreenPorch', 'Poo

#### Features & Target

In [3]:
target_column = 'SalePrice'

# Keep only numeric features
X = df.select_dtypes(include=[np.number]).drop(target_column, axis=1)
y = df[target_column]

# Fill missing values
X = X.fillna(0)        # Or X.fillna(X.mean())
y = y.fillna(y.mean())

# Train/test split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Feature scaling
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)


### Train Baseline Model

In [4]:
from sklearn.linear_model import LinearRegression

lr = LinearRegression()
lr.fit(X_train, y_train)

y_pred_lr = lr.predict(X_test)

mae_lr = mean_absolute_error(y_test, y_pred_lr)
rmse_lr = np.sqrt(mean_squared_error(y_test, y_pred_lr))
r2_lr = r2_score(y_test, y_pred_lr)

print("Linear Regression Performance:")
print("MAE:", mae_lr)
print("RMSE:", rmse_lr)
print("R2 Score:", r2_lr)


Linear Regression Performance:
MAE: 22232.276449969402
RMSE: 36102.10157801991
R2 Score: 0.8300774043836086


#### Week 12 Focus: AI Case Studies Reflection

In [6]:
# Example text output summarizing case studies
ai_healthcare = """
In healthcare, AI is used for disease prediction, medical imaging, and patient risk assessment. 
Techniques like deep learning help doctors make accurate and timely decisions.
"""

ai_finance = """
In finance, AI assists in fraud detection, credit scoring, algorithmic trading, and risk management. 
Machine learning models process large volumes of data to improve financial decision-making.
"""

print("AI in Healthcare Case Study:\n", ai_healthcare)
print("\nAI in Finance Case Study:\n", ai_finance)

# Reflect how your House Price Prediction project could fit real-world context
project_real_world = """
House Price Prediction can be applied in the real estate sector to estimate property prices, 
assist banks for mortgage assessment, and support investors in buying/selling decisions. 
Integrating AI models ensures data-driven predictions, reduces human bias, and increases transparency in property valuation.
"""
print("\nProject Real-World Application:\n", project_real_world)


AI in Healthcare Case Study:
 
In healthcare, AI is used for disease prediction, medical imaging, and patient risk assessment. 
Techniques like deep learning help doctors make accurate and timely decisions.


AI in Finance Case Study:
 
In finance, AI assists in fraud detection, credit scoring, algorithmic trading, and risk management. 
Machine learning models process large volumes of data to improve financial decision-making.


Project Real-World Application:
 
House Price Prediction can be applied in the real estate sector to estimate property prices, 
assist banks for mortgage assessment, and support investors in buying/selling decisions. 
Integrating AI models ensures data-driven predictions, reduces human bias, and increases transparency in property valuation.



#### Weekly Assignment Output

In [7]:
# Summarize performance metrics of previous models + LSTM (Week 10)
results = pd.DataFrame({
    'Model': ['Linear Regression', 'Decision Tree', 'Random Forest', 'ANN (Week 9)', 'LSTM (Week 10)'],
    'MAE': [mae_lr, 0, 0, 0, 0],  # Replace 0 with previous results
    'RMSE': [rmse_lr, 0, 0, 0, 0],
    'R2 Score': [r2_lr, 0, 0, 0, 0]
})

results


Unnamed: 0,Model,MAE,RMSE,R2 Score
0,Linear Regression,22232.27645,36102.101578,0.830077
1,Decision Tree,0.0,0.0,0.0
2,Random Forest,0.0,0.0,0.0
3,ANN (Week 9),0.0,0.0,0.0
4,LSTM (Week 10),0.0,0.0,0.0


#### Project Milestone (Week 12)

In [8]:
# Milestone output
milestone = """
This week’s milestone: Connected the House Price Prediction project to real-world applications 
in the real estate and finance sectors. Demonstrated AI case study understanding and practical relevance.
"""
print(milestone)



This week’s milestone: Connected the House Price Prediction project to real-world applications 
in the real estate and finance sectors. Demonstrated AI case study understanding and practical relevance.

