<a href="https://colab.research.google.com/github/ashfiya-06/GenAi_2303A52366/blob/main/GenAI_Assignment_7_1.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, OneHotEncoder
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.optimizers import Adadelta
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score
from sklearn.compose import ColumnTransformer

# 1. Load the dataset
df = pd.read_csv("Housing (1).csv")  # Ensure the correct filename

# 2. Preprocess the data (Handle missing values, normalize)
df.dropna(inplace=True)  # Drop missing values

# Correctly identify categorical and numerical features
categorical_features = ['mainroad', 'guestroom', 'basement', 'hotwaterheating', 'airconditioning', 'prefarea', 'furnishingstatus']
numerical_features = ['area', 'bedrooms', 'bathrooms', 'stories', 'parking']

# Create a ColumnTransformer to handle different feature types
preprocessor = ColumnTransformer(
    transformers=[
        ('num', StandardScaler(), numerical_features),
        ('cat', OneHotEncoder(sparse_output=False, handle_unknown='ignore'), categorical_features) # One-hot encode categorical features
    ])

# Assume the 'price' column is the target and the rest are features
X = df[numerical_features + categorical_features]  # Features (numerical and categorical)
y = df['price'].values   # Target (House Price)

# Train-test split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Apply the preprocessing pipeline
X_train = preprocessor.fit_transform(X_train)
X_test = preprocessor.transform(X_test)

# 3. Build ANN Model
model = Sequential([
    Dense(8, activation='relu', input_shape=(X_train.shape[1],)),
    Dense(16, activation='relu'),
    Dense(20, activation='relu'),
    Dense(10, activation='relu'),
    Dense(1, activation='linear')  # Linear activation for regression
])

# Compile the model
model.compile(optimizer=Adadelta(), loss='mean_squared_error', metrics=['mae'])

# 4. Train the model
model.fit(X_train, y_train, epochs=150, batch_size=64, validation_data=(X_test, y_test), verbose=1)

# 5. Evaluate the model
y_pred = model.predict(X_test)
mae = mean_absolute_error(y_test, y_pred)
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

print(f"Mean Absolute Error: {mae}")
print(f"Mean Squared Error: {mse}")
print(f"R2 Score: {r2}")

# 6. Save the trained model
model.save("house_price_model.h5")

print("Model saved as 'house_price_model.h5' 🚀")

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


Epoch 1/150
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m2s[0m 30ms/step - loss: 23838582636544.0000 - mae: 4592207.0000 - val_loss: 30129992499200.0000 - val_mae: 5007536.5000
Epoch 2/150
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 9ms/step - loss: 25955600957440.0000 - mae: 4746811.5000 - val_loss: 30129992499200.0000 - val_mae: 5007536.5000
Epoch 3/150
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 9ms/step - loss: 25421229850624.0000 - mae: 4729150.0000 - val_loss: 30129992499200.0000 - val_mae: 5007536.5000
Epoch 4/150
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 9ms/step - loss: 24097801109504.0000 - mae: 4623217.0000 - val_loss: 30129992499200.0000 - val_mae: 5007536.5000
Epoch 5/150
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 10ms/step - loss: 25281945403392.0000 - mae: 4713323.0000 - val_loss: 30129992499200.0000 - val_mae: 5007536.5000
Epoch 6/150
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m 



Mean Absolute Error: 5007536.5
Mean Squared Error: 30129990402048.0
R2 Score: -4.960939884185791
Model saved as 'house_price_model.h5' 🚀
