In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, LabelEncoder
from sklearn.metrics import mean_absolute_error
from sklearn.linear_model import LinearRegression
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers

# Read the CSV into a DataFrame. `url` holds a placeholder path; point it at
# the real dataset location before running.
url = 'path_to_your_dataset.csv'
data = pd.read_csv(filepath_or_buffer=url)

# Preview the first five rows (rendered as this cell's output)
data.head(n=5)


In [None]:
# Define the model
model = keras.Sequential([
    layers.Input(shape=(X_train_scaled.shape[1],)),
    layers.Dense(64, activation='relu'),
    layers.Dense(32, activation='relu'),
    layers.Dense(1)
])

# Compile the model
model.compile(optimizer='adam', loss='mean_absolute_error')

# Train the model
history = model.fit(X_train_scaled, y_train, epochs=50, validation_split=0.2, verbose=1)


In [None]:
# Convert categorical columns to numeric
label_encoders = {}
for column in ['sex', 'smoker', 'region']:  # Example categorical columns
    le = LabelEncoder()
    data[column] = le.fit_transform(data[column])
    label_encoders[column] = le

# Split the data into features and labels
X = data.drop(columns=['expenses'])
y = data['expenses']

# Split into training and test datasets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Standardize the features
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)


In [None]:
# Score the model on the held-out test split; evaluate() returns the loss value
test_loss = model.evaluate(x=X_test_scaled, y=y_test, verbose=0)
print(f"Mean Absolute Error on test data: {test_loss}")

# Generate predictions for the test features
y_pred = model.predict(X_test_scaled)

# Scatter the actual targets against the model's predictions
fig, ax = plt.subplots(figsize=(10, 6))
ax.scatter(y_test, y_pred, alpha=0.5)
ax.set_xlabel('True Values')
ax.set_ylabel('Predictions')
ax.set_title('True Values vs Predictions')
plt.show()
