# Hybrid Multiple Linear Regression Model

In [2]:
import pandas as pd
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score
import joblib

# Read the full dataset from the Excel workbook.
data = pd.read_excel("data4.xlsx")

# Predictors are the columns AD, AD2, E and T; the response is column R.
# Per the original author's notes AD is advertising spend and R is sales
# revenue. NOTE(review): AD2 is presumably AD squared -- confirm against
# the workbook.
feature_columns = ['AD', 'AD2', 'E', 'T']
target_column = 'R'
X = data[feature_columns]
Y = data[target_column]

# Fit a linear regression on every row. There is no train/test split, so
# the metrics reported below are computed on the training data itself.
model = LinearRegression().fit(X, Y)
Y_pred = model.predict(X)

# In-sample error and goodness of fit.
mse = mean_squared_error(Y, Y_pred)
r2 = r2_score(Y, Y_pred)
print("Mean Squared Error (MSE):", mse)
print("R-squared (R²):", r2)

# Fitted parameters: one coefficient per predictor, in column order,
# followed by the intercept.
print("\nModel Coefficients:")
for col, coef in zip(X.columns, model.coef_):
    print(f"{col}: {coef}")
print("Intercept (a):", model.intercept_)

# Persist the fitted estimator to disk with joblib.
model_filename = 'final_regression_model.joblib'
joblib.dump(model, model_filename)
print(f"\nModel saved as {model_filename}")


Mean Squared Error (MSE): 1.658626168344379e-20
R-squared (R²): 1.0

Model Coefficients:
AD: 1000.0000000000003
AD2: -1.0000000000000004
E: 2.616798896237023e-14
T: -6.361921006974356e-13
Intercept (a): 8.731149137020111e-11

Model saved as final_regression_model.joblib
