# **3D** plot of a multiple linear regression

In [2]:
from sklearn.datasets import make_regression
import pandas as pd
import numpy as np

import plotly.express as px
import plotly.graph_objects as go

from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score

# Create a synthetic dataset with **make_regression()**

In [3]:
# Synthetic regression problem: 100 samples, 2 informative features, 1 target.
# random_state pins the generator so the dataset (and every metric computed
# from it further down) is reproduced exactly on Restart & Run All; without a
# seed each execution draws a different dataset.
x, y = make_regression(
    n_samples=100,
    n_features=2,
    n_informative=2,
    n_targets=1,
    noise=50,
    random_state=42,
)

In [6]:
# Gather the two feature columns and the target into a single labelled frame.
column_names = ['feature_1', 'feature_2', 'target']
column_values = [x[:, 0], x[:, 1], y]
df = pd.DataFrame(dict(zip(column_names, column_values)))

In [7]:
# Preview the first five rows to check the column layout.
df.head(n=5)

Unnamed: 0,feature_1,feature_2,target
0,0.503911,1.332433,142.560317
1,-1.169756,0.467829,38.678248
2,2.826082,-0.756746,1.600958
3,-1.048692,1.227508,44.56443
4,0.047444,0.114967,-3.353617


Plot the dataset as a 3D scatter plot

In [8]:
# Interactive 3D scatter: the two features on the horizontal axes, the target
# on the vertical axis.
fig = px.scatter_3d(
    data_frame=df,
    x='feature_1',
    y='feature_2',
    z='target',
    title='Regression Dataset',
)
fig.show()

In [31]:
from sklearn.model_selection import train_test_split

# Hold out 20% of the rows for evaluation; the fixed random_state keeps the
# split itself repeatable.
split_arrays = train_test_split(x, y, test_size=0.2, random_state=2)
x_train, x_test, y_train, y_test = split_arrays

In [32]:
from sklearn.linear_model import LinearRegression

In [33]:
# Linear regression estimator created with the library's default settings.
lr: LinearRegression = LinearRegression()

In [34]:
# Fit the model on the training split only.
lr.fit(X=x_train, y=y_train)

In [35]:
# Predict the target for the held-out rows.
y_pred = lr.predict(X=x_test)

In [36]:
# Score the held-out predictions.
n_obs = len(y_test)
# Take the predictor count from the data instead of hard-coding 2, so the
# adjusted R2 stays correct if the number of features changes.
n_predictors = x_test.shape[1]

# Computed once and reused for both the plain and the adjusted score.
r2 = r2_score(y_test, y_pred)

print("MSE  : ", mean_squared_error(y_test, y_pred))
print("MAE : ", mean_absolute_error(y_test, y_pred))
print("R2 : ", r2)

# Adjusted R2 = 1 - (1 - R2) * (n - 1) / (n - p - 1)
ad_r2 = 1 - ((1 - r2) * (n_obs - 1)) / (n_obs - 1 - n_predictors)
# Label corrected: the quantity is the *adjusted* R2, not "adjacent".
print("adjusted r2 : ", ad_r2)

MSE  :  2949.703135297777
MAE :  45.473324835792745
R2 :  0.6548126357140708
adjacent r2 :  0.614202357562785


### Regression Evaluation Metrics

Here's an explanation of the regression evaluation metrics used:

*   **Mean Squared Error (MSE):**
    *   MSE measures the average of the squared differences between the predicted and actual values.
    *   It is calculated by taking the average of the squared errors.
    *   MSE gives more weight to larger errors because the errors are squared.
    *   The lower the MSE, the better the model's performance.

*   **Mean Absolute Error (MAE):**
    *   MAE measures the average of the absolute differences between the predicted and actual values.
    *   It is calculated by taking the average of the absolute errors.
    *   MAE is less sensitive to outliers compared to MSE because it doesn't square the errors.
    *   The lower the MAE, the better the model's performance.

*   **R-squared (R2) Score:**
    *   R-squared, also known as the coefficient of determination, is a measure that represents the proportion of the variance in the dependent variable that is predictable from the independent variables.
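    *   It typically ranges from 0 to 1, but it can be negative on held-out data when the model predicts worse than always guessing the mean of the target.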
    *   An R-squared of 1 indicates that the model explains all the variability of the target variable.
    *   An R-squared of 0 indicates that the model explains none of the variability of the target variable.
    *   A higher R-squared generally indicates a better fit.

*   **Adjusted R-squared:**
    *   Adjusted R-squared is a modified version of R-squared that has been adjusted for the number of predictors in the model.
    *   It increases only if the new term improves the model more than would be expected by chance.
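    *   It is useful when comparing models with different numbers of predictors.
    *   It is computed as $R^2_{adj} = 1 - \frac{(1 - R^2)(n - 1)}{n - p - 1}$, where $n$ is the number of samples and $p$ is the number of predictors.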

In [38]:
# Evaluate the fitted model on a regular grid over the feature plane so the
# regression plane can be drawn as a surface.
# NOTE: `x` and `y` are rebound here to the 1-D grid axes (earlier cells used
# them for the dataset arrays). The names are kept because the plotting cell
# that follows reads `x`, `y` and `z`; re-run the dataset cell before
# re-running the train/test split.
grid_points = 10  # resolution along each axis

x = np.linspace(-5, 5, grid_points)  # grid axis for feature_1
y = np.linspace(-5, 5, grid_points)  # grid axis for feature_2

# meshgrid(x, y) returns arrays of shape (len(y), len(x)): columns follow x
# and rows follow y. The previous (y, x) order was only harmless because both
# axes happened to be identical.
xGrid, yGrid = np.meshgrid(x, y)

# One row per grid node: column 0 -> feature_1, column 1 -> feature_2.
final = np.vstack((xGrid.ravel(), yGrid.ravel())).T

# Reshape with the grid's own shape rather than a hard-coded (10, 10).
z_final = lr.predict(final).reshape(xGrid.shape)

z = z_final



In [40]:
# Redraw the raw points and overlay the model's prediction surface.
fig = px.scatter_3d(
    data_frame=df,
    x='feature_1',
    y='feature_2',
    z='target',
    title='Regression Dataset',
)

prediction_surface = go.Surface(x=x, y=y, z=z)
fig.add_trace(prediction_surface)
fig.show()