In [1]:
# IMPLEMENTING LINEAR REGRESSION FROM SCRATCH USING PYTHON

# STEP 1: Create dataset manually
import numpy as np
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score

# Seed the global NumPy RNG so the synthetic noise is the same on every run.
np.random.seed(42)

# Evenly spaced inputs on [1, 10]; targets follow y = 2.5x + 5 plus
# standard-normal noise scaled by 2.
n_samples = 50
X = np.linspace(1, 10, num=n_samples)
noise = np.random.randn(n_samples) * 2
y = 2.5 * X + 5 + noise

# Column-vector view of X with shape (n_samples, 1).
X_reshaped = X[:, np.newaxis]

# STEP 2: Visualize the data
# Scatter plot of the raw samples, drawn through the Axes interface.
fig, ax = plt.subplots()
ax.scatter(X, y)
ax.set(xlabel="X", ylabel="y", title="Dataset")
plt.show()

# STEP 3: Define loss function (MSE)
def mse(y_true, y_pred):
    """Return the mean squared error between targets and predictions.

    Both arguments are converted to float arrays before subtracting, so
    plain Python sequences are accepted and unsigned-integer inputs cannot
    wrap around. Standard NumPy broadcasting applies to the subtraction.

    Parameters
    ----------
    y_true : array_like
        Observed target values.
    y_pred : array_like
        Predicted values, broadcastable against ``y_true``.

    Returns
    -------
    numpy.float64
        Mean of the element-wise squared differences.
    """
    residual = np.asarray(y_true, dtype=float) - np.asarray(y_pred, dtype=float)
    return np.mean(residual ** 2)

# STEP 4: Define gradient descent
def gradient_descent(X, y, lr=0.01, epochs=1000):
    """Fit the line ``y = m * X + b`` by batch gradient descent on the MSE.

    Parameters
    ----------
    X : array_like
        One feature value per sample. Any shape holding ``n`` values is
        accepted (for example ``(n,)`` or ``(n, 1)``); it is flattened.
    y : array_like
        One target per sample; flattened the same way as ``X``.
    lr : float, optional
        Step size applied to both gradients.
    epochs : int, optional
        Number of full-batch update steps.

    Returns
    -------
    m : float
        Fitted slope.
    b : float
        Fitted intercept.
    loss_history : list
        MSE measured at the start of each epoch, before that epoch's update.

    Raises
    ------
    ValueError
        If the inputs are empty or hold different numbers of values.
    """
    # Flatten both inputs: a column-vector X against a 1-D y would otherwise
    # broadcast the residual to an (n, n) matrix and corrupt the gradients.
    x = np.asarray(X, dtype=float).ravel()
    targets = np.asarray(y, dtype=float).ravel()

    n = x.size
    if n == 0:
        raise ValueError("X and y must contain at least one sample")
    if targets.size != n:
        raise ValueError(
            f"X and y must hold the same number of samples, got {n} and {targets.size}"
        )

    m = 0.0  # slope
    b = 0.0  # intercept
    loss_history = []

    for _ in range(epochs):
        # Computed once and reused for the loss and both gradients.
        residual = targets - (m * x + b)

        # Same quantity as mse(y, y_pred), taken from the residual in hand.
        loss_history.append(np.mean(residual ** 2))

        # Partial derivatives of the MSE with respect to m and b.
        dm = (-2 / n) * np.sum(x * residual)
        db = (-2 / n) * np.sum(residual)
        m -= lr * dm
        b -= lr * db

    return m, b, loss_history

# STEP 5: Train the model
# Fit slope and intercept with the default learning rate and epoch count,
# then predict on the training inputs.
m, b, loss_history = gradient_descent(X, y)
y_pred_custom = m * X + b

# STEP 6: Evaluate with MAE, RMSE, R²
mae_custom = mean_absolute_error(y, y_pred_custom)
mse_custom = mean_squared_error(y, y_pred_custom)
rmse_custom = np.sqrt(mse_custom)  # RMSE is the square root of the MSE
r2_custom = r2_score(y, y_pred_custom)

# Report the three metrics, one per line, under a heading.
print("Custom Linear Regression")
for label, value in (
    ("MAE:", mae_custom),
    ("RMSE:", rmse_custom),
    ("R2 Score:", r2_custom),
):
    print(label, value)

# STEP 7: Visualize model fit & loss curve
# Fitted line drawn over the training samples.
fig, ax = plt.subplots()
ax.scatter(X, y)
ax.plot(X, y_pred_custom)
ax.set(xlabel="X", ylabel="y", title="Model Fit (From Scratch)")
plt.show()

# MSE recorded at each epoch of gradient descent.
fig, ax = plt.subplots()
ax.plot(loss_history)
ax.set(xlabel="Epochs", ylabel="MSE Loss", title="Loss Curve (From Scratch)")
plt.show()

# STEP 8: Compare with sklearn
# Reference fit: scikit-learn's LinearRegression on the column-vector inputs.
# fit() returns the estimator itself, so construction and fitting are chained.
model = LinearRegression().fit(X_reshaped, y)
y_pred_sklearn = model.predict(X_reshaped)

# STEP 9: Compare R² scores
r2_sklearn = r2_score(y, y_pred_sklearn)
print("\nSklearn Linear Regression")
print("R2 Score:", r2_sklearn)

# STEP 10: Compare loss curves
# scikit-learn's LinearRegression solves the least-squares problem directly,
# so it has no per-epoch loss curve. Its per-sample squared errors are indexed
# by sample, not by epoch, and must not share an x-axis with loss_history.
# The comparable quantity is its final training MSE, drawn as a horizontal
# reference line that the gradient-descent curve should approach.
loss_sklearn = (y - y_pred_sklearn) ** 2  # per-sample squared errors
mse_sklearn = np.mean(loss_sklearn)

plt.figure()
plt.plot(loss_history, label="From Scratch")
plt.axhline(
    mse_sklearn,
    color="tab:orange",
    linestyle="--",
    label="Sklearn (final MSE)",
)
plt.xlabel("Epochs")
plt.ylabel("MSE Loss")
plt.legend()
plt.title("Loss Curve Comparison")
plt.show()



A module that was compiled using NumPy 1.x cannot be run in
NumPy 2.2.6 as it may crash. To support both 1.x and 2.x
versions of NumPy, modules must be compiled with NumPy 2.0.
Some module may need to rebuild instead e.g. with 'pybind11>=2.12'.

If you are a user of the module, the easiest solution will be to
downgrade to 'numpy<2' or try to upgrade the affected module.
We expect that some modules will need time to support NumPy 2.

Traceback (most recent call last):
  File "<frozen runpy>", line 198, in _run_module_as_main
  File "<frozen runpy>", line 88, in _run_code
  File "C:\Users\mukes\AppData\Roaming\Python\Python312\site-packages\ipykernel_launcher.py", line 18, in <module>
    app.launch_new_instance()
  File "C:\ProgramData\anaconda3\Lib\site-packages\traitlets\config\application.py", line 1075, in launch_instance
    app.start()
  File "C:\Users\mukes\AppData\Roaming\Python\Python312\site-packages\ipykernel\kernelapp.py", line 739, in start
    self.io_loop.start()
  File "

ImportError: 
A module that was compiled using NumPy 1.x cannot be run in
NumPy 2.2.6 as it may crash. To support both 1.x and 2.x
versions of NumPy, modules must be compiled with NumPy 2.0.
Some module may need to rebuild instead e.g. with 'pybind11>=2.12'.

If you are a user of the module, the easiest solution will be to
downgrade to 'numpy<2' or try to upgrade the affected module.
We expect that some modules will need time to support NumPy 2.



ImportError: numpy.core.multiarray failed to import