In [None]:

import numpy as np
from sklearn.model_selection import train_test_split
from sklearn import datasets
import matplotlib.pyplot as plt
# Synthetic single-feature regression problem; the fixed random_state keeps
# the generated samples identical from run to run.
X, y = datasets.make_regression(
    n_samples=100,
    n_features=1,
    noise=20,
    random_state=4,
)

# Hold out 20% of the samples for evaluation (seeded split).
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1234,
)

# Quick look at the raw data before any model is fitted.
fig = plt.figure(figsize=(8, 6))
plt.scatter(X[:, 0], y, s=30, marker="o", color="b")
plt.show()

# Shapes of the training features and training targets, one per line.
print(X_train.shape, y_train.shape, sep="\n")

In [None]:
class LinearRegression:
  """Linear regression fitted by full-batch gradient descent on the MSE loss.

  Parameters
  ----------
  lr : float, default 0.001
      Step size applied to every gradient update.
  n_iters : int, default 1000
      Number of gradient steps performed by ``fit``.

  Attributes
  ----------
  weights : ndarray of shape (n_features,) or None
      Learned coefficients; ``None`` until ``fit`` has run.
  bias : float or None
      Learned intercept; ``None`` until ``fit`` has run.
  """

  def __init__(self, lr=0.001, n_iters=1000):
    self.lr = lr
    self.n_iters = n_iters
    self.weights = None
    self.bias = None

  def fit(self, X, y):
    """Estimate ``weights`` and ``bias`` from training data.

    Parameters
    ----------
    X : array-like of shape (n_samples, n_features)
        Training features.
    y : array-like of shape (n_samples,) or (n_samples, 1)
        Training targets. A single-column 2-D target is flattened.

    Raises
    ------
    ValueError
        If ``X`` is not 2-D, contains no samples, or ``y`` does not hold
        exactly one target per row of ``X``.
    """
    X = np.asarray(X, dtype=float)
    y = np.asarray(y, dtype=float)

    if X.ndim != 2:
      raise ValueError(
        "X must be 2-D with shape (n_samples, n_features); got ndim=%d" % X.ndim
      )
    n_samples, n_features = X.shape
    if n_samples == 0:
      raise ValueError("X must contain at least one sample")

    # A column-vector target would broadcast against the 1-D predictions into
    # an (n_samples, n_samples) residual matrix, so flatten it up front.
    if y.ndim == 2 and y.shape[1] == 1:
      y = y.ravel()
    if y.shape != (n_samples,):
      raise ValueError(
        "y must have shape (%d,) to match X; got %r" % (n_samples, y.shape)
      )

    # init parameters
    self.weights = np.zeros(n_features)
    self.bias = 0.0

    # gradient descent
    inv_n = 1 / n_samples  # loop-invariant scaling of the gradients
    for _ in range(self.n_iters):
      # Residual is shared by both gradients, so compute it once per step.
      residual = (np.dot(X, self.weights) + self.bias) - y
      dw = inv_n * np.dot(X.T, residual)  # one entry per feature -> X.T
      db = inv_n * np.sum(residual)

      self.weights -= self.lr * dw
      self.bias -= self.lr * db

  def predict(self, X):
    """Return ``X @ weights + bias`` for each row of ``X``.

    ``fit`` must be called first; ``weights`` and ``bias`` are ``None``
    until then.
    """
    return np.dot(X, self.weights) + self.bias

In [None]:
# Train the gradient-descent model on the training split, then score the
# held-out split. Hyperparameters are spelled out explicitly.
regressor = LinearRegression(lr=0.01, n_iters=1000)
regressor.fit(X=X_train, y=y_train)
pred = regressor.predict(X=X_test)

def mse(y_true, y_pred):
  """Mean squared error: the average of the squared differences
  between ``y_true`` and ``y_pred``."""
  residual = y_true - y_pred
  return np.mean(np.square(residual))

# Test-set error of the fitted model; the bare name on the last line makes
# the notebook display the value.
mse_value = mse(y_true=y_test, y_pred=pred)
mse_value

In [None]:

# Model output for every sample (train and test), used to draw the fitted line.
y_pred_line = regressor.predict(X)
cmap = plt.get_cmap('viridis')
fig = plt.figure(figsize=(8,6))
# Label every artist so the legend can tell the two splits and the fit apart.
m1 = plt.scatter(X_train, y_train, color=cmap(0.9), s=10, label="Train")
m2 = plt.scatter(X_test, y_test, color=cmap(0.5), s=10, label="Test")
plt.plot(X, y_pred_line, color='black', linewidth=2, label="Prediction")
plt.xlabel("X")
plt.ylabel("y")
plt.title("Linear regression fit")
# Without this call the label= arguments above are never rendered.
plt.legend()
plt.show()