# Stochastic Gradient Descent

In [21]:
import numpy as np
import matplotlib.pyplot as plt
%matplotlib notebook

In [22]:
# Synthetic data for the linear model y = 4 + 3x + standard normal noise
np.random.seed(42)  # fix the global RNG so every run draws the same sample
X = np.random.rand(100, 1) * 2  # 100 feature values, uniform on [0, 2)
y = (3 * X + 4) + np.random.randn(100, 1)

In [23]:
# Cost function: halved mean squared error of the linear model
def compute_cost(theta, X, y):
    """Return the halved mean squared error of the predictions ``X.dot(theta)``.

    Evaluates ``J(theta) = 1 / (2 * m) * sum((X.dot(theta) - y) ** 2)`` with
    ``m = len(y)``.

    Parameters
    ----------
    theta : array_like
        Model parameters, shape ``(n, 1)`` or ``(n,)``.
    X : numpy.ndarray
        Design matrix of shape ``(m, n)``.
    y : array_like
        Target values, shape ``(m, 1)`` or ``(m,)``.

    Returns
    -------
    numpy.float64
        The scalar cost.
    """
    m = len(y)
    # Flatten both sides before subtracting: an (m, 1) prediction minus an
    # (m,) target would otherwise broadcast to an (m, m) matrix and silently
    # produce a wrong (inflated) cost instead of an error.
    residuals = np.ravel(X.dot(theta)) - np.ravel(y)
    cost = (1/(2*m)) * np.sum(np.square(residuals))
    return cost

In [24]:
# Stochastic gradient descent for single-output linear regression
def stochastic_gradient_descent(X, y, theta, learning_rate, epochs):
    """Fit a linear model by updating ``theta`` one sample at a time.

    Each epoch visits every sample once in a freshly shuffled order (drawn
    from NumPy's global random state via ``np.random.permutation``). For a
    sample ``(xi, yi)`` the update is
    ``theta <- theta - learning_rate * xi.T.dot(xi.dot(theta) - yi)``.

    Parameters
    ----------
    X : numpy.ndarray
        Design matrix of shape ``(m, n)``.
    y : array_like
        Target values, shape ``(m, 1)`` or ``(m,)``.
    theta : array_like
        Initial parameters, shape ``(n, 1)`` or ``(n,)``. Not modified.
    learning_rate : float
        Step size applied to every per-sample gradient.
    epochs : int
        Number of full passes over the data.

    Returns
    -------
    theta : numpy.ndarray
        Final parameters as an ``(n, 1)`` column vector.
    cost_history : numpy.ndarray
        Shape ``(epochs * m,)``; the cost on the full dataset after each
        single-sample update.
    theta_history : numpy.ndarray
        Shape ``(epochs * m, n)``; the parameters after each update.
    """
    m = len(y)
    # Work with column vectors so that 1-D inputs cannot trigger accidental
    # broadcasting (e.g. an (n,) theta minus an (n, 1) gradient -> (n, n)).
    theta = np.asarray(theta).reshape(-1, 1)
    y = np.asarray(y).reshape(-1, 1)

    # Size the history from theta instead of assuming exactly two parameters.
    n_params = theta.shape[0]
    total_steps = epochs * m
    cost_history = np.zeros(total_steps)
    theta_history = np.zeros((total_steps, n_params))

    step = 0  # Position of the next entry in both history arrays

    for _ in range(epochs):
        # A new random visiting order each epoch; indexing through the
        # permutation avoids materialising shuffled copies of X and y.
        for i in np.random.permutation(m):
            xi = X[i:i+1]  # keep 2-D: shape (1, n)
            yi = y[i:i+1]  # shape (1, 1)
            error = xi.dot(theta) - yi
            gradient = xi.T.dot(error)
            theta = theta - learning_rate * gradient

            # Record the full-dataset cost and the parameters after this step
            cost_history[step] = compute_cost(theta, X, y)
            theta_history[step] = theta.ravel()
            step += 1

    return theta, cost_history, theta_history

In [25]:
# Design matrix: prepend a bias column of ones (x0 = 1) to every instance
X_b = np.hstack((np.ones((X.shape[0], 1)), X))

# Random starting point for the parameters (intercept and slope)
theta = np.random.randn(2, 1)

# Hyperparameters
learning_rate = 0.01
epochs = 50

In [26]:
# Run SGD from the current theta. theta is rebound to the fitted parameters,
# so re-running this cell continues from the previous result rather than
# from the random initialisation.
theta, cost_history, theta_history = stochastic_gradient_descent(
    X_b, y, theta, learning_rate, epochs
)

# Cost recorded after every single-sample update
fig, ax = plt.subplots(figsize=(8, 6))
ax.plot(np.arange(len(cost_history)), cost_history, 'b.')
ax.set_xlabel("Number of Iterations")
ax.set_ylabel("Cost (J)")
ax.set_title("Cost Function History (SGD)")
plt.show()

<IPython.core.display.Javascript object>

In [28]:
# Overlay the fitted regression line on the raw data points
fig, ax = plt.subplots(figsize=(8, 6))
ax.scatter(X, y, color='blue', label='Data Points')
ax.plot(X, X_b.dot(theta), color='red', label='Fitted Line')
ax.set_xlabel("X")
ax.set_ylabel("y")
ax.set_title("Linear Regression Fit with Stochastic Gradient Descent")
ax.legend()
plt.show()

<IPython.core.display.Javascript object>