In [1]:
import numpy as np

In [2]:
def compute_error_for_line_given_points(b, m, points):
    """Return the mean squared error of the line ``y = m * x + b``.

    Args:
        b: Intercept of the candidate line.
        m: Slope of the candidate line.
        points: Array-like with one row per sample; column 0 holds the x
            values and column 1 holds the y values. Plain nested lists
            are accepted as well as NumPy arrays.

    Returns:
        The average of the squared vertical distances between every point
        and the line.

    Raises:
        ZeroDivisionError: If ``points`` is empty, since the mean of zero
            samples is undefined.
    """
    data = np.asarray(points, dtype=float)
    if len(data) == 0:
        # Keep failing loudly on empty input; NumPy on its own would
        # return NaN with only a warning.
        raise ZeroDivisionError("cannot compute the error of zero points")
    x = data[:, 0]
    y = data[:, 1]
    # Vertical distance between each observed y and the line's prediction.
    residuals = y - (m * x + b)
    return np.mean(residuals ** 2)


def step_gradient(b_current, w_current, points, learningRate):
    """Perform one gradient-descent step for the line ``y = w * x + b``.

    The gradient is that of the mean squared error over ``points`` with
    respect to the intercept ``b`` and the slope ``w``.

    Args:
        b_current: Current intercept.
        w_current: Current slope.
        points: Array-like with one row per sample; column 0 holds the x
            values and column 1 holds the y values.
        learningRate: Step size applied to the gradient.

    Returns:
        A two-element list ``[new_b, new_w]`` with the updated parameters.
        When ``points`` is empty the parameters are returned unchanged.
    """
    data = np.asarray(points, dtype=float)
    n = len(data)
    if n == 0:
        # No samples means no gradient signal, so nothing to update.
        return [b_current, w_current]
    x = data[:, 0]
    y = data[:, 1]
    residuals = y - (w_current * x + b_current)
    # Partial derivatives of mean((y - (w*x + b))**2):
    #   d/db = -(2/N) * sum(residual)
    #   d/dw = -(2/N) * sum(x * residual)
    scale = -2.0 / n
    b_gradient = scale * residuals.sum()
    w_gradient = scale * (x * residuals).sum()
    # Move against the gradient to reduce the error.
    new_b = b_current - (learningRate * b_gradient)
    new_w = w_current - (learningRate * w_gradient)
    return [new_b, new_w]


def gradient_descent_runner(points, starting_b, starting_w, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and return the result.

    Args:
        points: Array-like with one row per sample (x in column 0, y in
            column 1), passed to ``step_gradient`` on every iteration.
        starting_b: Initial intercept.
        starting_w: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of update steps to perform.

    Returns:
        A two-element list ``[b, w]`` holding the final intercept and slope.
    """
    # Convert once up front: the data is not modified between steps, so
    # rebuilding the array on every iteration was wasted work.
    data = np.asarray(points)
    b = starting_b
    w = starting_w
    for _ in range(num_iterations):
        # Replace b and w with the values produced by one more step.
        b, w = step_gradient(b, w, data, learning_rate)
    return [b, w]


def run(data_path="data.csv", learning_rate=0.0001, num_iterations=1000,
        initial_b=0, initial_w=0):
    """Fit a line to the points in a CSV file and print the progress.

    Called with no arguments, this uses the file ``data.csv`` and the
    default hyperparameters below.

    Args:
        data_path: Path of a comma-delimited file read with
            ``np.genfromtxt``; column 0 is used as x and column 1 as y.
        learning_rate: Step size of each gradient-descent update.
        num_iterations: Number of gradient-descent updates to perform.
        initial_b: Starting intercept of the model ``y = w * x + b``.
        initial_w: Starting slope of the model ``y = w * x + b``.
    """
    # Step 1 - collect our data in a numpy array
    points = np.genfromtxt(data_path, delimiter=",")
    # Step 2 - report the error of the starting parameters
    print("Starting gradient descent at b = {0}, w = {1}, error = {2}".format(
        initial_b, initial_w,
        compute_error_for_line_given_points(initial_b, initial_w, points))
    )
    print("Running...")
    # Step 3 - train our model
    [b, w] = gradient_descent_runner(
        points, initial_b, initial_w, learning_rate, num_iterations)
    print("After {0} iterations b = {1}, w = {2}, error = {3}".format(
        num_iterations, b, w,
        compute_error_for_line_given_points(b, w, points))
    )