# Linear Regression with the help of gradient descent
The basics were collected from:
- https://khanacademy.org/math/statistics-probability
- https://developers.google.com/machine-learning/crash-course

In [23]:
# import basic math functions
from numpy import *

# Line equation: y = m*x + b, where (x, y) is a data point on the 2D plane,
# m is the slope and b is the y-intercept.

# Mean squared error of the line y = m*x + b over all data points.
def pointwise_error(b, m, points):
    """Return the mean squared error of the line ``y = m * x + b``.

    Args:
        b: y-intercept of the line.
        m: slope of the line.
        points: 2-D array-like with one row per data point; column 0 holds
            x and column 1 holds y.

    Returns:
        The average of ``(y - (m * x + b)) ** 2`` over all rows.

    Raises:
        ZeroDivisionError: if ``points`` has no rows, since the mean of
            zero errors is undefined.
    """
    data = asarray(points)
    if len(data) == 0:
        raise ZeroDivisionError("cannot average the error over zero points")
    x = data[:, 0]
    y = data[:, 1]
    # Squaring keeps every error positive so opposite signs cannot cancel.
    residuals = y - (m * x + b)
    return (residuals ** 2).mean()

# Take one gradient-descent step of size learning_rate on the mean squared error.
def step_gradient(b_current, m_current, points, learning_rate):
    """Return ``[new_b, new_m]`` after one gradient-descent update.

    Args:
        b_current: current y-intercept of the line.
        m_current: current slope of the line.
        points: 2-D array-like with one row per data point; column 0 holds
            x and column 1 holds y.
        learning_rate: factor by which the gradient is scaled before it is
            subtracted from the current parameters.

    Returns:
        A two-element list ``[new_b, new_m]``. When ``points`` has no rows
        the parameters are returned unchanged.
    """
    data = asarray(points)
    if len(data) == 0:
        # No data contributes no gradient, so there is nothing to update.
        return [b_current, m_current]
    x = data[:, 0]
    y = data[:, 1]
    residuals = y - (m_current * x + b_current)
    # Partial derivatives of mean((y - (m*x + b)) ** 2) with respect to b and m.
    b_gradient = -2.0 * residuals.mean()
    m_gradient = -2.0 * (x * residuals).mean()
    # Advance the line against the gradient.
    new_b = b_current - (learning_rate * b_gradient)
    new_m = m_current - (learning_rate * m_gradient)
    return [new_b, new_m]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and return ``[b, m]``.

    Args:
        points: array-like of data points, passed to ``step_gradient``.
        starting_b: initial y-intercept.
        starting_m: initial slope.
        learning_rate: step size passed to ``step_gradient``.
        num_iterations: number of update steps to perform.

    Returns:
        A two-element list ``[b, m]`` holding the parameters after the last
        step, or the starting values when no step is performed.
    """
    # Convert once up front instead of copying the data on every iteration.
    data = asarray(points)
    b = starting_b
    m = starting_m
    for _ in range(num_iterations):
        b, m = step_gradient(b, m, data, learning_rate)
    return [b, m]

# Fit a line to the CSV data with gradient descent and report the error
# before and after training.
def run(data_path="random_num.csv", learning_rate=0.0001, initial_b=0,
        initial_m=0, num_iterations=100):
    """Load the points, run gradient descent and print the results.

    Args:
        data_path: comma-separated file read with ``genfromtxt``.
        learning_rate: step size used for every gradient-descent update.
        initial_b: starting y-intercept.
        initial_m: starting slope.
        num_iterations: number of gradient-descent steps to run.

    The defaults reproduce the original hard-coded experiment, so calling
    ``run()`` with no arguments behaves as before.
    """
    points = genfromtxt(data_path, delimiter=",")
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(initial_b, initial_m, pointwise_error(initial_b, initial_m, points)))
    print("Running...")
    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(num_iterations, b, m, pointwise_error(b, m, points)))

# Run the demo only when this file is executed directly, not when imported.
if __name__ == '__main__':
    run()

Starting gradient descent at b = 0, m = 0, error = 5565.107834490552
Running...
After 100 iterations b = 0.03507497059521459, m = 1.4788027175308887, error = 112.64705662802109
