In [10]:
import numpy as np
from io import BytesIO

### Try out `np.genfromtxt` to create a NumPy array from CSV text

In [12]:
# In-memory CSV payload. The b"" prefix makes this a byte string on both
# Python 2 and Python 3, which is the type BytesIO requires.
data = b"1, 2, 3\n4, 5, 6"
# Single-argument print(...) parses the same way on Python 2 and Python 3.
print(BytesIO(data))          # the file-like object genfromtxt will read from
print(data.decode("ascii"))   # the raw CSV text itself
# Parse the comma-separated bytes into a 2-D float array (shown as the cell output).
np.genfromtxt(BytesIO(data), delimiter=",")

<_io.BytesIO object at 0x104edb290>
1, 2, 3
4, 5, 6


array([[ 1.,  2.,  3.],
       [ 4.,  5.,  6.]])

In [13]:
# Load the sample data set from data.csv. genfromtxt is reached through the
# `np` alias imported in the first cell, so this cell does not depend on a
# star-import having been executed elsewhere in the kernel.
points = np.genfromtxt("data.csv", delimiter=",")
points[:2]  # preview the first two rows

array([[ 32.50234527,  31.70700585],
       [ 53.42680403,  68.77759598]])

### Gradient descent: find the best m and b quickly

In [15]:

from IPython.display import Image

# Show the gradient-descent example GIF at a fixed 500x200 size.
# Plain-HTML alternative to the Image call:
# <img src="https://raw.githubusercontent.com/mattnedrich/GradientDescentExample/master/gradient_descent_example.gif">
Image(
    url='https://raw.githubusercontent.com/mattnedrich/GradientDescentExample/master/gradient_descent_example.gif',
    width=500,
    height=200,
)

### Sum of squared distances formula (to calculate our error)

In [16]:
# Show the linear-regression error formula image at a fixed 500x200 size.
Image(
    url='https://spin.atomicobject.com/wp-content/uploads/linear_regression_error1.png',
    width=500,
    height=200,
)

### Partial derivative with respect to b and m (to perform gradient descent)

In [17]:
# Show the linear-regression gradient formula image at a fixed 500x200 size.
Image(
    url="https://spin.atomicobject.com/wp-content/uploads/linear_regression_gradient1.png",
    width=500,
    height=200,
)

### demo.py source code

In [4]:
%pycat demo.py

from numpy import *
# y = mx + b
# m is slope, b is y-intercept
def compute_error_for_line_given_points(b, m, points):
    """Return the mean squared error of the line y = m*x + b over ``points``.

    ``points`` is read as ``points[i, 0]`` (x) and ``points[i, 1]`` (y), so it
    must support two-index access (for example a two-column NumPy array).
    The sum of squared residuals is divided by ``float(len(points))``, so an
    empty input raises ZeroDivisionError.
    """
    sample_count = len(points)
    squared_residual_sum = 0
    for row in range(sample_count):
        predicted = m * points[row, 0] + b
        residual = points[row, 1] - predicted
        squared_residual_sum += residual ** 2
    return squared_residual_sum / float(sample_count)

def step_gradient(b_current, m_current, points, learningRate):
    """Take one gradient-descent step for the line y = m*x + b.

    For every row of ``points`` (x in column 0, y in column 1) the residual
    ``y - (m_current * x + b_current)`` is folded into two running sums: the
    gradient with respect to b and the gradient with respect to m, each
    scaled by ``-(2/N)`` where N is the number of points. Both parameters are
    then moved against their gradient, scaled by ``learningRate``.

    Returns the updated parameters as the list ``[new_b, new_m]``.
    """
    sample_count = len(points)
    N = float(sample_count)
    grad_b = 0
    grad_m = 0
    for row in range(sample_count):
        x_val = points[row, 0]
        y_val = points[row, 1]
        residual = y_val - ((m_current * x_val) + b_current)
        # 2/N is evaluated inside the loop on purpose: with no points the
        # division never happens and the parameters come back unchanged.
        grad_b += -(2/N) * residual
        grad_m += -(2/N) * x_val * residual
    return [b_current - (learningRate * grad_b),
            m_current - (learningRate * grad_m)]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and return ``[b, m]``.

    Starts from ``(starting_b, starting_m)`` and repeatedly replaces the
    parameters with the result of ``step_gradient`` using ``learning_rate``.
    With ``num_iterations == 0`` the starting values are returned unchanged.
    """
    # Convert to an array once, outside the loop: array() copies its input and
    # step_gradient only reads the points, so one conversion serves every
    # iteration instead of re-copying the data set num_iterations times.
    points_array = array(points)
    b = starting_b
    m = starting_m
    for _ in range(num_iterations):
        b, m = step_gradient(b, m, points_array, learning_rate)
    return [b, m]

def run():
    """Fit a line to the points in data.csv by gradient descent and print it.

    Loads comma-separated points from ``data.csv``, prints the error of the
    initial guess (b = 0, m = 0), runs 1000 gradient-descent iterations with
    a learning rate of 0.0001, then prints the fitted b, m and final error.
    """
    points = genfromtxt("data.csv", delimiter=",")
    learning_rate = 0.0001
    initial_b = 0 # initial y-intercept guess
    initial_m = 0 # initial slope guess
    num_iterations = 1000
    # Each print(...) takes exactly one argument, which behaves the same as a
    # print statement on Python 2 and is also valid on Python 3.
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m,
        compute_error_for_line_given_points(initial_b, initial_m, points)))
    print("Running...")
    [b, m] = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m,
        compute_error_for_line_given_points(b, m, points)))

# Script entry point: run the demo only when this file is executed directly,
# not when it is imported as a module.
if __name__ == "__main__":
    run()

Starting gradient descent at b = 0, m = 0, error = 5565.10783448
Running...
After 1000 iterations b = 0.0889365199374, m = 1.47774408519, error = 112.614810116


In [5]:
# Call the demo's run() entry point again, directly from the notebook.
run()

Starting gradient descent at b = 0, m = 0, error = 5565.10783448
Running...
After 1000 iterations b = 0.0889365199374, m = 1.47774408519, error = 112.614810116
