**Linear Regression Implementation**

----

Original code by Siraj Raval https://github.com/llSourcell/linear_regression_live

In [1]:
from numpy import *

# Coding linear regression from scratch to explain gradient descent

def compute_error_for_points(b, m, points):
    """Return the mean squared error of the line ``y = m * x + b``.

    The squared residuals are accumulated over every row and then divided
    by the number of rows, so the result is an average rather than a raw
    sum of squared errors.

    Args:
        b: Intercept of the candidate line.
        m: Slope of the candidate line.
        points: Data indexable as ``points[i, 0]`` (x) and ``points[i, 1]``
            (y), e.g. a two-column NumPy array.

    Returns:
        Sum of squared residuals divided by ``len(points)``.
    """
    n_points = len(points)
    squared_residuals = 0
    for row in range(n_points):
        # Vertical distance between the observed y and the line's prediction.
        residual = points[row, 1] - (m * points[row, 0] + b)
        squared_residuals += residual ** 2
    return squared_residuals / float(n_points)

    
def step_gradient(b_current, m_current, points, learning_rate):
    """Take one gradient-descent step for the line ``y = m * x + b``.

    The gradient of the mean squared error with respect to the intercept and
    the slope is accumulated row by row, then each parameter is moved against
    its gradient, scaled by ``learning_rate``.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Data indexable as ``points[i, 0]`` (x) and ``points[i, 1]``
            (y), e.g. a two-column NumPy array.
        learning_rate: Step size applied to both gradients.

    Returns:
        A two-element list ``[new_b, new_m]``.
    """
    n = float(len(points))
    grad_b = 0
    grad_m = 0

    for row in range(len(points)):
        x, y = points[row, 0], points[row, 1]
        residual = y - ((m_current * x) + b_current)

        # The -(2/n) factor is evaluated per row on purpose: with no rows it
        # is never computed, so empty input does not divide by zero.
        grad_b += -(2 / n) * residual
        grad_m += -(2 / n) * x * residual

    return [
        b_current - (learning_rate * grad_b),
        m_current - (learning_rate * grad_m),
    ]


def gradient_descent_runner(points, starting_b, starting_m, learning_rate, iterations):
    """Run a fixed number of gradient-descent steps and return the fitted line.

    Args:
        points: Data set of (x, y) rows; converted to a NumPy array once
            before the loop.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        iterations: Number of update steps to perform.

    Returns:
        A two-element list ``[b, m]`` holding the parameters after the last
        step (the starting values if ``iterations`` is 0).
    """
    # The data does not change between steps, so convert it a single time
    # instead of copying the whole array on every iteration.
    data = array(points)

    b = starting_b
    m = starting_m
    for _ in range(iterations):
        b, m = step_gradient(b, m, data, learning_rate)
    return [b, m]


def run():
    """Fit a line to ``data/income.csv`` with gradient descent and print it.

    Loads the comma-delimited data file, runs 1000 gradient-descent steps
    with a learning rate of 0.0001 starting from ``b = 0`` and ``m = 0``,
    then prints the final error and the fitted equation.

    Note: the value printed under the "SSE" label comes from
    ``compute_error_for_points``, which divides the summed squared errors
    by the number of points.
    """
    points = genfromtxt('data/income.csv', delimiter=",")

    # Hyperparameters and starting point for the line y = m*x + b.
    learning_rate = 0.0001  # how fast the model learns
    iterations = 1000
    initial_b = 0
    initial_m = 0

    print("Running...")

    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, iterations)

    print("SSE : ", compute_error_for_points(b, m, points))
    print("Equation: y = ", m, "x + ", b)

# Entry point: run the fit when this code is executed directly
# (i.e. when __name__ is "__main__") rather than imported.
if __name__ == "__main__":
    run()

Running...
SSE :  103.398422917
Equation: y =  3.2621822676 x +  -0.182342553765


**Answer the following questions**

2. Modifique o código original para imprimir o RSS a cada iteração do gradiente descendente.

In [2]:
import sys
from numpy import *


def rss_data(error, iteration):
    """Append one ``error,iteration`` record to ``rss.csv`` and echo it.

    Args:
        error: Error value for the iteration; written using ``str(error)``.
        iteration: Iteration index; written using ``str(iteration)``.

    Side effects:
        Appends a line to ``rss.csv`` in the current working directory
        (creating the file if needed) and prints the same record to stdout.
    """
    record = str(error) + ',' + str(iteration)

    # Append-only mode is sufficient because the file is never read here.
    # The `with` block closes the file on exit, so no explicit close() call
    # is needed afterwards.
    with open("rss.csv", "a") as rss:
        rss.write(record + '\n')

    print(record)


def compute_error_for_points(b, m, points):
    """Return the mean squared error of the line ``y = m * x + b``.

    The squared residuals are accumulated over every row and then divided
    by the number of rows, so the result is an average rather than a raw
    sum of squared errors.

    Args:
        b: Intercept of the candidate line.
        m: Slope of the candidate line.
        points: Data indexable as ``points[i, 0]`` (x) and ``points[i, 1]``
            (y), e.g. a two-column NumPy array.

    Returns:
        Sum of squared residuals divided by ``len(points)``.
    """
    n_points = len(points)
    squared_residuals = 0
    for row in range(n_points):
        # Vertical distance between the observed y and the line's prediction.
        residual = points[row, 1] - (m * points[row, 0] + b)
        squared_residuals += residual ** 2
    return squared_residuals / float(n_points)


def step_gradient(b_current, m_current, points, learning_rate):
    """Take one gradient-descent step for the line ``y = m * x + b``.

    The gradient of the mean squared error with respect to the intercept and
    the slope is accumulated row by row, then each parameter is moved against
    its gradient, scaled by ``learning_rate``.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Data indexable as ``points[i, 0]`` (x) and ``points[i, 1]``
            (y), e.g. a two-column NumPy array.
        learning_rate: Step size applied to both gradients.

    Returns:
        A two-element list ``[new_b, new_m]``.
    """
    n = float(len(points))
    grad_b = 0
    grad_m = 0

    for row in range(len(points)):
        x, y = points[row, 0], points[row, 1]
        residual = y - ((m_current * x) + b_current)

        # The -(2/n) factor is evaluated per row on purpose: with no rows it
        # is never computed, so empty input does not divide by zero.
        grad_b += -(2 / n) * residual
        grad_m += -(2 / n) * x * residual

    return [
        b_current - (learning_rate * grad_b),
        m_current - (learning_rate * grad_m),
    ]


def gradient_descent_runner(points, starting_b, starting_m, learning_rate, iterations):
    """Run gradient descent for a fixed number of steps, logging the error.

    After every step the current error is computed with
    ``compute_error_for_points`` and handed to ``rss_data`` together with
    the zero-based iteration index.

    Args:
        points: Data set of (x, y) rows; converted to a NumPy array once
            before the loop.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        iterations: Number of update steps to perform.

    Returns:
        A two-element list ``[b, m]`` holding the parameters after the last
        step (the starting values if ``iterations`` is 0).
    """
    # The data does not change between steps, so convert it a single time
    # instead of copying the whole array on every iteration. The same array
    # is used for both the update and the error computation.
    data = array(points)

    b = starting_b
    m = starting_m
    for i in range(iterations):
        b, m = step_gradient(b, m, data, learning_rate)
        rss_data(compute_error_for_points(b, m, data), i)
    return [b, m]


def run(learningRate, numIterations):
    """Fit a line to ``data/income.csv`` and print the resulting equation.

    Args:
        learningRate: Step size passed to ``gradient_descent_runner``.
        numIterations: Number of gradient-descent steps to run.
    """
    points = genfromtxt('data/income.csv', delimiter=",")

    # Start the search from the line y = 0*x + 0.
    initial_b = 0
    initial_m = 0

    b, m = gradient_descent_runner(points, initial_b, initial_m, learningRate, numIterations)

    print("Equation: y = ", m, "x + ", b)
    

# Entry point: run 1000 gradient-descent steps with a learning rate of 0.001
# when this code is executed directly rather than imported.
if __name__ == "__main__":
    run(0.001, 1000)

Equation: y =  3.453929781 x +  -3.40347631759


3. O que acontece com o RSS ao longo das iterações (aumenta ou diminui) se você usar 1000 iterações e um learning_rate (tamanho do passo do gradiente) de 0.001? Por que você acha que isso acontece?

In [13]:
# celula para grafico do rss
#from ggplot import *

4. Teste valores diferentes do número de iterações e learning_rate até que w0 e w1 sejam aproximadamente iguais a -39 e 5 respectivamente. Reporte os valores do número de iterações e learning_rate usados para atingir esses valores.



5. O algoritmo do vídeo usa o número de iterações como critério de parada. Mude o algoritmo para considerar um critério de tolerância que é comparado ao tamanho do gradiente (como no algoritmo dos slides apresentados em sala).



6. Ache um valor de tolerância que se aproxime dos valores dos parâmetros do item 4 acima. Que valor foi esse?