# Federal University of Campina Grande (UFCG)
# Author: Rayana Souza Rocha
# Adapted from: Siraj Raval
# Available at: https://github.com/rayanarocha/machinelearning/tree/master/regress%C3%A3o_linear_simples

In [None]:
import numpy as np
import matplotlib.pyplot as plt
# Load the data set once, at module level. run() passes this global to the
# fitting functions, which read column 0 of each row as x and column 1 as y.
points = np.genfromtxt("income.csv", delimiter=",")

# Resposta da Questão 1

Eu criei a função print_graf_rmse para a plotagem do gráfico; ela é chamada dentro da função gradient_descent_runner.

In [None]:

def compute_error_for_line_given_points(b, m, points):
    """Return the mean squared residual of the line ``y = m * x + b``.

    Args:
        b: Intercept of the line.
        m: Slope of the line.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.

    Returns:
        The sum of squared residuals divided by the number of rows.
    """
    squared_error_sum = 0
    for row in points:
        x_value = row[0]
        y_value = row[1]
        residual = y_value - (m * x_value + b)
        squared_error_sum += residual ** 2
    return squared_error_sum / float(len(points))

def step_gradient(b_current, m_current, points, learningRate):
    """Take one gradient-descent step for the line ``y = m * x + b``.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.
        learningRate: Factor applied to each gradient before subtracting it.

    Returns:
        ``[new_b, new_m]``, the updated intercept and slope.
    """
    n_points = float(len(points))
    grad_b = 0
    grad_m = 0
    for row in points:
        x_i, y_i = row[0], row[1]
        residual = y_i - ((m_current * x_i) + b_current)
        # Each row contributes its share of the mean-squared-error gradient.
        grad_b += -(2 / n_points) * residual
        grad_m += -(2 / n_points) * x_i * residual
    return [
        b_current - (learningRate * grad_b),
        m_current - (learningRate * grad_m),
    ]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and plot the error history.

    The error of the starting guess is reported as iteration 0 and the error
    after the k-th step as iteration k. The full history is handed to
    ``print_graf_rmse`` once the loop finishes.

    NOTE: the value labelled "RMSE" is whatever
    ``compute_error_for_line_given_points`` returns; in this file that is the
    mean of the squared residuals (no square root is taken).

    Args:
        points: Data rows, forwarded to ``step_gradient`` and the error function.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of steps to take.

    Returns:
        ``[b, m]`` after the last step.
    """
    b = starting_b
    m = starting_m
    # Convert once: the data does not change between iterations.
    points_array = np.array(points)
    RMSE = compute_error_for_line_given_points(b, m, points)
    # Collect rows in a list and build the array once at the end; stacking
    # inside the loop would copy the whole history on every iteration.
    history = [[RMSE, 0]]
    print("RMSE: {:.3f}, interacao: {}".format(RMSE, 0))
    # Number the steps from 1 so that 0 refers only to the starting guess and
    # the printed label matches the one stored for the plot.
    for iteration in range(1, num_iterations + 1):
        b, m = step_gradient(b, m, points_array, learning_rate)
        RMSE = compute_error_for_line_given_points(b, m, points)
        # Answer to question 1, part 1: print the RMSE of every iteration.
        print("RMSE: {:.3f}, interacao: {}".format(RMSE, iteration))
        # Answer to question 1, part 2: keep the value for the RMSE plot.
        history.append([RMSE, iteration])
    print_graf_rmse(np.array(history))
    return [b, m]

# Plotting helper for question 1, part 2: RMSE per iteration.
def print_graf_rmse(array_):
    """Print the error history and plot it against the iteration number.

    Args:
        array_: Array whose transpose unpacks into exactly two sequences:
            the error values first, the iteration numbers second.
    """
    print(array_)
    errors, iterations = array_.T
    # Black markers for the individual samples, blue line joining them.
    plt.scatter(iterations, errors, color="black")
    plt.plot(iterations, errors, color="blue", linewidth=3)
    # NOTE(review): "Interação" reads as "interaction"; "Iteração" was
    # probably intended. Left unchanged here.
    plt.xlabel("Interação")
    plt.ylabel("RMSE")
    plt.show()

def run():
    """Fit a line to the module-level ``points`` and report the outcome.

    Prints the error of the starting guess, runs ``gradient_descent_runner``
    with the hyper-parameters fixed below, then prints the fitted intercept,
    slope and final error.
    """
    # Hyper-parameters of this experiment.
    num_iterations = 1000
    learning_rate = 0.0001
    initial_b = 0  # initial y-intercept guess
    initial_m = 0  # initial slope guess

    starting_error = compute_error_for_line_given_points(initial_b, initial_m, points)
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m, starting_error))
    print("Running...")
    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, m, points)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m, final_error))


# Run the experiment only when this module is the entry point.
if __name__ == '__main__':
    run()

# Resposta da Questão 2

Para cada execução eu alterei o valor do learning_rate; é possível perceber que, quando o learning_rate aumenta, o erro diminui.



Parte 1 da resposta da questão 2: execução com o alpha mínimo (learning_rate = 0.00009).

In [None]:
def compute_error_for_line_given_points(b, m, points):
    """Compute the mean squared error of the line ``y = m * x + b``.

    Args:
        b: Intercept of the line.
        m: Slope of the line.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.

    Returns:
        The sum of squared residuals divided by the number of rows.
    """
    # The generator yields one squared residual per row, in row order.
    squared_residuals = ((row[1] - (m * row[0] + b)) ** 2 for row in points)
    return sum(squared_residuals) / float(len(points))

def step_gradient(b_current, m_current, points, learningRate):
    """Perform a single gradient-descent update of intercept and slope.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Array indexed as ``points[i, 0]`` (x) and ``points[i, 1]`` (y).
        learningRate: Factor applied to each gradient before subtracting it.

    Returns:
        ``[new_b, new_m]``, the updated intercept and slope.
    """
    count = float(len(points))
    slope_gradient = 0
    intercept_gradient = 0
    for idx in range(len(points)):
        x, y = points[idx, 0], points[idx, 1]
        prediction = (m_current * x) + b_current
        intercept_gradient += -(2 / count) * (y - prediction)
        slope_gradient += -(2 / count) * x * (y - prediction)
    updated_b = b_current - (learningRate * intercept_gradient)
    updated_m = m_current - (learningRate * slope_gradient)
    return [updated_b, updated_m]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and plot the error history.

    The error of the starting guess is reported as iteration 0 and the error
    after the k-th step as iteration k. The full history is handed to
    ``print_graf_rmse`` once the loop finishes.

    NOTE: the value labelled "RMSE" is whatever
    ``compute_error_for_line_given_points`` returns; in this file that is the
    mean of the squared residuals (no square root is taken).

    Args:
        points: Data rows, forwarded to ``step_gradient`` and the error function.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of steps to take.

    Returns:
        ``[b, m]`` after the last step.
    """
    b = starting_b
    m = starting_m
    # Convert once: the data does not change between iterations.
    points_array = np.array(points)
    RMSE = compute_error_for_line_given_points(b, m, points)
    # Collect rows in a list and build the array once at the end; stacking
    # inside the loop would copy the whole history on every iteration.
    history = [[RMSE, 0]]
    print("RMSE: {:.3f}, interacao: {}".format(RMSE, 0))
    # Number the steps from 1 so that 0 refers only to the starting guess and
    # the printed label matches the one stored for the plot.
    for iteration in range(1, num_iterations + 1):
        b, m = step_gradient(b, m, points_array, learning_rate)
        RMSE = compute_error_for_line_given_points(b, m, points)
        print("RMSE: {:.3f}, interacao: {}".format(RMSE, iteration))
        history.append([RMSE, iteration])
    print_graf_rmse(np.array(history))
    return [b, m]

def print_graf_rmse(array_):
    """Print the error history and plot it against the iteration number.

    Args:
        array_: Array whose transpose unpacks into exactly two sequences:
            the error values first, the iteration numbers second.
    """
    print(array_)
    errors, iterations = array_.T
    # Black markers for the individual samples, blue line joining them.
    plt.scatter(iterations, errors, color="black")
    plt.plot(iterations, errors, color="blue", linewidth=3)
    # NOTE(review): "Interação" reads as "interaction"; "Iteração" was
    # probably intended. Left unchanged here.
    plt.xlabel("Interação")
    plt.ylabel("RMSE")
    plt.show()

def run():
    """Fit a line to the module-level ``points`` and report the outcome.

    Prints the error of the starting guess, runs ``gradient_descent_runner``
    with the hyper-parameters fixed below, then prints the fitted intercept,
    slope and final error.
    """
    # Hyper-parameters of this experiment (smallest learning rate tried).
    num_iterations = 1000
    learning_rate = 0.00009
    initial_b = 0  # initial y-intercept guess
    initial_m = 0  # initial slope guess

    starting_error = compute_error_for_line_given_points(initial_b, initial_m, points)
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m, starting_error))
    print("Running...")
    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, m, points)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m, final_error))


# Run the experiment only when this module is the entry point.
if __name__ == '__main__':
    run()

Parte 2 da resposta da questão 2: execução com o alpha médio (learning_rate = 0.0001).

In [None]:
def compute_error_for_line_given_points(b, m, points):
    """Return the mean squared residual of the line ``y = m * x + b``.

    Args:
        b: Intercept of the line.
        m: Slope of the line.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.

    Returns:
        The sum of squared residuals divided by the number of rows.
    """
    squared_error_sum = 0
    for row in points:
        x_value = row[0]
        y_value = row[1]
        residual = y_value - (m * x_value + b)
        squared_error_sum += residual ** 2
    return squared_error_sum / float(len(points))

def step_gradient(b_current, m_current, points, learningRate):
    """Take one gradient-descent step for the line ``y = m * x + b``.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.
        learningRate: Factor applied to each gradient before subtracting it.

    Returns:
        ``[new_b, new_m]``, the updated intercept and slope.
    """
    n_points = float(len(points))
    grad_b = 0
    grad_m = 0
    for row in points:
        x_i, y_i = row[0], row[1]
        residual = y_i - ((m_current * x_i) + b_current)
        # Each row contributes its share of the mean-squared-error gradient.
        grad_b += -(2 / n_points) * residual
        grad_m += -(2 / n_points) * x_i * residual
    return [
        b_current - (learningRate * grad_b),
        m_current - (learningRate * grad_m),
    ]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and plot the error history.

    The error of the starting guess is reported as iteration 0 and the error
    after the k-th step as iteration k. The full history is handed to
    ``print_graf_rmse`` once the loop finishes.

    NOTE: the value labelled "RMSE" is whatever
    ``compute_error_for_line_given_points`` returns; in this file that is the
    mean of the squared residuals (no square root is taken).

    Args:
        points: Data rows, forwarded to ``step_gradient`` and the error function.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of steps to take.

    Returns:
        ``[b, m]`` after the last step.
    """
    b = starting_b
    m = starting_m
    # Convert once: the data does not change between iterations.
    points_array = np.array(points)
    RMSE = compute_error_for_line_given_points(b, m, points)
    # Collect rows in a list and build the array once at the end; stacking
    # inside the loop would copy the whole history on every iteration.
    history = [[RMSE, 0]]
    print("RMSE: {:.3f}, interacao: {}".format(RMSE, 0))
    # Number the steps from 1 so that 0 refers only to the starting guess and
    # the printed label matches the one stored for the plot.
    for iteration in range(1, num_iterations + 1):
        b, m = step_gradient(b, m, points_array, learning_rate)
        RMSE = compute_error_for_line_given_points(b, m, points)
        print("RMSE: {:.3f}, interacao: {}".format(RMSE, iteration))
        history.append([RMSE, iteration])
    print_graf_rmse(np.array(history))
    return [b, m]

def print_graf_rmse(array_):
    """Print the error history and plot it against the iteration number.

    Args:
        array_: Array whose transpose unpacks into exactly two sequences:
            the error values first, the iteration numbers second.
    """
    print(array_)
    errors, iterations = array_.T
    # Black markers for the individual samples, blue line joining them.
    plt.scatter(iterations, errors, color="black")
    plt.plot(iterations, errors, color="blue", linewidth=3)
    # NOTE(review): "Interação" reads as "interaction"; "Iteração" was
    # probably intended. Left unchanged here.
    plt.xlabel("Interação")
    plt.ylabel("RMSE")
    plt.show()

def run():
    """Fit a line to the module-level ``points`` and report the outcome.

    Prints the error of the starting guess, runs ``gradient_descent_runner``
    with the hyper-parameters fixed below, then prints the fitted intercept,
    slope and final error.
    """
    # Hyper-parameters of this experiment (middle learning rate tried).
    num_iterations = 1000
    learning_rate = 0.0001
    initial_b = 0  # initial y-intercept guess
    initial_m = 0  # initial slope guess

    starting_error = compute_error_for_line_given_points(initial_b, initial_m, points)
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m, starting_error))
    print("Running...")
    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, m, points)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m, final_error))


# Run the experiment only when this module is the entry point.
if __name__ == '__main__':
    run()

Parte 3 da resposta da questão 2: execução com o alpha máximo (learning_rate = 0.0002).

In [None]:
def compute_error_for_line_given_points(b, m, points):
    """Compute the mean squared error of the line ``y = m * x + b``.

    Args:
        b: Intercept of the line.
        m: Slope of the line.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.

    Returns:
        The sum of squared residuals divided by the number of rows.
    """
    # The generator yields one squared residual per row, in row order.
    squared_residuals = ((row[1] - (m * row[0] + b)) ** 2 for row in points)
    return sum(squared_residuals) / float(len(points))

def step_gradient(b_current, m_current, points, learningRate):
    """Perform a single gradient-descent update of intercept and slope.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Array indexed as ``points[i, 0]`` (x) and ``points[i, 1]`` (y).
        learningRate: Factor applied to each gradient before subtracting it.

    Returns:
        ``[new_b, new_m]``, the updated intercept and slope.
    """
    count = float(len(points))
    slope_gradient = 0
    intercept_gradient = 0
    for idx in range(len(points)):
        x, y = points[idx, 0], points[idx, 1]
        prediction = (m_current * x) + b_current
        intercept_gradient += -(2 / count) * (y - prediction)
        slope_gradient += -(2 / count) * x * (y - prediction)
    updated_b = b_current - (learningRate * intercept_gradient)
    updated_m = m_current - (learningRate * slope_gradient)
    return [updated_b, updated_m]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and plot the error history.

    The error of the starting guess is reported as iteration 0 and the error
    after the k-th step as iteration k. The full history is handed to
    ``print_graf_rmse`` once the loop finishes.

    NOTE: the value labelled "RMSE" is whatever
    ``compute_error_for_line_given_points`` returns; in this file that is the
    mean of the squared residuals (no square root is taken).

    Args:
        points: Data rows, forwarded to ``step_gradient`` and the error function.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of steps to take.

    Returns:
        ``[b, m]`` after the last step.
    """
    b = starting_b
    m = starting_m
    # Convert once: the data does not change between iterations.
    points_array = np.array(points)
    RMSE = compute_error_for_line_given_points(b, m, points)
    # Collect rows in a list and build the array once at the end; stacking
    # inside the loop would copy the whole history on every iteration.
    history = [[RMSE, 0]]
    print("RMSE: {:.3f}, interacao: {}".format(RMSE, 0))
    # Number the steps from 1 so that 0 refers only to the starting guess and
    # the printed label matches the one stored for the plot.
    for iteration in range(1, num_iterations + 1):
        b, m = step_gradient(b, m, points_array, learning_rate)
        RMSE = compute_error_for_line_given_points(b, m, points)
        print("RMSE: {:.3f}, interacao: {}".format(RMSE, iteration))
        history.append([RMSE, iteration])
    print_graf_rmse(np.array(history))
    return [b, m]

def print_graf_rmse(array_):
    """Print the error history and plot it against the iteration number.

    Args:
        array_: Array whose transpose unpacks into exactly two sequences:
            the error values first, the iteration numbers second.
    """
    print(array_)
    errors, iterations = array_.T
    # Black markers for the individual samples, blue line joining them.
    plt.scatter(iterations, errors, color="black")
    plt.plot(iterations, errors, color="blue", linewidth=3)
    # NOTE(review): "Interação" reads as "interaction"; "Iteração" was
    # probably intended. Left unchanged here.
    plt.xlabel("Interação")
    plt.ylabel("RMSE")
    plt.show()

def run():
    """Fit a line to the module-level ``points`` and report the outcome.

    Prints the error of the starting guess, runs ``gradient_descent_runner``
    with the hyper-parameters fixed below, then prints the fitted intercept,
    slope and final error.
    """
    # Hyper-parameters of this experiment (largest learning rate tried).
    num_iterations = 1000
    learning_rate = 0.0002
    initial_b = 0  # initial y-intercept guess
    initial_m = 0  # initial slope guess

    starting_error = compute_error_for_line_given_points(initial_b, initial_m, points)
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m, starting_error))
    print("Running...")
    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, m, points)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m, final_error))


# Run the experiment only when this module is the entry point.
if __name__ == '__main__':
    run()

# Resposta da Questão 3

Os valores encontrados para obter w0 = -39 e w1 = 5 foram learning_rate = 0.003 e num_iterations = 40000.

In [None]:
def compute_error_for_line_given_points(b, m, points):
    """Return the mean squared residual of the line ``y = m * x + b``.

    Args:
        b: Intercept of the line.
        m: Slope of the line.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.

    Returns:
        The sum of squared residuals divided by the number of rows.
    """
    squared_error_sum = 0
    for row in points:
        x_value = row[0]
        y_value = row[1]
        residual = y_value - (m * x_value + b)
        squared_error_sum += residual ** 2
    return squared_error_sum / float(len(points))

def step_gradient(b_current, m_current, points, learningRate):
    """Take one gradient-descent step for the line ``y = m * x + b``.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.
        learningRate: Factor applied to each gradient before subtracting it.

    Returns:
        ``[new_b, new_m]``, the updated intercept and slope.
    """
    n_points = float(len(points))
    grad_b = 0
    grad_m = 0
    for row in points:
        x_i, y_i = row[0], row[1]
        residual = y_i - ((m_current * x_i) + b_current)
        # Each row contributes its share of the mean-squared-error gradient.
        grad_b += -(2 / n_points) * residual
        grad_m += -(2 / n_points) * x_i * residual
    return [
        b_current - (learningRate * grad_b),
        m_current - (learningRate * grad_m),
    ]

def gradient_descent_runner(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and plot the error history.

    The error of the starting guess is reported as iteration 0 and the error
    after the k-th step as iteration k. The full history is handed to
    ``print_graf_rmse`` once the loop finishes.

    NOTE: the value labelled "RMSE" is whatever
    ``compute_error_for_line_given_points`` returns; in this file that is the
    mean of the squared residuals (no square root is taken).

    Args:
        points: Data rows, forwarded to ``step_gradient`` and the error function.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of steps to take.

    Returns:
        ``[b, m]`` after the last step.
    """
    b = starting_b
    m = starting_m
    # Convert once: the data does not change between iterations.
    points_array = np.array(points)
    RMSE = compute_error_for_line_given_points(b, m, points)
    # Collect rows in a list and build the array once at the end; stacking
    # inside the loop would copy the whole history on every iteration, which
    # grows quadratically with the iteration count.
    history = [[RMSE, 0]]
    print("RMSE: {:.3f}, interacao: {}".format(RMSE, 0))
    # Number the steps from 1 so that 0 refers only to the starting guess and
    # the printed label matches the one stored for the plot.
    for iteration in range(1, num_iterations + 1):
        b, m = step_gradient(b, m, points_array, learning_rate)
        RMSE = compute_error_for_line_given_points(b, m, points)
        print("RMSE: {:.3f}, interacao: {}".format(RMSE, iteration))
        history.append([RMSE, iteration])
    print_graf_rmse(np.array(history))
    return [b, m]

def print_graf_rmse(array_):
    """Print the error history and plot it against the iteration number.

    Args:
        array_: Array whose transpose unpacks into exactly two sequences:
            the error values first, the iteration numbers second.
    """
    print(array_)
    errors, iterations = array_.T
    # Black markers for the individual samples, blue line joining them.
    plt.scatter(iterations, errors, color="black")
    plt.plot(iterations, errors, color="blue", linewidth=3)
    # NOTE(review): "Interação" reads as "interaction"; "Iteração" was
    # probably intended. Left unchanged here.
    plt.xlabel("Interação")
    plt.ylabel("RMSE")
    plt.show()

def run():
    """Fit a line to the module-level ``points`` and report the outcome.

    Prints the error of the starting guess, runs ``gradient_descent_runner``
    with the hyper-parameters fixed below, then prints the fitted intercept,
    slope and final error.
    """
    # Hyper-parameters chosen as the answer to question 3.
    num_iterations = 40000
    learning_rate = 0.003
    initial_b = 0  # initial y-intercept guess
    initial_m = 0  # initial slope guess

    starting_error = compute_error_for_line_given_points(initial_b, initial_m, points)
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m, starting_error))
    print("Running...")
    b, m = gradient_descent_runner(points, initial_b, initial_m, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, m, points)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m, final_error))


# Run the experiment only when this module is the entry point.
if __name__ == '__main__':
    run()

# Resposta da Questão 4

Utilizei a mesma função print_graf_rmse para a plotagem do gráfico; ela é chamada dentro da função gradient_norm. Nessa função, eu utilizo o número de iterações como critério de tolerância. As iterações começam com um valor x, e eu vou decrescendo até igualar a 0.

In [None]:
def compute_error_for_line_given_points(b, m, points):
    """Compute the mean squared error of the line ``y = m * x + b``.

    Args:
        b: Intercept of the line.
        m: Slope of the line.
        points: Sequence of rows; entry 0 of each row is read as x and
            entry 1 as y.

    Returns:
        The sum of squared residuals divided by the number of rows.
    """
    # The generator yields one squared residual per row, in row order.
    squared_residuals = ((row[1] - (m * row[0] + b)) ** 2 for row in points)
    return sum(squared_residuals) / float(len(points))

def step_gradient(b_current, m_current, points, learningRate):
    """Perform a single gradient-descent update of intercept and slope.

    Args:
        b_current: Current intercept.
        m_current: Current slope.
        points: Array indexed as ``points[i, 0]`` (x) and ``points[i, 1]`` (y).
        learningRate: Factor applied to each gradient before subtracting it.

    Returns:
        ``[new_b, new_m]``, the updated intercept and slope.
    """
    count = float(len(points))
    slope_gradient = 0
    intercept_gradient = 0
    for idx in range(len(points)):
        x, y = points[idx, 0], points[idx, 1]
        prediction = (m_current * x) + b_current
        intercept_gradient += -(2 / count) * (y - prediction)
        slope_gradient += -(2 / count) * x * (y - prediction)
    updated_b = b_current - (learningRate * intercept_gradient)
    updated_m = m_current - (learningRate * slope_gradient)
    return [updated_b, updated_m]

# Answer to question 4
def gradient_norm(points, starting_b, starting_m, learning_rate, num_iterations):
    """Run gradient descent while counting an iteration budget down to zero.

    Despite its name, this function does not evaluate the norm of the
    gradient; the only stopping rule is that the budget of ``num_iterations``
    steps has been used up. Exactly ``num_iterations`` steps are taken.

    Every history row is ``[error, iterations_remaining]``: the starting guess
    is labelled with the full budget and the last step with 0. The history is
    handed to ``print_graf_rmse`` once the loop finishes.

    NOTE: the value labelled "RMSE" is whatever
    ``compute_error_for_line_given_points`` returns; in this file that is the
    mean of the squared residuals (no square root is taken).

    Args:
        points: Data rows, forwarded to ``step_gradient`` and the error function.
        starting_b: Initial intercept.
        starting_m: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of steps to take (the countdown start value).

    Returns:
        ``[b, m]`` after the last step.
    """
    b = starting_b
    m = starting_m
    # Convert once: the data does not change between iterations.
    points_array = np.array(points)
    RMSE = compute_error_for_line_given_points(b, m, points)
    remaining = num_iterations
    # Collect rows in a list and build the array once at the end; stacking
    # inside the loop would copy the whole history on every iteration.
    history = [[RMSE, remaining]]
    # Strict comparison: a budget of N means N steps, not N + 1.
    while remaining > 0:
        b, m = step_gradient(b, m, points_array, learning_rate)
        RMSE = compute_error_for_line_given_points(b, m, points)
        # Decrement before reporting so the printed label and the stored label
        # agree and the countdown ends at 0 rather than -1.
        remaining -= 1
        print("RMSE: {:.3f}, iteracao: {}".format(RMSE, remaining))
        history.append([RMSE, remaining])
    print_graf_rmse(np.array(history))
    return [b, m]

def print_graf_rmse(array_):
    """Print the error history and plot it against the iteration number.

    Args:
        array_: Array whose transpose unpacks into exactly two sequences:
            the error values first, the iteration numbers second.
    """
    print(array_)
    errors, iterations = array_.T
    # Black markers for the individual samples, blue line joining them.
    plt.scatter(iterations, errors, color="black")
    plt.plot(iterations, errors, color="blue", linewidth=3)
    # NOTE(review): "Interação" reads as "interaction"; "Iteração" was
    # probably intended. Left unchanged here.
    plt.xlabel("Interação")
    plt.ylabel("RMSE")
    plt.show()

def run():
    """Fit a line to the module-level ``points`` and report the outcome.

    Prints the error of the starting guess, runs ``gradient_norm`` with the
    hyper-parameters fixed below, then prints the fitted intercept, slope
    and final error.
    """
    # Hyper-parameters of this experiment.
    num_iterations = 1000
    learning_rate = 0.0001
    initial_b = 0  # initial y-intercept guess
    initial_m = 0  # initial slope guess

    starting_error = compute_error_for_line_given_points(initial_b, initial_m, points)
    print("Starting gradient descent at b = {0}, m = {1}, error = {2}".format(
        initial_b, initial_m, starting_error))
    print("Running...")
    b, m = gradient_norm(points, initial_b, initial_m, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, m, points)
    print("After {0} iterations b = {1}, m = {2}, error = {3}".format(
        num_iterations, b, m, final_error))


# Run the experiment only when this module is the entry point.
if __name__ == '__main__':
    run()