In [16]:
import numpy as np

$$loss=\frac{1}{N}\sum_{i=1}^{N}{(w*x_i+b-y_i)^2}$$

In [17]:
def compute_error_for_line_given_points(b, w, points):
    """Return the mean squared error of the line ``y = w * x + b`` over ``points``.

    Args:
        b: Intercept of the line.
        w: Slope of the line.
        points: Array-like of shape (N, 2) or wider; column 0 holds x and
            column 1 holds y. Anything ``np.asarray`` can convert to a float
            array is accepted (ndarray, list of pairs, ...).

    Returns:
        The mean of ``((w * x + b) - y) ** 2`` over all rows.

    Raises:
        ValueError: If ``points`` is empty or is not 2-D with at least two
            columns (previously an empty input surfaced as a bare
            ZeroDivisionError).
    """
    pts = np.asarray(points, dtype=float)
    if pts.ndim != 2 or pts.shape[0] == 0 or pts.shape[1] < 2:
        raise ValueError(
            "points must be a non-empty 2-D array-like with x in column 0 and y in column 1"
        )
    # Residual of every point at once: predicted y minus observed y.
    residuals = (w * pts[:, 0] + b) - pts[:, 1]
    # Squared residual is the per-point loss; the mean is the reported error.
    return np.mean(residuals ** 2)

$$
\begin{aligned}
w^{'} &= w-lr*\frac{\partial{loss}}{\partial{w}} \\
\frac{\partial{loss}}{\partial{w}} &= \frac{2}{N}\sum_{i=1}^{N}{(w*x_i+b-y_i)*x_i} \\
b^{'} &= b-lr*\frac{\partial{loss}}{\partial{b}} \\
\frac{\partial{loss}}{\partial{b}} &= \frac{2}{N}\sum_{i=1}^{N}{(w*x_i+b-y_i)}
\end{aligned}
$$

In [18]:
def step_gradient(b_current, w_current, points, learningRate):
    """Perform one gradient-descent update of the line ``y = w * x + b``.

    The gradients are those of the mean squared error:
    ``d/db = (2/N) * sum(w*x + b - y)`` and
    ``d/dw = (2/N) * sum(x * (w*x + b - y))``.

    Args:
        b_current: Current intercept.
        w_current: Current slope.
        points: Array-like of shape (N, 2) or wider; column 0 holds x and
            column 1 holds y. Anything ``np.asarray`` can convert to a float
            array is accepted.
        learningRate: Step size multiplied onto each gradient.

    Returns:
        ``[new_b, new_w]`` - the updated intercept and slope. When ``points``
        is empty both gradients are zero, so the inputs are returned
        unchanged.
    """
    pts = np.asarray(points, dtype=float)
    n = len(pts)
    if n == 0:
        # No data means no gradient; also avoids dividing by zero below.
        return [b_current, w_current]

    x = pts[:, 0]
    y = pts[:, 1]
    # Prediction error for every point, computed in one vectorized pass.
    residuals = (w_current * x + b_current) - y
    b_gradient = (2.0 / n) * residuals.sum()
    w_gradient = (2.0 / n) * (x * residuals).sum()

    new_b = b_current - (learningRate * b_gradient)
    new_w = w_current - (learningRate * w_gradient)
    return [new_b, new_w]

In [22]:
# Add an animation to the linear regression fit
import matplotlib.pyplot as plt
import matplotlib.animation as animation
%matplotlib osx
class DataAnimation:
    """Scatter plot of the data with a fitted line that can be animated.

    The line is drawn on a fixed x grid and redrawn for each ``[b, w]`` frame
    supplied to :meth:`add_animation`.
    """

    def __init__(self, b, w, points):
        """Create the figure, plot the data and draw the initial line.

        Args:
            b: Initial intercept of the line.
            w: Initial slope of the line.
            points: Array-like of shape (N, 2) or wider; column 0 is plotted
                as x and column 1 as y.
        """
        points = np.asarray(points)
        self.fig, self.ax = plt.subplots()
        self.ax.scatter(points[:, 0], points[:, 1])
        # Fixed x grid on which the line is evaluated for every frame.
        self.x = np.linspace(1, 100, 10)
        self.y = w * self.x + b
        self.ln, = self.ax.plot(self.x, self.y)
        # Holds the FuncAnimation once add_animation() has been called.
        self.ani = None

    def animation_update(self, frame):
        """Redraw the line for one frame.

        Args:
            frame: Indexable pair where ``frame[0]`` is the intercept and
                ``frame[1]`` is the slope.

        Returns:
            A one-element tuple containing the updated line artist, as
            required when blitting is enabled.
        """
        self.y = frame[1] * self.x + frame[0]
        self.ln.set_data(self.x, self.y)
        return self.ln,

    def add_animation(self, fs, filename="a.gif"):
        """Build the animation from ``fs`` and optionally save it to disk.

        Args:
            fs: Sequence of ``[b, w]`` frames passed to ``animation_update``.
            filename: Path the animation is saved to. Defaults to ``"a.gif"``;
                pass ``None`` to skip saving.
        """
        # Keep the animation on the instance: matplotlib requires a live
        # reference, otherwise it may be garbage-collected and stop running
        # before show() is called.
        self.ani = animation.FuncAnimation(
            self.fig, self.animation_update, frames=fs, interval=10, blit=True
        )
        if filename is not None:
            self.ani.save(filename)

    def show(self):
        """Display the figure via ``plt.show()``."""
        plt.show()
    
def gradient_descent_runner(points, starting_b, starting_w, learning_rate, num_iterations):
    """Run gradient descent for a fixed number of steps and animate the fit.

    Args:
        points: Array-like of shape (N, 2) or wider; column 0 holds x and
            column 1 holds y.
        starting_b: Initial intercept.
        starting_w: Initial slope.
        learning_rate: Step size forwarded to ``step_gradient``.
        num_iterations: Number of gradient steps to take.

    Returns:
        ``[b, w]`` - the intercept and slope after the final step.

    Side effects:
        Builds a ``DataAnimation`` from the per-step parameters, which saves
        the animation to disk and shows the figure.
    """
    # Convert once up front: the data never changes between iterations, so
    # re-copying it on every step is wasted work. This also guarantees the
    # plot helper receives an ndarray it can slice by column.
    points = np.asarray(points)
    b = starting_b
    w = starting_w
    frames = []
    ba = DataAnimation(b, w, points)
    for _ in range(num_iterations):
        b, w = step_gradient(b, w, points, learning_rate)
        # Record every intermediate fit so it can be replayed as a frame.
        frames.append([b, w])
    ba.add_animation(frames)
    ba.show()
    return [b, w]

In [23]:
def run(data_path="data.csv", learning_rate=0.0001, initial_b=0, initial_w=0, num_iterations=1000):
    """Fit a line to the points in a CSV file and print the error before and after.

    Args:
        data_path: Path of the comma-delimited file to load; column 0 is used
            as x and column 1 as y. Defaults to ``"data.csv"``.
        learning_rate: Gradient-descent step size. Defaults to ``0.0001``.
        initial_b: Starting intercept. Defaults to ``0``.
        initial_w: Starting slope. Defaults to ``0``.
        num_iterations: Number of gradient steps. Defaults to ``1000``.

    Calling ``run()`` with no arguments uses the same file and settings that
    were previously hard-coded.
    """
    points = np.genfromtxt(data_path, delimiter=",")
    starting_error = compute_error_for_line_given_points(initial_b, initial_w, points)
    print("b = {0}, w = {1}, error = {2}"
          .format(initial_b, initial_w, starting_error))
    print("Running....")
    [b, w] = gradient_descent_runner(points, initial_b, initial_w, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, w, points)
    print("b = {0}, w = {1}, error = {2}"
          .format(b, w, final_error))

In [24]:
# Entry point: run the full fit when this cell/script is executed directly.
if __name__ == "__main__":
    run()

b = 0, w = 0, error = 5565.107834483211
Running....
b = 0.08893651993741346, w = 1.4777440851894448, error = 112.61481011613473
