# 02 梯度下降

### Gradient Descent
<img src='./images/04.png' style = "zoom:50%">

## 线性回归实战示例：

In [1]:
import numpy as np

#### <font color=green>计算损失函数:</font>
$$loss=\frac{1}{N}\sum_{i=1}^{N}(y_i-(w*x_i+b))^2$$

In [2]:
# y = w * x + b
def compute_error_for_line_given_points(b, w, points):
    """Return the mean squared error of the line y = w * x + b over ``points``.

    Args:
        b: y-intercept of the line.
        w: slope of the line.
        points: 2-D array-like; column 0 is read as x and column 1 as y.
            Anything ``np.asarray`` can convert (ndarray, list of pairs, ...)
            is accepted.

    Returns:
        The average of (y - (w * x + b)) ** 2 over all rows.

    Raises:
        ZeroDivisionError: if ``points`` contains no rows (the mean is undefined).
    """
    data = np.asarray(points, dtype=float)
    n_points = len(data)
    if n_points == 0:
        # Same exception type the division by len(points) has always produced,
        # raised explicitly so NumPy does not silently return NaN instead.
        raise ZeroDivisionError("points is empty: mean squared error is undefined")
    # Vectorised residuals: one NumPy expression instead of a Python loop per row.
    residuals = data[:, 1] - (w * data[:, 0] + b)
    return np.sum(residuals ** 2) / float(n_points)

#### <font color=green>计算梯度下降:</font>
$$ w'=w-lr*\frac{\partial loss}{\partial w},\qquad b'=b-lr*\frac{\partial loss}{\partial b}$$

In [3]:
def step_gradient(b_current, w_current, points, learning_rate):
    """Perform one gradient-descent update of (b, w) for the line y = w * x + b.

    The gradients are those of the mean squared error over ``points``:
        d(loss)/db = -(2 / N) * sum(y - (w * x + b))
        d(loss)/dw = -(2 / N) * sum(x * (y - (w * x + b)))

    Args:
        b_current: current y-intercept.
        w_current: current slope.
        points: 2-D array-like; column 0 is read as x and column 1 as y.
            Anything ``np.asarray`` can convert is accepted.
        learning_rate: step size multiplied into each gradient.

    Returns:
        ``[new_b, new_w]`` after a single update step. With no rows in
        ``points`` both gradients are zero, so the parameters are unchanged.
    """
    data = np.asarray(points, dtype=float)
    n_points = len(data)
    b_gradient = 0
    w_gradient = 0
    if n_points > 0:
        x = data[:, 0]
        y = data[:, 1]
        # Residuals for every sample at once instead of a Python loop per row.
        residuals = y - (w_current * x + b_current)
        scale = -(2.0 / n_points)
        b_gradient = scale * residuals.sum()
        w_gradient = scale * (x * residuals).sum()
    new_b = b_current - (learning_rate * b_gradient)
    new_w = w_current - (learning_rate * w_gradient)
    return [new_b, new_w]

#### <font color=green>迭代优化:</font>

In [4]:
def gradient_descent_runner(points, starting_b, starting_w, learning_rate, num_iterations):
    """Run ``num_iterations`` gradient-descent steps and return the fitted line.

    Args:
        points: array-like of samples, passed to ``step_gradient`` as an ndarray.
        starting_b: initial y-intercept.
        starting_w: initial slope.
        learning_rate: step size forwarded to ``step_gradient``.
        num_iterations: number of update steps to perform.

    Returns:
        ``[b, w]`` after the final step (the starting values if
        ``num_iterations`` is 0).
    """
    # Convert once, outside the loop: the data does not change between steps,
    # and np.asarray avoids copying when ``points`` is already an ndarray.
    data = np.asarray(points)
    b = starting_b
    w = starting_w
    for _ in range(num_iterations):
        b, w = step_gradient(b, w, data, learning_rate)
    return [b, w]

In [5]:
def run(data_path="./data/data.csv", learning_rate=0.0001, num_iterations=1000,
        initial_b=0, initial_w=0):
    """Fit y = w * x + b to a comma-delimited CSV by gradient descent and print the result.

    Args:
        data_path: path of the CSV file loaded with ``np.genfromtxt``.
        learning_rate: step size used for every gradient-descent update.
        num_iterations: number of update steps to run.
        initial_b: initial y-intercept guess.
        initial_w: initial slope guess.

    Prints the mean squared error for the initial guess, then the fitted
    ``b`` and ``w`` and their error after training. Returns nothing.
    """
    points = np.genfromtxt(data_path, delimiter=",")
    initial_error = compute_error_for_line_given_points(initial_b, initial_w, points)
    # The slope is labelled "w" to match the parameter name used everywhere else.
    print("Starting gradient descent at b = {0}, w = {1}, error = {2}"
          .format(initial_b, initial_w, initial_error))
    print("Running...")
    b, w = gradient_descent_runner(points, initial_b, initial_w, learning_rate, num_iterations)
    final_error = compute_error_for_line_given_points(b, w, points)
    print("After {0} iterations b = {1}, w = {2}, error = {3}"
          .format(num_iterations, b, w, final_error))

#### <font color=green>真值比较:</font>
$$y=1.477*x+0.089$$

In [6]:
# Load the CSV data, run gradient descent, and print the error before and after.
run()

Starting gradient descent at b = 0, m = 0, error = 5565.107834483211
Running...
Afer 1000 iterations b = 0.08893651993741346, w = 1.4777440851894448, error = 112.61481011613473
