In [1]:
import numpy as np

x_data = np.array([1, 2, 3, 4, 5]).reshape(5,1)
t_data = np.array([2, 3, 4, 5, 6]).reshape(5,1) 

# raw_data = [ [1, 2], [2, 3], [3, 4], [4, 5], [5, 6] ]

print("x_data.shape = ", x_data.shape, ", t_data.shape = ", t_data.shape)

x_data.shape =  (5, 1) , t_data.shape =  (5, 1)


In [2]:
W = np.random.rand(1,1)  
b = np.random.rand(1)  
print("W = ", W, ", W.shape = ", W.shape, ", b = ", b, ", b.shape = ", b.shape)

W =  [[0.2732017]] , W.shape =  (1, 1) , b =  [0.09227294] , b.shape =  (1,)


In [3]:
def loss_func(x, t):
    y = np.dot(x,W) + b
    
    return ( np.sum( (t - y)**2 ) ) / ( len(x) )

In [4]:
def numerical_derivative(f, x):
    delta_x = 1e-4 # 0.0001
    grad = np.zeros_like(x)
    
    it = np.nditer(x, flags=['multi_index'], op_flags=['readwrite'])
    
    while not it.finished:
        idx = it.multi_index        
        tmp_val = x[idx]
        x[idx] = float(tmp_val) + delta_x
        fx1 = f(x) # f(x+delta_x)
        
        x[idx] = tmp_val - delta_x 
        fx2 = f(x) # f(x-delta_x)
        grad[idx] = (fx1 - fx2) / (2*delta_x)
        
        x[idx] = tmp_val 
        it.iternext()   
        
    return grad

In [5]:
# 손실함수 값 계산 함수
# 입력변수 x, t : numpy type
def error_val(x, t):
    y = np.dot(x,W) + b
    
    return ( np.sum( (t - y)**2 ) ) / ( len(x) )

# 학습을 마친 후, 임의의 데이터에 대해 미래 값 예측 함수
# 입력변수 x : numpy type
def predict(x):
    y = np.dot(x,W) + b
    
    return y

In [6]:
learning_rate = 1e-2  # 발산하는 경우, 1e-3 ~ 1e-6 등으로 바꾸어서 실행

f = lambda x : loss_func(x_data,t_data)

print("Initial error value = ", error_val(x_data, t_data), "Initial W = ", W, "\n", ", b = ", b )

for step in  range(8001):  
    
    W -= learning_rate * numerical_derivative(f, W)
    
    b -= learning_rate * numerical_derivative(f, b)
    
    if (step % 400 == 0):
        print("step = ", step, "error value = ", error_val(x_data, t_data), "W = ", W, ", b = ",b )

Initial error value =  10.592968748813842 Initial W =  [[0.2732017]] 
 , b =  [0.09227294]
step =  0 error value =  6.266690386931802 W =  [[0.48756095]] , b =  [0.14117383]
step =  400 error value =  0.005786135131648475 W =  [[1.04939591]] , b =  [0.82170873]
step =  800 error value =  0.00036918962887293644 W =  [[1.01247732]] , b =  [0.95496392]
step =  1200 error value =  2.3556480961155766e-05 W =  [[1.00315175]] , b =  [0.98862396]
step =  1600 error value =  1.5030427505977267e-06 W =  [[1.00079613]] , b =  [0.99712643]
step =  2000 error value =  9.590301343600435e-08 W =  [[1.0002011]] , b =  [0.99927414]
step =  2400 error value =  6.119179233183848e-09 W =  [[1.0000508]] , b =  [0.99981665]
step =  2800 error value =  3.9043981149672865e-10 W =  [[1.00001283]] , b =  [0.99995369]
step =  3200 error value =  2.4912368244540766e-11 W =  [[1.00000324]] , b =  [0.9999883]
step =  3600 error value =  1.5895563762901447e-12 W =  [[1.00000082]] , b =  [0.99999704]
step =  4000 err

In [7]:
predict(43) 

array([[44.]])