In [1]:
import numpy as np

# Training set as column vectors: ten inputs (the even numbers 2..20) and
# their binary labels (0 for the first six samples, 1 for the last four).
x_data = np.arange(2, 21, 2).reshape(-1, 1)
t_data = np.array([0] * 6 + [1] * 4).reshape(-1, 1)

print("x_data.shape = ", x_data.shape, ", t_data.shape = ", t_data.shape)

x_data.shape =  (10, 1) , t_data.shape =  (10, 1)


In [2]:
# Draw the initial parameters from a locally seeded generator so that a
# "Restart Kernel -> Run All" reproduces the same starting point (and hence
# the same training trace) without touching NumPy's global random state.
SEED = 42
rng = np.random.default_rng(SEED)

W = rng.random((1, 1))  # weight, uniform in [0, 1), shape (1, 1)
b = rng.random(1)       # bias, uniform in [0, 1), shape (1,)
print("W = ", W, ", W.shape = ", W.shape, ", b = ", b, ", b.shape = ", b.shape)

W =  [[0.36012997]] , W.shape =  (1, 1) , b =  [0.53277542] , b.shape =  (1,)


In [3]:
# The final output is y = sigmoid(Wx + b), and the loss function is cross-entropy.

def sigmoid(x):
    """Return the logistic function 1 / (1 + exp(-x)), evaluated element-wise.

    The naive formula calls exp(-x), which overflows (and emits a
    RuntimeWarning) for large negative x.  Here exp() is only ever applied to
    a non-positive argument, and the algebraically equivalent form
    exp(x) / (1 + exp(x)) is used for negative inputs.

    Args:
        x: scalar or array-like of real numbers.

    Returns:
        A NumPy scalar for scalar / 0-d input, otherwise an ndarray with the
        same shape as ``x``.
    """
    x = np.asarray(x)
    decay = np.exp(-np.abs(x))  # lies in [0, 1], so it cannot overflow
    out = np.where(x >= 0, 1 / (1 + decay), decay / (1 + decay))
    # Indexing with () turns a 0-d result back into a scalar and leaves
    # higher-dimensional arrays as they are.
    return out[()]

In [5]:
def loss_func(x, t):
    """Binary cross-entropy of the current model on inputs ``x`` and targets ``t``.

    The model output is sigmoid(x . W + b), where ``W`` and ``b`` are the
    module-level parameters.  The per-element losses are summed (not
    averaged) into a single value.
    """
    eps = 1e-7  # keeps the log() arguments away from 0, i.e. avoids log(0) = -inf

    prob = sigmoid(np.dot(x, W) + b)

    positive_term = t * np.log(prob + eps)
    negative_term = (1 - t) * np.log((1 - prob) + eps)
    return -np.sum(positive_term + negative_term)

In [6]:
def numerical_derivative(f, x):
    """Estimate the gradient of ``f`` with respect to ``x`` by central differences.

    Each element of ``x`` is perturbed IN PLACE by +/- 1e-4, ``f(x)`` is
    evaluated at both points, and the element is then restored.  Mutating the
    caller's array is deliberate: it lets ``f`` be a closure that ignores its
    argument and reads the same array through another reference.

    The original value is restored in a ``finally`` clause, so ``x`` is left
    unchanged even if ``f`` raises or the evaluation is interrupted.

    Args:
        f: callable invoked as ``f(x)`` and returning a scalar.
        x: ndarray of parameters; it should have a floating-point dtype,
            because the perturbation is written back into the array itself.

    Returns:
        An array shaped (and typed) like ``x`` holding the estimated partial
        derivatives.
    """
    delta_x = 1e-4
    grad = np.zeros_like(x)

    # np.ndindex yields every multi-index of x in C order.
    for idx in np.ndindex(x.shape):
        tmp_val = x[idx]
        try:
            x[idx] = float(tmp_val) + delta_x
            fx1 = f(x)

            x[idx] = tmp_val - delta_x
            fx2 = f(x)
        finally:
            # Always undo the perturbation, even on error.
            x[idx] = tmp_val

        grad[idx] = (fx1 - fx2) / (2 * delta_x)

    return grad

In [7]:
def error_val(x, t):
    """Return the current cross-entropy error of the model on ``(x, t)``.

    This is the same quantity that ``loss_func`` computes, so it delegates to
    it instead of repeating the formula; the reported error and the optimised
    loss therefore cannot drift apart.
    """
    return loss_func(x, t)

In [8]:
def predict(x):
    """Run the trained model on ``x`` and threshold its output at 0.5.

    Uses the module-level parameters ``W`` and ``b``.

    Args:
        x: a single input value, or an array of inputs whose last dimension
            is compatible with ``np.dot(x, W)`` (for example ``x_data``).

    Returns:
        A tuple ``(y, result)``.  ``y`` is the sigmoid output.  For a single
        sample ``result`` is the plain int 1 or 0; for a batch it is an
        integer array of 0/1 labels shaped like ``y``.  (Thresholding a batch
        with a bare ``if y >= 0.5`` would raise ValueError, because the truth
        value of a multi-element array is ambiguous.)
    """
    z = np.dot(x, W) + b
    y = sigmoid(z)

    labels = (y >= 0.5).astype(int)
    if labels.size == 1:
        # Single sample: keep returning a plain Python int.
        result = int(labels.item())
    else:
        result = labels

    return y, result

In [10]:
learning_rate = 1e-2

# The argument is intentionally ignored: loss_func reads the module-level W and
# b, and numerical_derivative perturbs exactly those arrays in place, so every
# call to f sees the perturbed parameters.
f = lambda _params: loss_func(x_data, t_data)

print("Initial error value = ", error_val(x_data, t_data), "Initial W = ", W, "\n", ", b = ", b)

for step in range(10001):
    # In-place updates (-=) keep W and b the same array objects that f reads.
    # W is updated first, so the gradient for b is taken at the new W.
    grad_W = numerical_derivative(f, W)
    W -= learning_rate * grad_W

    grad_b = numerical_derivative(f, b)
    b -= learning_rate * grad_b

    # Report progress every 400 steps.
    if step % 400 == 0:
        print("step = ", step, "error value = ", error_val(x_data, t_data), "W = ", W, ", b = ", b)

Initial error value =  18.83194404232449 Initial W =  [[0.36012997]] 
 , b =  [0.53277542]
step =  0 error value =  8.05461980185721 W =  [[-0.04061467]] , b =  [0.52065513]
step =  400 error value =  2.757390958028708 W =  [[0.28359181]] , b =  [-4.15554844]
step =  800 error value =  1.7754203974486806 W =  [[0.45546722]] , b =  [-5.66912607]
step =  1200 error value =  1.5131443627330061 W =  [[0.53230546]] , b =  [-6.69220308]
step =  1600 error value =  1.3492080814032952 W =  [[0.59327941]] , b =  [-7.50184433]
step =  2000 error value =  1.2335883812269497 W =  [[0.64461123]] , b =  [-8.18197014]
step =  2400 error value =  1.1459528805526868 W =  [[0.68938275]] , b =  [-8.77412617]
step =  2800 error value =  1.076273569703595 W =  [[0.72936223]] , b =  [-9.30212894]
step =  3200 error value =  1.0189530342875015 W =  [[0.7656658]] , b =  [-9.78099533]
step =  3600 error value =  0.9705847151224852 W =  [[0.79904689]] , b =  [-10.22085082]
step =  4000 error value =  0.92895835

In [11]:
# Query the trained model at x = 3: predict returns the sigmoid output and the
# label obtained by thresholding it at 0.5.
real_val, logical_val = predict(3)
print(real_val, logical_val)

[[1.11625318e-05]] 0


In [12]:
# Query the trained model at x = 17: predict returns the sigmoid output and the
# label obtained by thresholding it at 0.5.
real_val, logical_val = predict(17)
print(real_val, logical_val)

[[0.99129846]] 1
