In [8]:
import numpy as np

x_data = np.array([2,4,6,8,10,12,14,16,18,20]).reshape(10,1)
t_data = np.array([0,0,0,0,0,0,1,1,1,1]).reshape(10,1)

In [9]:
W = np.random.rand(1,1)
b = np.random.rand(1)
print("W =", W, ", W,shape =", W.shape, ", b =", b, ", b.shape =", b.shape)

W = [[0.73766259]] , W,shape = (1, 1) , b = [0.1948421] , b.shape = (1,)


In [10]:
def sigmoid(x):
    return 1 / (1+np.exp(-x))

def loss_func(x, t):
    
    delta = 1e-7     # log 무한대 발산 방지
    
    z = np.dot(x, W) + b
    y = sigmoid(z)
    
    # cross-entropy
    return -np.sum( t*np.log(y + delta) + (1-t) * np.log((1 - y) + delta) )

In [11]:
# 수치미분 함수
def numerical_derivative(f, x):
    delta_x = 1e-4 # 0.000
    grad = np.zeros_like(x) # x 크기의 어레이 선언 및 초기화
    
    it = np.nditer(x, flags = ['multi_index'], op_flags = ['readwrite'])
    
    while not it.finished:
        idx = it.multi_index
        tmp_val = x[idx] # x 바뀌기 때문에 저장해둠
        x[idx]= float(tmp_val) + delta_x
        fx1 = f(x) # f(x+delta_x)
        
        x[idx] = tmp_val - delta_x
        fx2 = f(x) # f(x-delta_x)
        grad[idx] = (fx1 - fx2) / (2*delta_x)
        
        x[idx] = tmp_val
        it.iternext()
        
    return grad

In [12]:
def error_val(x, t):
    delta = 1e-7      # log 무한대 발산 방지
    
    z = np.dot(x, W) + b
    y = sigmoid(z)
    
     # cross-entropy
    return -np.sum( t*np.log(y + delta) + (1-t) * np.log((1 - y) + delta) )

def predict(x):
    
    z = np.dot(x, W) + b
    y = sigmoid(z)
    
    if y  > 0.5:
        result = 1     # True
    else :
        result = 0     # False
        
    return y, result

In [13]:
learning_rate = 1e-2 # 발산하는 경우 1e-3 ~ 1e-6 등으로 바꿔 실행

f = lambda x : loss_func(x_data, t_data) # f(x) = loss_func(x_data, t_data)

print("Initial error value =", error_val(x_data, t_data), "Initial W =", W, "\n", ", b=", b)

for step in range(10001):
    
    W -= learning_rate * numerical_derivative(f, W)
    b -= learning_rate * numerical_derivative(f, b)
    
    if (step % 400 == 0):
        print("step =", step, "error value", error_val(x_data, t_data), "W =", W, ", b=", b)
    

Initial error value = 32.377090499139406 Initial W = [[0.73766259]] 
 , b= [0.1948421]
step = 0 error value 15.274598988436253 W = [[0.3234422]] , b= [0.14198734]
step = 400 error value 2.9106618162237328 W = [[0.43221359]] , b= [-4.25410853]
step = 800 error value 1.7614092756492976 W = [[0.45906752]] , b= [-5.71713111]
step = 1200 error value 1.5050244590416364 W = [[0.53505266]] , b= [-6.72872379]
step = 1600 error value 1.3437218130159139 W = [[0.595542]] , b= [-7.53185083]
step = 2000 error value 1.2295428418690257 W = [[0.64655731]] , b= [-8.20772921]
step = 2400 error value 1.1427970869805963 W = [[0.69110388]] , b= [-8.79687152]
step = 2800 error value 1.073713590230537 W = [[0.73091415]] , b= [-9.32261099]
step = 3200 error value 1.0168158242978982 W = [[0.76708517]] , b= [-9.79970688]
step = 3600 error value 0.9687608155033726 W = [[0.80035919]] , b= [-10.2381342]
step = 4000 error value 0.9273746380705581 W = [[0.83126384]] , b= [-10.64497566]
step = 4400 error value 0.89117

In [14]:
(real_val, logical_val) = predict(3)

print(real_val, logical_val)

[[1.10868807e-05]] 0


In [15]:
(real_val, logical_val) = predict(17)

print(real_val, logical_val)

[[0.99132124]] 1
