## 입력변수 1개

In [1]:
import numpy as np

# Training set: ten samples with one input feature each (even numbers 2..20),
# stored as (10, 1) column vectors.  The first six samples are labelled 0 and
# the last four are labelled 1.
x_data = np.arange(2, 22, 2).reshape(10, 1)
t_data = np.array([0] * 6 + [1] * 4).reshape(10, 1)

In [2]:
# Random starting point for training: a (1, 1) weight matrix and a length-1
# bias vector, both drawn uniformly from [0, 1).
W = np.random.random_sample((1, 1))
b = np.random.random_sample((1,))

print(W, W.shape, b, b.shape)

[[0.89066521]] (1, 1) [0.98309878] (1,)


In [3]:
def sigmoid(x):
    """Return the logistic function 1 / (1 + e^(-x)), element-wise for arrays."""
    exp_neg = np.exp(-x)
    return 1 / (1 + exp_neg)

def loss_func(x, t):
    """Return the summed binary cross-entropy between sigmoid(x.W + b) and t.

    The weight ``W`` and bias ``b`` are read from module scope rather than
    passed in.

    Args:
        x: Input samples, multiplied with ``W`` via ``np.dot``.
        t: Target labels, broadcast against the model output.

    Returns:
        The cross-entropy summed over all elements (not averaged).
    """
    # Small offset that keeps log() from diverging to -infinity by making
    # sure its argument is never exactly 0.
    eps = 1e-7

    prob = sigmoid(np.dot(x, W) + b)

    # Cross-entropy, split into the contribution of the positive (t == 1)
    # and the negative (t == 0) targets.
    positive_term = t * np.log(prob + eps)
    negative_term = (1 - t) * np.log((1 - prob) + eps)
    return -np.sum(positive_term + negative_term)

In [5]:
def numerical_derivative(f,x):
    """Estimate the gradient of ``f`` with respect to ``x`` by central differences.

    Every element of ``x`` is nudged *in place* by ``+delta_x`` and
    ``-delta_x`` and ``f(x)`` is evaluated at both points.  Because the
    perturbation happens in the caller's array, ``f`` may either use its
    argument or read the same array through a closure / module-level name.
    Each element is restored before moving on, also when ``f`` raises.

    Args:
        f: Callable invoked as ``f(x)``; its result is used as a scalar.
        x: Floating-point ``numpy.ndarray`` of any shape.  It is modified
            temporarily and holds its original values again on return.

    Returns:
        An array with the same shape and dtype as ``x`` holding the
        estimated partial derivative for each element.

    Raises:
        TypeError: If ``x`` is not a floating-point ``numpy.ndarray``.  An
            integer array cannot store ``x +/- delta_x``; the perturbation
            would be truncated silently and the result would be meaningless.
    """
    if not isinstance(x, np.ndarray) or not np.issubdtype(x.dtype, np.floating):
        raise TypeError(
            "numerical_derivative requires a floating-point numpy.ndarray, "
            f"got {type(x).__name__}"
            + (f" with dtype {x.dtype}" if isinstance(x, np.ndarray) else "")
        )

    delta_x = 1e-4 # 0.0001
    grad = np.zeros_like(x)

    for idx in np.ndindex(x.shape):
        tmp_val = x[idx]
        try:
            x[idx] = float(tmp_val) + delta_x
            fx1 = f(x) # f(x+delta_x)

            x[idx] = float(tmp_val) - delta_x
            fx2 = f(x) # f(x-delta_x)
        finally:
            # Always undo the perturbation so a failing f() cannot leave the
            # caller's parameters shifted.
            x[idx] = tmp_val

        grad[idx] = (fx1 - fx2) / (2*delta_x)

    return grad
        
        
        

In [6]:
def predict(x):
    """Classify ``x`` with the logistic model defined by the module-level ``W`` and ``b``.

    Args:
        x: A single input value, or an array of samples that ``np.dot`` can
            multiply with ``W``.

    Returns:
        A tuple ``(y, result)``.  ``y`` is the sigmoid output.  ``result`` is
        the class label obtained by thresholding ``y`` at 0.5: a plain int
        (1 or 0) when ``y`` holds exactly one value, otherwise an integer
        array of 0/1 labels with the same shape as ``y``.
    """
    z = np.dot(x,W) + b
    y = sigmoid(z)

    # Threshold element-wise; a bare `if y > 0.5` raises ValueError as soon
    # as more than one sample is passed in.
    labels = np.asarray(y > 0.5).astype(int)

    if labels.size == 1:
        result = int(labels.item())  # 1 -> True, 0 -> False
    else:
        result = labels

    return y, result


In [10]:
# Gradient-descent step size.  If training diverges, rerun with a smaller
# value such as 1e-3 or 1e-6.
learning_rate = 1e-2


def f(x):
    """Return the loss on the training set; the argument itself is not used."""
    return loss_func(x_data, t_data)


print("initial error value = ", loss_func(x_data,t_data), "initial W = ", W, "\n", " , b = ", b)

for step in range(10001):

    # Update W first, then b; both are updated in place.
    W -= learning_rate * numerical_derivative(f, W)
    b -= learning_rate * numerical_derivative(f, b)

    # Report progress only on every 400th step.
    if step % 400 != 0:
        continue
    print("step = ", step, "error value = ", loss_func(x_data, t_data), "W = ", W, ", b = ", b)

initial error value =  25.698460497920124 initial W =  [[0.47402479]] 
  , b =  [0.92524798]
step =  0 error value =  9.880748708104118 W =  [[0.06164088]] , b =  [0.88257421]
step =  400 error value =  3.2553732945448375 W =  [[0.43554418]] , b =  [-4.07859269]
step =  800 error value =  1.7893736564514258 W =  [[0.4519302]] , b =  [-5.6219586]
step =  1200 error value =  1.5211612692637129 W =  [[0.52961814]] , b =  [-6.65647451]
step =  1600 error value =  1.354600202636975 W =  [[0.59107112]] , b =  [-7.47255548]
step =  2000 error value =  1.2375534391423106 W =  [[0.64271448]] , b =  [-8.15686222]
step =  2400 error value =  1.149040100919696 W =  [[0.6877068]] , b =  [-8.75197661]
step =  2800 error value =  1.0787745582280979 W =  [[0.72785204]] , b =  [-9.28219683]
step =  3200 error value =  1.0210388889618958 W =  [[0.76428529]] , b =  [-9.76279538]
step =  3600 error value =  0.9723633918542193 W =  [[0.79777101]] , b =  [-10.20404661]
step =  4000 error value =  0.93050184

In [11]:
# Query the model with x = 3 and show the sigmoid output and the 0/1 label.
real_val, logical_val = predict(3)

print(real_val, logical_val)

[[1.12364337e-05]] 0


In [12]:
# Query the model with x = 17 and show the sigmoid output and the 0/1 label.
real_val, logical_val = predict(17)

print(real_val, logical_val)

[[0.9912763]] 1
