In [49]:
import numpy as np

#- input data x_data: total study hours
#- result data t_data: fail or pass 
x_data = np.array([2, 4, 6, 8, 10, 12, 14, 16, 18, 20]).reshape(10,1)   
t_data = np.array([0, 0, 0, 0,  0,  0,  1,  1,  1,  1]).reshape(10,1)
delta  = 1e-7

print("x_data.shape = ", x_data.shape, ", t_data.shape = ", t_data.shape)

x_data.shape =  (10, 1) , t_data.shape =  (10, 1)


In [50]:
W = np.random.rand(1,1)  
b = np.random.rand(1)  
print("W = ", W, ", W.shape = ", W.shape, ", b = ", b, ", b.shape = ", b.shape)

W =  [[0.46413202]] , W.shape =  (1, 1) , b =  [0.07976486] , b.shape =  (1,)


In [51]:
def sigmoid(x):
    return 1 / (1+np.exp(-x))

def loss_func(x, t):

    #- X: input data
    #- T: answer data
    #- W: weight
    #- b: bias
    #
    #- z = WX + b
    #- y = sigmoid(z)
    z = np.dot(x,W) + b
    y = sigmoid(z)
    
    # cross-entropy 
    # E(W,b) = -log L(W,b) <-- L(W,b) : likelyhood function
    return  -np.sum( t*np.log(y + delta) + (1-t)*np.log((1 - y)+delta ) )


In [54]:
def numerical_derivative_updated(f, x):
    grad = np.zeros_like(x)
    
    it = np.nditer(x, flags=['multi_index'], op_flags=['readwrite'])
    
    while not it.finished:
        idx = it.multi_index        
        tmp_val = x[idx]
        x[idx] = float(tmp_val) + delta
        fx1 = f(x) # f(x+delta)
        
        x[idx] = tmp_val - delta 
        fx2 = f(x) # f(x-delta)
        grad[idx] = (fx1 - fx2) / (2*delta)
        
        x[idx] = tmp_val 
        it.iternext()   
        
    return grad

def numerical_derivative(f, x):
    fx1 = f(x+delta)
    fx2 = f(x-delta)
    
    return (fx1 - fx2) / (2*delta)
        

def error_val(x, t):
    
    z = np.dot(x,W) + b
    y = sigmoid(z)
    print(delta)
    
    # cross-entropy 
    return  -np.sum( t*np.log(y + delta) + (1-t)*np.log((1 - y) + delta ) ) 


def predict(x):
    
    z = np.dot(x,W) + b
    y = sigmoid(z)
    
    if y >= 0.5:
        result = 1  # True
    else:
        result = 0  # False
    
    return y, result

In [55]:

learning_rate = 1e-4


f = lambda x : loss_func(x_data,t_data)  # f(x) = loss_func(x_data, t_data)

print("Initial error value = ", error_val(x_data, t_data), "Initial W = ", W, "\n", ", b = ", b )

for step in  range(10001):  
    
    W -= learning_rate * numerical_derivative(f, W)
    
    b -= learning_rate * numerical_derivative(f, b)
    
    if (step % 400 == 0):
        print("step = ", step, "error value = ", error_val(x_data, t_data), "W = ", W, ", b = ",b )

1e-07
Initial error value =  4.403154975684961 Initial W =  [[0.14312005]] 
 , b =  [-1.48296243]
1e-07
step =  0 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  400 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  800 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  1200 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  1600 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  2000 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  2400 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  2800 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  3200 error value =  4.403154975684961 W =  [[0.14312005]] , b =  [-1.48296243]
1e-07
step =  3600 error value =  4.403154975684961 W =  [[0.14312005]

In [56]:
(real_val, logical_val) = predict(20) 

print(real_val, logical_val)

[[0.79890082]] 1


In [57]:
(real_val, logical_val) = predict(13) 

print(real_val, logical_val)

[[0.59329369]] 1
