#### MultiVariable Classification 구현_CrossEntropy ver
#### 주의해서 볼 함수는 sigmoid,  loss_func,  predict 함수

In [1]:
import numpy as np
from datetime import datetime

def numerical_derivative(f, x):
    """Estimate the gradient of ``f`` at ``x`` using central differences.

    Every element of ``x`` is nudged up and then down by a small step *in
    place*, ``f`` is evaluated at both points, and the element is restored
    before moving on, so ``x`` holds its starting values again on return.

    Args:
        f: Callable invoked as ``f(x)``. The two results are subtracted and
            divided by the step, so it should return a scalar.
        x: NumPy array marking the point of evaluation. It is modified
            temporarily while the function runs.

    Returns:
        An array created with ``np.zeros_like(x)`` whose entries are the
        estimated partial derivatives for the matching entries of ``x``.
    """
    step = 1e-4  # 0.0001
    gradient = np.zeros_like(x)

    walker = np.nditer(x, flags=['multi_index'], op_flags=['readwrite'])
    for _ in walker:
        pos = walker.multi_index
        saved = x[pos]

        x[pos] = float(saved) + step
        f_plus = f(x)  # f(x + step)

        x[pos] = saved - step
        f_minus = f(x)  # f(x - step)

        gradient[pos] = (f_plus - f_minus) / (2 * step)

        # Put the original value back before visiting the next element.
        x[pos] = saved

    return gradient

In [2]:
# The model output is y = sigmoid(Wx + b); the loss is cross-entropy.

def sigmoid(z):
    """Return the logistic function 1 / (1 + exp(-z)) element-wise.

    The naive formula overflows inside ``exp`` for large negative ``z``.
    Here the exponential is always taken of a non-positive number, so it
    stays within (0, 1] and cannot overflow.

    Args:
        z: Scalar or array-like of real numbers.

    Returns:
        Values in [0, 1] with the same shape as ``z`` (a NumPy scalar when
        ``z`` is a scalar).
    """
    z = np.asarray(z)
    e = np.exp(-np.abs(z))  # exp of a non-positive value: never overflows

    # z >= 0: 1 / (1 + exp(-z));  z < 0: exp(z) / (1 + exp(z)) -- same value.
    out = np.where(z >= 0, 1.0 / (1.0 + e), e / (1.0 + e))

    # Indexing with () turns a 0-d result back into a scalar and leaves
    # arrays of higher rank as they are.
    return out[()]

In [3]:
# x_data rows are (preview study time, review study time)
# t_data labels are 1 (Pass) or 0 (Fail), one per row of x_data

x_data = [
    [2, 4],
    [4, 11],
    [6, 6],
    [8, 5],
    [10, 7],
    [12, 16],
    [14, 8],
    [16, 3],
    [18, 7],
]
t_data = [
    0, 0, 0, 0,
    1, 1, 1, 1, 1,
]

In [4]:
# Random starting parameters: W has one row per input feature, b is a
# single bias term.
W = np.random.rand(2, 1)
b = np.random.rand(1)

print(
    "W = ", W,
    ", W.shape = ", W.shape,
    ", b = ", b,
    ", b.shape = ", b.shape,
)

W =  [[0.78777337]
 [0.9559968 ]] , W.shape =  (2, 1) , b =  [0.11868164] , b.shape =  (1,)


In [5]:
def loss_func(x, t):
    """Return the summed cross-entropy of the current model on ``(x, t)``.

    The prediction is ``sigmoid(np.dot(x, W) + b)`` using the module-level
    parameters ``W`` and ``b``.

    Args:
        x: Input samples, multiplied with ``W`` via ``np.dot``.
        t: Target labels combined element-wise with the predictions.

    Returns:
        The negated sum of ``t*log(y) + (1-t)*log(1-y)`` over all entries.
    """
    eps = 1e-7  # keeps the log arguments away from 0, where log is -inf

    prediction = sigmoid(np.dot(x, W) + b)

    # The two halves of the cross-entropy, evaluated element-wise.
    pass_term = t * np.log(prediction + eps)
    fail_term = (1 - t) * np.log((1 - prediction) + eps)

    return -np.sum(pass_term + fail_term)

# Reports the current value of the loss function.
# Inputs x and t are NumPy arrays.
def error_val(x, t):
    """Return the cross-entropy loss of the current ``W`` and ``b`` on ``(x, t)``.

    The value is exactly the one ``loss_func`` computes, so the work is
    handed to it rather than repeated here.
    """
    return loss_func(x, t)

# After training, predicts the outcome for arbitrary input data.
# Input test_data is a NumPy array.
def predict(test_data):
    """Classify ``test_data`` with the module-level parameters ``W`` and ``b``.

    Args:
        test_data: One sample, or a batch with one sample per row; it is
            multiplied with ``W`` via ``np.dot``.

    Returns:
        A tuple ``(y, result)``. ``y`` is ``sigmoid(np.dot(test_data, W) + b)``.
        For a single prediction ``result`` is the int 1 when ``y >= 0.5`` and
        0 otherwise; for several predictions it is an integer array of the
        same shape as ``y`` holding that 1/0 decision per entry.
    """
    z = np.dot(test_data, W) + b
    y = sigmoid(z)

    if np.size(y) == 1:
        # Single prediction: keep the plain-int result callers already get.
        result = 1 if y >= 0.5 else 0
    else:
        # Several predictions: truth-testing the whole array would raise
        # ValueError, so threshold element-wise instead.
        result = (y >= 0.5).astype(int)

    return y, result

In [6]:
# Scale factor applied to each numerical gradient in the updates below.
# NOTE(review): the original note here said 1e-2 and 1e-3 make the loss
# diverge, yet this cell trains with 1e-2 -- confirm which rates were meant.
learning_rate = 1e-2

# x_data and t_data are plain lists, so convert them to NumPy arrays first;
# the targets are reshaped into a column with one row per sample.

input_xdata = np.array(x_data)
input_tdata = np.array(t_data).reshape(len(t_data), 1)

# The argument is ignored: loss_func reads the module-level W and b, which
# numerical_derivative perturbs in place while it evaluates f.
f = lambda x : loss_func(input_xdata, input_tdata)

print("Initial error value = ", error_val(input_xdata, input_tdata) )

start_time = datetime.now()

for step in  range(100001):  
    
    # Gradient-descent update of W, then of b (b sees the updated W).
    W -= learning_rate * numerical_derivative(f, W)
    
    b -= learning_rate * numerical_derivative(f, b)
    
    # Report the loss every 1000 steps.
    if (step % 1000 == 0):
        print("step = ", step, "error value = ", error_val(input_xdata, input_tdata) )
        
        
end_time = datetime.now()

print("")
print("Elapsed Time => ", end_time - start_time) 

Initial error value =  40.98626644276797
step =  0 error value =  30.542417062652888
step =  1000 error value =  1.3788796832571937
step =  2000 error value =  0.9654651872091095
step =  3000 error value =  0.7853023375711337
step =  4000 error value =  0.6774090835365838
step =  5000 error value =  0.6023800628206787
step =  6000 error value =  0.545587332330889
step =  7000 error value =  0.500245388136067
step =  8000 error value =  0.4627309075859041
step =  9000 error value =  0.43090825044786896
step =  10000 error value =  0.40342022418749096
step =  11000 error value =  0.3793505660643608
step =  12000 error value =  0.358049318380275
step =  13000 error value =  0.3390364715241446
step =  14000 error value =  0.3219458225703187
step =  15000 error value =  0.3064906238867267
step =  16000 error value =  0.2924416003833731
step =  17000 error value =  0.2796122988403132
step =  18000 error value =  0.26784896580687645
step =  19000 error value =  0.25702333193370347
step =  200

In [7]:
# Ask the trained model about (preview time, review time) = (3, 17).
test_data = np.array([3, 17])

real_val, logical_val = predict(test_data)

print(real_val, logical_val)

[0.15447241] 0


In [8]:
# Ask the trained model about (preview time, review time) = (5, 8).
test_data = np.array([5, 8])

real_val, logical_val = predict(test_data)

print(real_val, logical_val)

[0.00071321] 0


In [9]:
# Ask the trained model about (preview time, review time) = (7, 21).
test_data = np.array([7, 21])

real_val, logical_val = predict(test_data)

print(real_val, logical_val)

[0.99999642] 1


In [10]:
# Ask the trained model about (preview time, review time) = (12, 0).
test_data = np.array([12, 0])

real_val, logical_val = predict(test_data)

print(real_val, logical_val)

[0.59979436] 1


In [11]:
# Show the current values of the weight matrix W and the bias b.
print('W = ', W, ', b = ', b)

W =  [[2.40866577]
 [1.15137872]] , b =  [-28.49938086]
