### 4개의 입력데이터 연산 (A1-A2+A3-A4)을 예측하는 Linear Regression Batch 예제

### data definition

In [2]:
import numpy as np
from datetime import datetime

# Read the whole CSV file into a single float32 matrix.
loaded_data = np.loadtxt('../Data/sps.csv', dtype=np.float32, delimiter=',')

# Column 0 is kept as a 2-D target column; the remaining columns are the inputs.
t_data = loaded_data[:, [0]]
x_data = loaded_data[:, 1:]

# Report the rank and shape of each array.
print("loaded_data.ndim = ", np.ndim(loaded_data), ", loaded_data.shape = ", np.shape(loaded_data))
print("x_data.ndim = ", np.ndim(x_data), ", x_data.shape = ", np.shape(x_data))
print("t_data.ndim = ", np.ndim(t_data), ", t_data.shape = ", np.shape(t_data))

loaded_data.ndim =  2 , loaded_data.shape =  (50, 5)
x_data.ndim =  2 , x_data.shape =  (50, 4)
t_data.ndim =  2 , t_data.shape =  (50, 1)


## initialize weights and bias

In [3]:
# Seed the global NumPy RNG so the initial parameters are reproducible.
np.random.seed(0)

# Draw order matters for reproducibility: the weights first, then the bias.
W = np.random.random_sample((4, 1))  # 4x1 weight matrix
b = np.random.random_sample(1)  # bias, shape (1,)
print("W = ", W, ", W.shape = ", np.shape(W), ", b = ", b, ", b.shape = ", np.shape(b))

W =  [[0.5488135 ]
 [0.71518937]
 [0.60276338]
 [0.54488318]] , W.shape =  (4, 1) , b =  [0.4236548] , b.shape =  (1,)


## define loss function and output, y

In [4]:
def loss_func(x, t):
    """Return the mean squared error of the linear model on ``(x, t)``.

    The prediction is ``np.dot(x, W) + b``, using the module-level weight
    ``W`` and bias ``b``. The summed squared residual is divided by
    ``len(x)``, i.e. the size of the first axis of ``x``.
    """
    prediction = np.dot(x, W) + b
    residual = t - prediction
    squared_error_total = np.sum(residual ** 2)
    return squared_error_total / len(x)

In [5]:
def numerical_derivative(f, x):
    """Approximate the gradient of ``f`` with respect to every element of ``x``.

    Uses the central difference ``(f(x + h) - f(x - h)) / (2 * h)`` with
    ``h = 1e-4``, one element at a time.

    Args:
        f: Callable invoked as ``f(x)`` that returns a scalar.
        x: NumPy array (any rank, including 0-d or empty) holding the
            parameters. It is perturbed IN PLACE while ``f`` is evaluated, so
            ``f`` may also observe the perturbation through another reference
            to the same array (e.g. a global). Every element is restored
            before this function returns or propagates an exception.
            NOTE: ``x`` should have a floating-point dtype; with an integer
            dtype the +/- ``h`` perturbation is truncated when stored.

    Returns:
        An array with the same shape and dtype as ``x`` (``np.zeros_like``)
        holding the estimated partial derivatives. An empty ``x`` yields an
        empty gradient.
    """
    delta_x = 1e-4  # 0.0001
    grad = np.zeros_like(x)

    # np.ndindex visits every index tuple; it yields nothing for an empty
    # array and a single () for a 0-d array.
    for idx in np.ndindex(x.shape):
        original = x[idx]
        try:
            x[idx] = float(original) + delta_x
            fx_plus = f(x)  # f(x + delta_x)

            x[idx] = float(original) - delta_x
            fx_minus = f(x)  # f(x - delta_x)
        finally:
            # Always undo the perturbation, even if f raised, so the caller's
            # parameters are never left corrupted.
            x[idx] = original

        grad[idx] = (fx_plus - fx_minus) / (2 * delta_x)

    return grad

In [6]:
def error_val(x, t):
    """Compute the current loss value for the batch ``(x, t)``.

    Both ``x`` and ``t`` are NumPy arrays. The model output is
    ``np.dot(x, W) + b`` with the module-level ``W`` and ``b``; the result is
    the sum of squared differences divided by ``len(x)``.
    """
    squared_diff = (t - (np.dot(x, W) + b)) ** 2
    total = np.sum(squared_diff)
    return total / len(x)

## learning

최적의 하이퍼파라미터  
lr = 1e-2  
epoch = 2000 (아래 학습 셀은 30001 step까지 수행하지만, 출력을 보면 step 2000에서 error value가 이미 약 1.2e-20까지 감소한다)

In [7]:
# Gradient-descent training of W and b using numerically estimated gradients.
learning_rate = 1e-2 # 1e-3 is left here as a commented-out alternative value

# f deliberately ignores its argument: loss_func reads the module-level W and b.
# numerical_derivative perturbs the array it is given (W or b) in place, so the
# perturbation is visible to loss_func through those same global arrays.
f = lambda x : loss_func(x_data,t_data)

print("Initial error value = ", error_val(x_data, t_data), "Initial W = ", W, "\n", ", b = ", b )

start_time = datetime.now()

for step in  range(30001):    # repeat the update 30001 times (steps 0..30000)
    
    # In-place update of W; the gradient for b below is then evaluated with
    # the already-updated W.
    W -= learning_rate * numerical_derivative(f, W)
    
    b -= learning_rate * numerical_derivative(f, b)
    
    # Report progress every 500 steps.
    if (step % 500 == 0):
        print("step = ", step, "error value = ", error_val(x_data, t_data), ' w = ', W, ' b = ', b )
        
end_time = datetime.now()
        
print("")
print("Elapsed Time => ", end_time - start_time)

Initial error value =  64.38302549674624 Initial W =  [[0.5488135 ]
 [0.71518937]
 [0.60276338]
 [0.54488318]] 
 , b =  [0.4236548]
step =  0 error value =  33.91925396320136  w =  [[0.43310237]
 [0.31925416]
 [0.47404918]
 [0.10489796]]  b =  [0.38130549]
step =  500 error value =  1.1402962624026252e-06  w =  [[ 0.99982264]
 [-1.00015027]
 [ 0.9999808 ]
 [-1.000054  ]]  b =  [0.00144918]
step =  1000 error value =  2.5047031755403355e-11  w =  [[ 0.99999917]
 [-1.0000007 ]
 [ 0.99999991]
 [-1.00000025]]  b =  [6.79191219e-06]
step =  1500 error value =  5.501673661157898e-16  w =  [[ 1.]
 [-1.]
 [ 1.]
 [-1.]]  b =  [3.18318109e-08]
step =  2000 error value =  1.2084681492942894e-20  w =  [[ 1.]
 [-1.]
 [ 1.]
 [-1.]]  b =  [1.491869e-10]
step =  2500 error value =  2.658823046021455e-25  w =  [[ 1.]
 [-1.]
 [ 1.]
 [-1.]]  b =  [6.9964243e-13]
step =  3000 error value =  1.6225740905060764e-29  w =  [[ 1.]
 [-1.]
 [ 1.]
 [-1.]]  b =  [4.70002234e-15]
step =  3500 error value =  5.43064

## evaluate and predict

In [8]:
def predict(x):
    """Return the model's prediction for input ``x`` after training.

    ``x`` is a NumPy array; the output is ``np.dot(x, W) + b`` computed with
    the module-level weight ``W`` and bias ``b``.
    """
    return np.dot(x, W) + b

In [10]:
# Expected value under the A1 - A2 + A3 - A4 rule: 4 - 4 + 4 - 4 = 0
ex_data_01 = np.array([4, 4, 4, 4])

print("predicted value = ", predict(ex_data_01) ) 

predicted value =  [-2.89877461e-15]


In [11]:
# Expected value under the A1 - A2 + A3 - A4 rule: -3 - 0 + 9 - (-1) = 7
ex_data_02 = np.array([-3, 0, 9, -1])

print("predicted value = ", predict(ex_data_02) ) 

predicted value =  [7.]


In [12]:
# Expected value under the A1 - A2 + A3 - A4 rule: -7 - (-9) + (-2) - 8 = -8
ex_data_03 = np.array([-7, -9, -2, 8])

print("predicted value = ", predict(ex_data_03) ) 

predicted value =  [-8.]


In [13]:
# Expected value under the A1 - A2 + A3 - A4 rule: 1 - (-2) + 3 - (-2) = 8
ex_data_04 = np.array([1, -2, 3, -2])

print("predicted value = ", predict(ex_data_04) ) 

predicted value =  [8.]


In [14]:
# Expected value under the A1 - A2 + A3 - A4 rule: 19 - (-12) + 0 - (-76) = 107
ex_data_05 = np.array([19, -12, 0, -76])

print("predicted value = ", predict(ex_data_05) ) 

predicted value =  [107.]


In [15]:
# Expected value under the A1 - A2 + A3 - A4 rule: 2001 - (-1) + 109 - 31 = 2080
ex_data_06 = np.array([2001, -1, 109, 31])

print("predicted value = ", predict(ex_data_06) ) 

predicted value =  [2080.]


In [16]:
# Expected value under the A1 - A2 + A3 - A4 rule:
# 99999 - (-8911) + 10009 - 1231331 = -1112412
ex_data_07 = np.array([99999, -8911, 10009, 1231331])

print("predicted value = ", predict(ex_data_07) ) 

predicted value =  [-1112412.]
