In [1]:
import numpy as np

loaded_data = np.loadtxt('./data-01-test-score.csv', delimiter=',', dtype=np.float32)

x_data = loaded_data[ :, 0:-1]
t_data = loaded_data[ :, [-1]]

# 데이터 차원 및 shape 확인
print("x_data.ndim = ", x_data.ndim, ", x_data.shape = ", x_data.shape)
print("t_data.ndim = ", t_data.ndim, ", t_data.shape = ", t_data.shape) 

x_data.ndim =  2 , x_data.shape =  (25, 3)
t_data.ndim =  2 , t_data.shape =  (25, 1)


In [5]:
loaded_data[:5,:]

array([[ 73.,  80.,  75., 152.],
       [ 93.,  88.,  93., 185.],
       [ 89.,  91.,  90., 180.],
       [ 96.,  98., 100., 196.],
       [ 73.,  66.,  70., 142.]], dtype=float32)

In [6]:
W = np.random.rand(3,1)  # 3X1 행렬
b = np.random.rand(1)  
print("W = ", W.tolist(), ", W.shape = ", W.shape, ", b = ", b, ", b.shape = ", b.shape)

W =  [[0.2131452973781799], [0.6652085608228322], [0.2765537062418685]] , W.shape =  (3, 1) , b =  [0.74876388] , b.shape =  (1,)


In [7]:
def loss_func(x, t):
    y = np.dot(x,W) + b
    
    return ( np.sum( (t - y)**2 ) ) / ( len(x) )

In [8]:
def numerical_derivative(f, x):
    delta_x = 1e-4 # 0.0001
    grad = np.zeros_like(x)
    
    it = np.nditer(x, flags=['multi_index'], op_flags=['readwrite'])
    
    while not it.finished:
        idx = it.multi_index        
        tmp_val = x[idx]
        x[idx] = float(tmp_val) + delta_x
        fx1 = f(x) # f(x+delta_x)
        
        x[idx] = tmp_val - delta_x 
        fx2 = f(x) # f(x-delta_x)
        grad[idx] = (fx1 - fx2) / (2*delta_x)
        
        x[idx] = tmp_val 
        it.iternext()   
        
    return grad

In [9]:
# 손실함수 값 계산 함수
# 입력변수 x, t : numpy type
def error_val(x, t):
    y = np.dot(x,W) + b
    
    return ( np.sum( (t - y)**2 ) ) / ( len(x) )

# 학습을 마친 후, 임의의 데이터에 대해 미래 값 예측 함수
# 입력변수 x : numpy type
def predict(x):
    y = np.dot(x,W) + b
    
    return y

In [10]:
learning_rate = 1e-5  # 1e-2, 1e-3 은 손실함수 값 발산

f = lambda x : loss_func(x_data,t_data)

print("Initial error value = ", error_val(x_data, t_data),'\t', " Initial W = ", W.tolist(),'\t', " b = ", b)

for step in  range(10000001):  
    
    W -= learning_rate * numerical_derivative(f, W)
    
    b -= learning_rate * numerical_derivative(f, b)
    
    if (step % 100000 == 0):
        print("step = ", step,'\t', "error value = ", error_val(x_data, t_data),'\t', "W = ", W.tolist(),'\t', " b = ",b )

Initial error value =  4883.641487226056 	  Initial W =  [[0.2131452973781799], [0.6652085608228322], [0.2765537062418685]] 	  b =  [0.74876388]
step =  0 	 error value =  1816.5065591537068 	 W =  [[0.32457711884638424], [0.7770952194440202], [0.3914891762315006]] 	  b =  [0.74960337]
step =  100000 	 error value =  6.200483166115918 	 W =  [[0.35599051018135086], [0.5287702603831252], [1.1218463026855108]] 	  b =  [0.56225937]
step =  200000 	 error value =  6.1661400520210305 	 W =  [[0.3559885320394247], [0.5292903534654597], [1.123571230071978]] 	  b =  [0.37695882]
step =  300000 	 error value =  6.1343461287847925 	 W =  [[0.35598662873034564], [0.5297907719012019], [1.1252309050315783]] 	  b =  [0.19866802]
step =  400000 	 error value =  6.1049121772811485 	 W =  [[0.35598479742176314], [0.5302722599649333], [1.1268277960047512]] 	  b =  [0.0271218]
step =  500000 	 error value =  6.077663023577181 	 W =  [[0.3559830353898059], [0.5307355337754239], [1.1283642780523575]] 	  b 

In [46]:
test_data = np.array([100, 98, 81])

predict(test_data) 

array([178.86235518])