In [1]:
import numpy as np

# Toy 1-D binary classification set: the ten even inputs 2, 4, ..., 20,
# stored one sample per row.
x_data = np.arange(2, 21, 2).reshape(-1, 1)

# Targets: 0 for the first six inputs (2..12), 1 for the last four (14..20).
t_data = np.array([0] * 6 + [1] * 4).reshape(-1, 1)

print("x_data.shape = ", x_data.shape, ", t_data.shape = ", t_data.shape)


x_data.shape =  (10, 1) , t_data.shape =  (10, 1)


In [2]:
# Fixed seed so that "Restart Kernel -> Run All" always starts training from
# the same initial parameters (the unseeded draw gave different values on
# every run).
SEED = 0
rng = np.random.default_rng(SEED)

W = rng.random((1, 1))  # weight, shape (1, 1), uniform in [0, 1)
b = rng.random(1)       # bias, shape (1,), uniform in [0, 1)

print("W = ", W, ", W.shape = ", W.shape, ", b = ", b, ", b.shape = ", b.shape)

W =  [[0.35564794]] , W.shape =  (1, 1) , b =  [0.28020983] , b.shape =  (1,)


In [3]:
def sigmoid(x) :
  """Return the logistic function 1 / (1 + exp(-x)), element-wise.

  The value is computed from exp(-|x|), which never exceeds 1, so large
  negative inputs no longer overflow inside np.exp (the direct formula
  emits a RuntimeWarning there).

  Args:
    x: scalar or array-like. Non-floating input is converted to float.

  Returns:
    A NumPy scalar for scalar input, otherwise an array shaped like x.
  """
  x = np.asarray(x)
  if not np.issubdtype(x.dtype, np.floating):
    x = x.astype(float)

  e = np.exp(-np.abs(x))  # always in (0, 1]

  # x >= 0: 1 / (1 + exp(-x));  x < 0: exp(x) / (1 + exp(x)) -- same function.
  y = np.where(x >= 0, 1 / (1 + e), e / (1 + e))

  # Indexing with () turns a 0-d result back into a scalar and leaves
  # arrays of any other rank unchanged.
  return y[()]

def loss_func(x, t) :
  """Summed binary cross-entropy of sigmoid(x . W + b) against targets t.

  W and b are read from the module-level variables of the same name, not
  passed in as arguments.
  """
  eps = 1e-7  # added inside each log() so the argument is never exactly 0

  y = sigmoid(np.dot(x, W) + b)

  log_y = np.log(y + eps)
  log_not_y = np.log((1 - y) + eps)

  return -np.sum( t*log_y + (1-t)*log_not_y )


In [4]:
def numerical_derivative(f, x, delta_x=1e-4):
    """Estimate the gradient of f with respect to x by central differences.

    Each element of x is perturbed IN PLACE by +delta_x and then -delta_x,
    f(x) is evaluated after each perturbation, and the element is restored
    afterwards. Because the perturbation is in place, f may ignore its
    argument and read the same array through another reference.

    Args:
        f: callable taking x and returning a scalar.
        x: floating-point np.ndarray; temporarily modified, restored on exit
            (also when f raises).
        delta_x: perturbation size used for the central difference.

    Returns:
        Array with the same shape and dtype as x holding
        (f(x + delta_x) - f(x - delta_x)) / (2 * delta_x) per element.

    Raises:
        TypeError: if x is not a floating-point ndarray. An integer array
            would truncate the perturbation and silently give a zero gradient.
    """
    if not (isinstance(x, np.ndarray) and np.issubdtype(x.dtype, np.floating)):
        raise TypeError(
            "numerical_derivative requires a floating-point numpy array for x"
        )

    grad = np.zeros_like(x)

    for idx in np.ndindex(x.shape):
        original = x[idx]
        try:
            x[idx] = float(original) + delta_x
            fx_plus = f(x)   # f(x + delta_x)

            x[idx] = float(original) - delta_x
            fx_minus = f(x)  # f(x - delta_x)
        finally:
            # Always undo the perturbation so a failing f cannot leave x
            # permanently shifted.
            x[idx] = original

        grad[idx] = (fx_plus - fx_minus) / (2 * delta_x)

    return grad

In [5]:
def error_val(x, t) :
  """Return the current cross-entropy error for inputs x and targets t.

  This is the same quantity loss_func computes, so it delegates to
  loss_func instead of keeping a second copy of the formula. The value
  reported during training is then always the objective being minimised.
  """
  return loss_func(x, t)

def predict(x) :
  """Evaluate the model sigmoid(x . W + b) and threshold it at 0.5.

  W and b are read from the module-level variables of the same name.

  Args:
    x: a single input value or an array of inputs accepted by np.dot(x, W).

  Returns:
    (y, result): y is the sigmoid output. For a single sample result is
    the plain int 0 or 1; for several samples it is an integer array of
    0/1 labels shaped like y.
  """
  z = np.dot(x, W) + b
  y = sigmoid(z)

  # Element-wise threshold; a bare `if y >= 0.5` is ambiguous (ValueError)
  # as soon as y holds more than one value.
  labels = (np.asarray(y) >= 0.5).astype(int)

  if labels.size == 1 :
    result = int(labels.item())
  else :
    result = labels

  return y, result


In [9]:
learning_rate = 1e-2  # gradient-descent step size
num_steps = 10001     # number of parameter updates
log_interval = 400    # print progress every this many steps


def f(_) :
  # numerical_derivative perturbs W / b in place and loss_func reads those
  # globals directly, so the argument passed in is not needed here.
  return loss_func(x_data, t_data)


print("Initial error value = ", error_val(x_data, t_data), ", Initial W =", W, "\n", ", Initial b = ", b)

for step in range(num_steps) :

  # Update W first; the gradient for b is then taken with the updated W.
  grad_W = numerical_derivative(f, W)
  W -= learning_rate * grad_W

  grad_b = numerical_derivative(f, b)
  b -= learning_rate * grad_b

  if step % log_interval != 0 :
    continue

  print("step = ", step, ", error value = ", error_val(x_data, t_data), ", W = ", W, ", b= ", b)

Initial error value =  7.817628107102061 , Initial W = [[-0.03963378]] 
 , Initial b =  [0.27404671]
step =  0 , error value =  10.042074926128882 , W =  [[0.16647765]] , b=  [0.22825765]
step =  400 , error value =  2.9540135757391806 , W =  [[0.43275542]] , b=  [-4.23144316]
step =  800 , error value =  1.7650842801967501 , W =  [[0.45811841]] , b=  [-5.70447675]
step =  1200 , error value =  1.50716102770492 , W =  [[0.5343273]] , b=  [-6.71908142]
step =  1600 , error value =  1.3451678277577424 , W =  [[0.5949441]] , b=  [-7.52392171]
step =  2000 , error value =  1.230610224670257 , W =  [[0.64604279]] , b=  [-8.20091894]
step =  2400 , error value =  1.1436302967152177 , W =  [[0.69064867]] , b=  [-8.79085593]
step =  2800 , error value =  1.0743898273356727 , W =  [[0.7305036]] , b=  [-9.31719264]
step =  3200 , error value =  1.017380595541101 , W =  [[0.76670961]] , b=  [-9.79475597]
step =  3600 , error value =  0.9692429330976344 , W =  [[0.80001191]] , b=  [-10.2335605]
st

In [10]:
# Evaluate the model at x = 3 using the current global W and b. predict
# returns the sigmoid output and the 0/1 label from thresholding it at 0.5.
# In the training data every input up to 12 is labelled 0.
real_val, logical_val = predict(3)

print(real_val, logical_val)

[[1.1106865e-05]] 0


In [11]:
# Evaluate the model at x = 17 using the current global W and b. predict
# returns the sigmoid output and the 0/1 label from thresholding it at 0.5.
# In the training data every input from 14 upward is labelled 1.
real_val, logical_val = predict(17)

print(real_val, logical_val)

[[0.99131522]] 1
