## 3.6 Three-layer neural network (inference on MNIST)

In [1]:
import sys, os  # path
sys.path.append(os.pardir)

import numpy as np
import pickle
import Activation_function as fts
from dataset.mnist import load_mnist

In [2]:
# Load MNIST
def get_data():
    """Return the test split of MNIST as ``(x_test, t_test)``.

    ``load_mnist`` is called with ``normalize=True``, ``flatten=True`` and
    ``one_hot_label=False``; the training split it also returns is discarded.
    The exact meaning of those flags is defined in ``dataset.mnist`` and is
    not visible from this notebook.
    """
    mnist = load_mnist(flatten=True, normalize=True, one_hot_label=False)

    # load_mnist yields ((train images, train labels), (test images, test labels));
    # only the second pair is needed for inference.
    (_, _), test_split = mnist
    images, labels = test_split
    return images, labels

In [3]:
# Load weight and bias
# Read the trained weight parameters
def init_network(path="sample_weight.pkl"):
    """Load the pre-trained network parameters from a pickle file.

    Args:
        path: Pickle file to read. Defaults to "sample_weight.pkl", resolved
            against the current working directory (the location that was
            previously hard-coded), so existing ``init_network()`` calls
            behave exactly as before.

    Returns:
        The unpickled object. ``predict`` in this notebook indexes it with
        the keys 'W1', 'W2', 'W3', 'b1', 'b2' and 'b3'.

    Raises:
        OSError: If the file cannot be opened (e.g. FileNotFoundError).
    """
    # SECURITY: pickle.load can execute arbitrary code embedded in the file.
    # Only point this at weight files that come from a trusted source.
    with open(path, 'rb') as f:
        return pickle.load(f)

In [4]:
# predict
def predict(network, x):
    """Run the forward pass of the three-layer network and return its output.

    Args:
        network: Mapping holding the parameters under the keys
            'W1', 'W2', 'W3' (weights) and 'b1', 'b2', 'b3' (biases).
        x: Input passed to the first ``np.dot``. This notebook calls it both
            with a single sample (``x[i]``) and with a slice of samples
            (``x[i:i+batch_size]``).

    Returns:
        The result of ``fts.softmax`` applied to the third affine layer.
    """
    # Fetch every parameter up front, weights first and then biases.
    weights = [network[key] for key in ('W1', 'W2', 'W3')]
    biases = [network[key] for key in ('b1', 'b2', 'b3')]

    # Layers 1 and 2: affine transform followed by the sigmoid activation.
    activation = x
    for weight, bias in zip(weights[:2], biases[:2]):
        activation = fts.sigmoid(np.dot(activation, weight) + bias)

    # Output layer: affine transform followed by softmax.
    scores = np.dot(activation, weights[2]) + biases[2]
    return fts.softmax(scores)

In [5]:
# Main: score the network on the test set, one sample per forward pass.
x, t = get_data()
network = init_network()

# Accuracy check
accuracy_cnt = 0
for i in range(len(x)):
    y = predict(network, x[i])
    p = np.argmax(y)   # index of the element with the highest probability
    # Count the sample only when the predicted index matches its label.
    accuracy_cnt += 1 if p == t[i] else 0

# Fraction of samples classified correctly.
print('Accuracy: ' + str(accuracy_cnt / len(x)))

Accuracy: 0.9352


### Accuracy check with batch processing

In [7]:
# Main: same evaluation as above, but `batch_size` samples per forward pass.
x, t = get_data()
network = init_network()

# Accuracy check with batch
accuracy_cnt = 0
batch_size = 100

for i in range(0, len(x), batch_size):
    # The final slice is simply shorter if len(x) is not a multiple of batch_size.
    x_batch = x[i:i + batch_size]
    t_batch = t[i:i + batch_size]

    y_batch = predict(network, x_batch)
    # axis=1: take the arg-max along each row of the batched output.
    p = np.argmax(y_batch, axis=1)
    # Summing the element-wise comparison counts the matches in this batch.
    accuracy_cnt += np.sum(p == t_batch)

print('Accuracy: ' + str(float(accuracy_cnt) / len(x)))

Accuracy: 0.9352


## 4.2 Loss function

In [19]:
# Two example 10-element outputs (each sums to 1) and a one-hot target.
# y1 puts its largest value (0.6) on index 2, y2 puts it on index 7.
y1 = np.array([
    0.1, 0.05, 0.6, 0.0, 0.05,
    0.1, 0.0, 0.1, 0.0, 0.0,
])
y2 = np.array([
    0.1, 0.05, 0.1, 0.0, 0.05,
    0.1, 0.0, 0.6, 0.0, 0.0,
])
# One-hot encoding: the single 1 sits at index 2.
t = np.array([0, 0, 1] + [0] * 7)

In [20]:
# MSE

def mean_square_error(y, t):
    """Return half the sum of squared differences between ``y`` and ``t``.

    Note that, despite the name, the sum is not divided by the number of
    elements; the only scaling is the factor 0.5.

    Args:
        y: Array of outputs.
        t: Array of targets; combined with ``y`` by ``y - t``.

    Returns:
        ``0.5 * sum((y - t) ** 2)`` taken over all elements.
    """
    residual = y - t
    squared = residual * residual
    return 0.5 * np.sum(squared)

In [21]:
# Error of each example output against the same target, one value per line.
print(mean_square_error(y1, t), mean_square_error(y2, t), sep='\n')

0.09750000000000003
0.5975


In [22]:
# Cross Entropy Error

def cross_entropy_error(y, t):
    """Return the cross-entropy ``-sum(t * log(y + 1e-7))``.

    Args:
        y: Array of outputs whose logarithm is taken.
        t: Array of targets multiplied element-wise with the log values.

    Returns:
        The negated sum over all elements of ``t * log(y + 1e-7)``.
    """
    # Small offset so that an entry of exactly 0 in y does not produce log(0).
    eps = 1e-7
    log_y = np.log(y + eps)
    return -np.sum(t * log_y)

In [23]:
# Error of each example output against the same target, one value per line.
print(cross_entropy_error(y1, t), cross_entropy_error(y2, t), sep='\n')

0.510825457099338
2.302584092994546
