In [1]:
''' CNN MNIST digits classification

CNN with 3 convolutional layers for MNIST digits classification
First 2 layers - Conv2D-ReLU-MaxPool
3rd layer - Conv2D-ReLU-Dropout
Output layer - Dense(10)
Output Activation - softmax
Optimizer - Adam

https://github.com/PacktPublishing/Advanced-Deep-Learning-with-Keras
'''

import numpy as np
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Activation, Dense, Dropout
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten
from tensorflow.keras.utils import to_categorical, plot_model
from tensorflow.keras.datasets import mnist

In [2]:
# Load the MNIST dataset.
# load_data() returns ((x_train, y_train), (x_test, y_test)); flatten the two
# pairs into four names in that same order.
x_train, y_train, x_test, y_test = (
    array for split in mnist.load_data() for array in split
)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


In [3]:
# Count the number of distinct labels present in the training targets.
num_labels = np.unique(y_train).size

In [4]:
# Convert the integer class labels to one-hot vectors.
# num_classes is passed explicitly: without it, to_categorical infers the
# vector width from the largest label of each array separately, so the train
# and test encodings could end up with different widths if one split lacked
# the highest class.
y_train = to_categorical(y_train, num_classes=num_labels)
y_test = to_categorical(y_test, num_classes=num_labels)

In [5]:
# Input image dimension: length of axis 1 of the training images.
image_size = np.shape(x_train)[1]

In [6]:
# Resize and normalize:
# add a trailing channel axis -> (-1, image_size, image_size, 1),
# cast to float32 and divide by 255.
x_train = x_train.reshape(-1, image_size, image_size, 1).astype('float32') / 255
x_test = x_test.reshape(-1, image_size, image_size, 1).astype('float32') / 255

In [7]:
# Network hyperparameters.
# Images are fed in as-is (square, grayscale): height x width x 1 channel.
input_shape = (image_size, image_size, 1)

# Convolution / pooling settings.
filters = 64
kernel_size = 3
pool_size = 2

# Regularization and training settings.
dropout = 0.2
batch_size = 128

In [8]:
# Model: stack Conv2D(ReLU) -> MaxPooling2D twice, then a third Conv2D(ReLU),
# and flatten the result so it can feed the layers added in later cells.
model = Sequential([
    Conv2D(filters=filters, kernel_size=kernel_size, activation='relu',
           input_shape=input_shape),
    MaxPooling2D(pool_size),
    Conv2D(filters=filters, kernel_size=kernel_size, activation='relu'),
    MaxPooling2D(pool_size),
    Conv2D(filters=filters, kernel_size=kernel_size, activation='relu'),
    Flatten(),
])

In [9]:
# Regularizer: dropout applied to the flattened features.
model.add(Dropout(rate=dropout))

In [None]:
# Output: one unit per label (a 10-dimensional one-hot target for MNIST),
# followed by a separate softmax activation layer.
model.add(Dense(units=num_labels))
model.add(Activation(activation='softmax'))

# Print the layer table, then write the architecture diagram to disk.
model.summary()
plot_model(model=model, to_file='cnn-mnist.png', show_shapes=True)

In [11]:
# Compile settings:
#   loss      - categorical cross-entropy (targets are one-hot vectors)
#   optimizer - adam
#   metric    - accuracy, for classification
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [None]:
# Train the network on the training set for 10 epochs.
model.fit(x=x_train, y=y_train, batch_size=batch_size, epochs=10)

In [None]:
# Check generalization on the held-out test dataset (silent evaluation).
loss, acc = model.evaluate(
    x=x_test,
    y=y_test,
    batch_size=batch_size,
    verbose=0,
)
print("\nTest accuracy: %.1f%%" % (100.0 * acc))