### 학습과 시각화에 필요한 라이브러리 임포트

In [1]:
import tensorflow as tf
from tensorflow.keras import datasets, layers, models
from tensorflow import keras
import numpy as np
import matplotlib.pyplot as plt

print(tf.__version__)

2.3.1


### 데이터

In [2]:
(train_images, train_labels), (test_images, test_labels) = datasets.mnist.load_data()

train_images = train_images.reshape((60000, 28, 28, 1))
test_images = test_images.reshape((10000, 28, 28, 1))

# 픽셀 값을 0~1 사이로 정규화합니다.
train_images, test_images = train_images / 255.0, test_images / 255.0

### 모델 구성 (CNN - 총 5층 layer 구성)

In [3]:
prototype_model = models.Sequential()
prototype_model.add(layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)))
prototype_model.add(layers.MaxPooling2D((2, 2)))
prototype_model.add(layers.Conv2D(64, (3, 3), activation='relu'))
prototype_model.add(layers.MaxPooling2D((2, 2)))
prototype_model.add(layers.Conv2D(64, (3, 3), activation='relu'))

prototype_model.add(layers.Flatten())
prototype_model.add(layers.Dense(64, activation='relu'))
prototype_model.add(layers.Dense(10, activation='softmax'))

prototype_model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d (Conv2D)              (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_2 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten (Flatten)            (None, 576)               0         
_________________________________________________________________
dense (Dense)                (None, 64)                3

### 모델 학습

In [4]:
prototype_model.compile(optimizer='adam',
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

prototype_model.fit(train_images, train_labels, epochs=5)

proto_test_loss, proto_test_acc = prototype_model.evaluate(test_images,  test_labels, verbose=2)

print(proto_test_acc)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
313/313 - 1s - loss: 0.0291 - accuracy: 0.9913
0.9912999868392944


### Regularization - l2 기법

In [5]:
l2_model = models.Sequential()
l2_model.add(layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)))
l2_model.add(layers.MaxPooling2D((2, 2)))
l2_model.add(layers.Conv2D(64, (3, 3), activation='relu'))
l2_model.add(layers.MaxPooling2D((2, 2)))
l2_model.add(layers.Conv2D(64, (3, 3), activation='relu'))

l2_model.add(layers.Flatten())
l2_model.add(layers.Dense(64, activation='relu'))
l2_model.add(layers.Dense(10, activation='softmax'))

l2_model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_3 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_4 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_3 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_5 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten_1 (Flatten)          (None, 576)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 64)               

### 모델 학습

In [6]:
l2_model.compile(optimizer='adam',
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

l2_model.fit(train_images, train_labels, epochs=5)

l2_test_loss, l2_test_acc = l2_model.evaluate(test_images,  test_labels, verbose=2)

print(l2_test_acc)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
313/313 - 1s - loss: 0.0271 - accuracy: 0.9913
0.9912999868392944


### Regularization - 드롭아웃 기법

In [4]:
dpt_model = models.Sequential()
dpt_model.add(layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)))
dpt_model.add(layers.MaxPooling2D((2, 2)))

dpt_model.add(layers.Conv2D(64, (3, 3), activation='relu'))
dpt_model.add(layers.MaxPooling2D((2, 2)))
dpt_model.add(layers.Conv2D(64, (3, 3), activation='relu'))

dpt_model.add(layers.Flatten())
dpt_model.add(layers.Dense(64, activation='relu'))
dpt_model.add(layers.Dropout(0.5))
dpt_model.add(layers.Dense(64, activation='relu'))
dpt_model.add(layers.Dropout(0.25))
dpt_model.add(layers.Dense(10, activation='softmax'))

dpt_model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_3 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_4 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_3 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_5 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten_1 (Flatten)          (None, 576)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 64)               

### 모델 학습 

In [5]:
dpt_model.compile(optimizer='adam',
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

dpt_model.fit(train_images, train_labels, epochs=20)

dpt_test_loss, dpt_test_acc = dpt_model.evaluate(test_images,  test_labels, verbose=2)

print(dpt_test_acc)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
313/313 - 1s - loss: 0.0577 - accuracy: 0.9922
0.9922000169754028
