# MNIST 손글씨 - CNN v2


 - 2 Conv2D layers
 - 1 MaxPooling2D layer
 - 1 Fully Connected Network layer
 - 1 Output layer

In [None]:
import numpy as np
import tensorflow as tf
# Seed both TensorFlow and NumPy with the same value so that repeated runs
# of this notebook start from the same random state.
seed = 2022
tf.random.set_seed(seed)
np.random.seed(seed)

- 데이터 전처리

In [None]:
from tensorflow.keras.datasets import mnist

# load_data() yields a (train, test) pair, each an (images, labels) pair.
_train_split, _test_split = mnist.load_data()
X_train, y_train = _train_split
X_test, y_test = _test_split
del _train_split, _test_split  # leave only the four arrays in the namespace

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


In [None]:
# X data: divide by 255 to bring values into the 0-1 range and append a
# channel axis (3-D image stack ==> 4-D array of shape (N, 28, 28, 1)).
X_train, X_test = (
    images.reshape(-1, 28, 28, 1) / 255.
    for images in (X_train, X_test)
)

In [None]:
# One-hot encode the integer digit labels.
from tensorflow.keras.utils import to_categorical

# Pin the width to the 10 digit classes instead of letting to_categorical
# infer it from the largest label present, so the train and test targets
# always have the same number of columns as the 10-unit softmax output layer.
Y_train = to_categorical(y_train, num_classes=10)
Y_test = to_categorical(y_test, num_classes=10)

- 모델 정의, 설정, 학습, 평가

In [None]:
from tensorflow.keras.models import Sequential, load_model
from tensorflow.keras.layers import Dense, Conv2D, Flatten, MaxPooling2D  ## MaxPooling2D is newly introduced in this version.
from tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping

In [None]:
# del model

In [None]:
# Build the CNN one layer at a time.
model = Sequential()
# The last entry of input_shape is the channel count: 1 = grayscale, 3 = colour.
model.add(Conv2D(32, kernel_size=(3, 3), input_shape=(28, 28, 1), activation='relu'))
model.add(Conv2D(64, (3, 3), activation='relu'))
# Default pooling window, i.e. MaxPooling2D(pool_size=(2, 2)): halves the
# height and width of the feature maps.
model.add(MaxPooling2D())
model.add(Flatten())
model.add(Dense(512, activation='relu'))
# Output layer: 10 softmax units, matching the one-hot encoded targets.
model.add(Dense(10, activation='softmax'))
model.summary()

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_4 (Conv2D)           (None, 26, 26, 32)        320       
                                                                 
 conv2d_5 (Conv2D)           (None, 24, 24, 64)        18496     
                                                                 
 max_pooling2d_1 (MaxPooling  (None, 12, 12, 64)       0         
 2D)                                                             
                                                                 
 flatten_2 (Flatten)         (None, 9216)              0         
                                                                 
 dense_4 (Dense)             (None, 512)               4719104   
                                                                 
 dense_5 (Dense)             (None, 10)                5130      
                                                      

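- MaxPooling2D가 특성 맵을 24×24에서 12×12로 줄여 Flatten 출력이 9,216개가 되므로, 첫 번째 Dense 층의 파라미터 수가 4,719,104개로 확 줄어든다 (풀링이 없으면 36,864 × 512 + 512 = 18,874,880개).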

In [None]:
# Configure training: Adam optimizer, categorical cross-entropy on the
# one-hot targets, and accuracy reported alongside the loss.
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

In [None]:
# Callbacks: write the model to disk only when validation loss improves, and
# stop training after 10 consecutive epochs without improvement.
model_path = 'best-mnist-cnn-v2.h5'
early_stop = EarlyStopping(monitor='val_loss', patience=10)
checkpoint = ModelCheckpoint(
    filepath=model_path,
    monitor='val_loss',
    save_best_only=True,
    verbose=1,
)

In [None]:
# Train for at most 100 epochs with 20% of the training data held out for
# validation; per-epoch progress is silenced, so only the checkpoint
# callback's messages are printed.
hist = model.fit(
    X_train,
    Y_train,
    batch_size=200,
    epochs=100,
    validation_split=0.2,
    verbose=0,
    callbacks=[checkpoint, early_stop],
)
# Author's note: the start is slow while the GPU is being set up; after that
# training runs fast.


Epoch 00001: val_loss improved from inf to 0.05852, saving model to best-mnist-cnn-v2.h5

Epoch 00002: val_loss improved from 0.05852 to 0.05336, saving model to best-mnist-cnn-v2.h5

Epoch 00003: val_loss improved from 0.05336 to 0.04189, saving model to best-mnist-cnn-v2.h5

Epoch 00004: val_loss improved from 0.04189 to 0.04025, saving model to best-mnist-cnn-v2.h5

Epoch 00005: val_loss did not improve from 0.04025

Epoch 00006: val_loss did not improve from 0.04025

Epoch 00007: val_loss did not improve from 0.04025

Epoch 00008: val_loss did not improve from 0.04025

Epoch 00009: val_loss did not improve from 0.04025

Epoch 00010: val_loss did not improve from 0.04025

Epoch 00011: val_loss did not improve from 0.04025

Epoch 00012: val_loss did not improve from 0.04025

Epoch 00013: val_loss did not improve from 0.04025

Epoch 00014: val_loss did not improve from 0.04025


In [None]:
# Reload the checkpointed model (the one with the lowest validation loss) and
# score it on the test set; evaluate() reports [loss, accuracy].
# Previously recorded results:
#   [0.040496282279491425, 0.9872000217437744]
#   [0.040496282279491425, 0.9872000217437744]  (ver2)
best_model = load_model(filepath=model_path)
best_model.evaluate(x=X_test, y=Y_test)



[0.040496282279491425, 0.9872000217437744]