# 資料預處理

In [1]:
from keras.utils import np_utils
import numpy as np
# Seed NumPy's global random generator so NumPy-driven randomness repeats
# between runs. The seed is named so it can be found and changed in one place.
# NOTE(review): this seeds NumPy only; confirm whether the backend needs its own seed.
SEED = 10
np.random.seed(SEED)

Using TensorFlow backend.


In [2]:
from keras.datasets import mnist
# load_data() is unpacked as a (train, test) pair, each an (images, labels) tuple.
train_split, test_split = mnist.load_data()
x_train_image, y_train_label = train_split
x_test_image, y_test_label = test_split

In [3]:
# Flatten every image into a 1-D float32 feature vector. The sample count is
# taken from the array itself and the feature width is inferred (-1), so the
# cell no longer depends on the hard-coded 60000 / 10000 / 784 sizes.
x_Train = x_train_image.reshape(x_train_image.shape[0], -1).astype('float32')
x_Test = x_test_image.reshape(x_test_image.shape[0], -1).astype('float32')

In [4]:
# Rescale the features by the largest 8-bit pixel value.
# Assumes the raw pixels are in 0..255, which puts the result in [0, 1].
PIXEL_MAX = 255
x_Train_normalize = x_Train / PIXEL_MAX
x_Test_normalize = x_Test / PIXEL_MAX

In [5]:
# One-hot encode the digit labels. num_classes is pinned to 10 (the width of
# the softmax output layer) instead of being inferred from the largest label
# present, so the train and test encodings always have the same number of columns.
y_Train_OneHot = np_utils.to_categorical(y_train_label, num_classes=10)
y_Test_OneHot = np_utils.to_categorical(y_test_label, num_classes=10)

# 建立模型

In [6]:
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout

In [7]:
# Start from an empty Sequential model; the model.add(...) cells below append its layers in order.
model = Sequential()

In [8]:
#將「輸入層」與「隱藏層1」加入模型

In [9]:
# Input layer + hidden layer 1: 784 input features feeding 1000 ReLU units.
hidden_layer_1 = Dense(
    units=1000,
    input_dim=784,
    kernel_initializer='normal',
    activation='relu',
)
model.add(hidden_layer_1)

Instructions for updating:
Colocations handled automatically by placer.


In [10]:
# Dropout after hidden layer 1, with the drop rate passed by keyword.
model.add(Dropout(rate=0.5))

Instructions for updating:
Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.


In [11]:
#將「隱藏層2」加入模型

In [12]:
# Hidden layer 2: another 1000 ReLU units; the input size comes from the previous layer.
hidden_layer_2 = Dense(
    units=1000,
    kernel_initializer='normal',
    activation='relu',
)
model.add(hidden_layer_2)

In [13]:
# Dropout after hidden layer 2, with the drop rate passed by keyword.
model.add(Dropout(rate=0.5))

In [14]:
#將「輸出層」加入模型

In [15]:
# Output layer: 10 softmax units, one per digit class.
output_layer = Dense(
    units=10,
    kernel_initializer='normal',
    activation='softmax',
)
model.add(output_layer)

In [16]:
# summary() prints the layer table itself and returns None, so wrapping it in
# print() only adds a stray "None" line to the output.
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_1 (Dense)              (None, 1000)              785000    
_________________________________________________________________
dropout_1 (Dropout)          (None, 1000)              0         
_________________________________________________________________
dense_2 (Dense)              (None, 1000)              1001000   
_________________________________________________________________
dropout_2 (Dropout)          (None, 1000)              0         
_________________________________________________________________
dense_3 (Dense)              (None, 10)                10010     
Total params: 1,796,010
Trainable params: 1,796,010
Non-trainable params: 0
_________________________________________________________________
None


# 訓練模型

In [17]:
# Configure training: cross-entropy over the one-hot targets, the Adam
# optimizer, and accuracy reported alongside the loss.
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

In [None]:
# Train for 10 epochs in mini-batches of 200, holding out 20% of the training
# data for validation; verbose=2 logs one line per epoch.
train_history = model.fit(
    x=x_Train_normalize,
    y=y_Train_OneHot,
    validation_split=0.2,
    epochs=10,
    batch_size=200,
    verbose=2,
)

Instructions for updating:
Use tf.cast instead.
Train on 48000 samples, validate on 12000 samples
Epoch 1/10
 - 14s - loss: 0.3635 - acc: 0.8870 - val_loss: 0.1340 - val_acc: 0.9607
Epoch 2/10
 - 12s - loss: 0.1602 - acc: 0.9512 - val_loss: 0.0999 - val_acc: 0.9703
Epoch 3/10
 - 12s - loss: 0.1168 - acc: 0.9639 - val_loss: 0.0848 - val_acc: 0.9742
Epoch 4/10
 - 12s - loss: 0.0976 - acc: 0.9697 - val_loss: 0.0836 - val_acc: 0.9747
Epoch 5/10
 - 12s - loss: 0.0864 - acc: 0.9725 - val_loss: 0.0795 - val_acc: 0.9770
Epoch 6/10
 - 12s - loss: 0.0746 - acc: 0.9763 - val_loss: 0.0764 - val_acc: 0.9765
Epoch 7/10
 - 12s - loss: 0.0654 - acc: 0.9790 - val_loss: 0.0737 - val_acc: 0.9783
Epoch 8/10
 - 12s - loss: 0.0590 - acc: 0.9815 - val_loss: 0.0835 - val_acc: 0.9777
Epoch 9/10


# 以圖形顯示訓練過程

In [None]:
import matplotlib.pyplot as plt
def show_train_history(train_history, train, validation):
    """Plot a training metric next to its validation counterpart.

    Args:
        train_history: Object exposing a ``history`` mapping from metric name
            to a sequence of recorded values (e.g. what ``model.fit`` returns).
        train: Key of the training metric; also used as the y-axis label.
        validation: Key of the validation metric.
    """
    curves = train_history.history
    # Draw the training curve first so it matches the first legend entry.
    for metric_key in (train, validation):
        plt.plot(curves[metric_key])
    plt.legend(['train', 'validation'], loc='upper left')
    plt.xlabel('Epoch')
    plt.ylabel(train)
    plt.title('Train History')
    plt.show()

In [None]:
# Accuracy curves: training vs. validation.
show_train_history(train_history, train='acc', validation='val_acc')

In [None]:
# Loss curves: training vs. validation.
show_train_history(train_history, train='loss', validation='val_loss')

# 評估模型準確率

In [None]:
# Score the trained model on the normalized test set. Index 1 of the result
# is read as accuracy, the metric requested in compile(); index 0 is the loss.
scores = model.evaluate(x=x_Test_normalize, y=y_Test_OneHot)
test_accuracy = scores[1]
print()
print('accuracy=', test_accuracy)

# 進行預測

In [None]:
# Predict on the normalized test features. The model was fitted on
# x_Train_normalize (pixels divided by 255), so feeding the unscaled x_Test
# would give it inputs on a different scale from what it was trained on.
prediction = model.predict_classes(x_Test_normalize)

In [None]:
# Display the predicted class labels (the notebook renders a cell's last expression).
prediction

In [None]:
import matplotlib.pyplot as plt
def plot_images_labels_prediction(images,labels,
                                  prediction,idx,num=10):
    """Show consecutive images with their labels (and predictions) on a 5x5 grid.

    Args:
        images: Indexable, sized collection of images to pass to ``imshow``.
        labels: Indexable collection of true labels, aligned with ``images``.
        prediction: Indexable, sized collection of predicted labels aligned
            with ``images``; pass an empty sequence to show labels only.
        idx: Index of the first image to show.
        num: Number of consecutive images to show. Capped at 25 (the grid
            size) and at the number of images available from ``idx`` onward.
    """
    fig = plt.gcf()
    fig.set_size_inches(12, 14)
    # Never run past the 5x5 grid or the end of the data; without the second
    # cap, idx + num > len(images) would raise IndexError part-way through.
    num = min(num, 25, max(len(images) - idx, 0))
    has_prediction = len(prediction) > 0
    for cell, i in enumerate(range(idx, idx + num), start=1):
        ax = plt.subplot(5, 5, cell)
        ax.imshow(images[i], cmap='binary')
        title = "label=" + str(labels[i])
        if has_prediction:
            title += ",predict=" + str(prediction[i])
        ax.set_title(title, fontsize=10)
        # Hide the tick marks on both axes.
        ax.set_xticks([])
        ax.set_yticks([])
    plt.show()

In [None]:
# Show the default number of test digits, starting at index 340.
plot_images_labels_prediction(
    images=x_test_image,
    labels=y_test_label,
    prediction=prediction,
    idx=340,
)

# confusion matrix

In [None]:
import pandas as pd
# Cross-tabulate true labels (rows) against predicted labels (columns).
confusion_matrix = pd.crosstab(
    index=y_test_label,
    columns=prediction,
    rownames=['label'],
    colnames=['predict'],
)
confusion_matrix

In [None]:
# Pair each true label with its prediction, one row per test sample,
# then preview the first two rows.
df = pd.DataFrame({'label': y_test_label, 'predict': prediction})
df.head(2)

In [None]:
# Rows where the true digit is 5 but the model predicted 3.
is_five = df['label'] == 5
predicted_three = df['predict'] == 3
df[is_five & predicted_three]

In [None]:
# Show the single test digit at index 340.
plot_images_labels_prediction(
    images=x_test_image,
    labels=y_test_label,
    prediction=prediction,
    idx=340,
    num=1,
)

In [None]:
# Show the single test digit at index 1289.
plot_images_labels_prediction(
    images=x_test_image,
    labels=y_test_label,
    prediction=prediction,
    idx=1289,
    num=1,
)