In [None]:
import numpy as np
# Seed NumPy's global RNG before anything else draws from it.
# NOTE(review): this seeds NumPy only; whether the Keras backend takes its
# weight-initialisation randomness from NumPy depends on the backend -- confirm.
np.random.seed(1337)

import os
# Expose only the CUDA device with index 3 to this process.
# NOTE(review): the index is machine-specific, and this is presumably placed
# ahead of the Keras imports on purpose so the backend sees it -- confirm.
os.environ["CUDA_VISIBLE_DEVICES"] = "3"

from keras.datasets import mnist
from keras.utils import np_utils
from keras.models import Sequential
from keras.layers import SimpleRNN, Activation, Dense
from keras.optimizers import Adam

# --- Input geometry: an image is fed to the RNN one row per time step ---
TIME_STEPS = 28     # sequence length (image height)
INPUT_SIZE = 28     # features per time step (image width)

# --- Network and optimiser hyper-parameters ---
CELL_SIZE = 50      # number of hidden units in the recurrent layer
OUTPUT_SIZE = 10    # width of the final Dense layer
LR = 0.001          # learning rate handed to Adam

# --- Mini-batching ---
BATCH_SIZE = 500    # samples per train_on_batch call
BATCH_INDEX = 0     # running start offset of the next batch; mutated by the training loop


# Load the MNIST train/test split.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Shape every image as (TIME_STEPS, INPUT_SIZE) and scale the pixel values by
# 1/255. The dimensions come from the module constants rather than literals so
# the data always matches the input shape declared on the SimpleRNN layer.
# Dividing by a float keeps this a true division regardless of interpreter.
X_train = X_train.reshape(-1, TIME_STEPS, INPUT_SIZE) / 255.0
X_test = X_test.reshape(-1, TIME_STEPS, INPUT_SIZE) / 255.0

# One-hot encode the labels; the number of classes is tied to OUTPUT_SIZE so it
# cannot drift from the width of the model's final Dense layer.
y_train = np_utils.to_categorical(y_train, num_classes=OUTPUT_SIZE)
y_test = np_utils.to_categorical(y_test, num_classes=OUTPUT_SIZE)


# Classifier: a single SimpleRNN layer reads each image as TIME_STEPS steps of
# INPUT_SIZE values, then a Dense layer followed by softmax produces
# OUTPUT_SIZE class scores.
model = Sequential([
    SimpleRNN(
        units=CELL_SIZE,
        # Leading None leaves the batch dimension unspecified.
        batch_input_shape=(None, TIME_STEPS, INPUT_SIZE),
        unroll=True,
    ),
    Dense(OUTPUT_SIZE),
    Activation('softmax'),
])

# Adam with learning rate LR, trained against categorical cross-entropy
# while also tracking accuracy.
adam = Adam(LR)
model.compile(
    loss='categorical_crossentropy',
    metrics=['accuracy'],
    optimizer=adam,
)


# Manual mini-batch training: 4001 steps so that step 4000 is also evaluated.
for step in range(4001):
    # Take the next BATCH_SIZE samples starting at the running offset.
    batch_end = BATCH_INDEX + BATCH_SIZE
    X_batch = X_train[BATCH_INDEX:batch_end]
    Y_batch = y_train[BATCH_INDEX:batch_end]
    cost = model.train_on_batch(X_batch, Y_batch)

    # Advance the offset, wrapping to the start once it reaches the end of
    # the training set.
    BATCH_INDEX = batch_end if batch_end < X_train.shape[0] else 0

    # Only every 500th step is evaluated and reported.
    if step % 500 != 0:
        continue

    # Evaluate on the whole test set in a single batch; note that `cost` is
    # rebound here from the training result to the test loss.
    cost, accuracy = model.evaluate(X_test, y_test, batch_size=y_test.shape[0], verbose=False)
    print('step', step, 'test cost: ', cost, 'test accuracy: ', accuracy)
    


step 0 test cost:  2.308062791824341 test accuracy:  0.12449999898672104
step 500 test cost:  0.36845862865448 test accuracy:  0.8931999802589417
step 1000 test cost:  0.22872890532016754 test accuracy:  0.9344000220298767
step 1500 test cost:  0.19329142570495605 test accuracy:  0.9445000290870667
step 2000 test cost:  0.1605876088142395 test accuracy:  0.953499972820282
step 2500 test cost:  0.14145895838737488 test accuracy:  0.9567000269889832
