上一个自定义模型的训练精度和训练效率都极低，主要原因是没有按照常见的设计规律来搭建——它是在不了解原理的情况下硬造出来的模型。

上一个模型是这样的：

input_layer + conv1 + pool1 + conv2 + pool2 + conv3 + pool3 + conv4 + pool4 + dense1 + dense2 + dense3 + dense4 + logits

这个层倒是很多，hidden layers 有12层！

不过，下面是两处关于CNN设计的建议：

https://medium.com/technologymadeeasy/the-best-explanation-of-convolutional-neural-networks-on-the-internet-fbb8b1ad5df8

这篇文章里有 CNN 各层之间 shape 的计算方法，以及层结构设计的建议：


![Typical architecture of CNN](https://cdn-images-1.medium.com/max/1600/1*2SWb6CmxzbPZijmevFbe-g.jpeg)

上面的图可能显示不出来，它是这样建议的：

conv + conv + pool + conv + conv + pool + conv + conv + pool + ...

这是另一处（Stanford CS231n 课程笔记）给出的层结构建议：

INPUT -> [[CONV -> RELU]*N -> POOL?]*M -> [FC -> RELU]*K -> FC





In [None]:
import tensorflow as tf
import numpy as np
import os
import random
from numpy import array

from skimage.io import imread, imsave
from skimage.color import rgb2gray
from skimage.transform import resize

IMAGE_SIZE = 64
# CHARSET_SIZE = 3755
CHARSET_SIZE = 37

def input(dataset):
    """Return the ``(images, labels)`` pair stored on *dataset*.

    NOTE: the name shadows the ``input`` builtin; it is kept because the
    rest of the script calls it under this name.
    """
    images = dataset.images
    labels = dataset.labels
    return images, labels

def cnn_model_fn(features, labels, mode):
  """Model function for a small CNN classifier (tf.estimator model_fn).

  Layer stack: input -> conv1 -> pool1 -> conv2 -> pool2 -> 4 x dense(1024)
  -> dropout -> logits (CHARSET_SIZE units).

  Args:
    features: dict whose "x" entry holds the image batch; it is reshaped to
      [-1, IMAGE_SIZE, IMAGE_SIZE, 1].
    labels: class ids fed to sparse softmax cross-entropy and to the
      accuracy metric. Not used in PREDICT mode.
    mode: one of tf.estimator.ModeKeys (TRAIN / EVAL / PREDICT).

  Returns:
    A tf.estimator.EstimatorSpec matching `mode`.
  """
  # Input Layer: single-channel IMAGE_SIZE x IMAGE_SIZE images. The size is
  # taken from IMAGE_SIZE so the model follows the data loader's setting.
  input_layer = tf.reshape(features["x"], [-1, IMAGE_SIZE, IMAGE_SIZE, 1])
  print ('shape of input_layer: ', input_layer)
  # With batch_size=100 and IMAGE_SIZE=64 this prints:
  # shape of input_layer:  Tensor("Reshape:0", shape=(100, 64, 64, 1), dtype=float32)

  # Convolutional Layer #1 ("same" padding keeps the spatial size)
  conv1 = tf.layers.conv2d(
      inputs=input_layer,
      filters=32,
      kernel_size=[5, 5],
      padding="same",
      activation=tf.nn.relu)
  print ('shape of conv1: ', conv1)
  # shape of conv1:  Tensor("conv2d/Relu:0", shape=(100, 64, 64, 32), dtype=float32)

  # Pooling Layer #1 (2x2, stride 2: halves height and width)
  pool1 = tf.layers.max_pooling2d(inputs=conv1, pool_size=[2, 2], strides=2)
  print ('shape of pool1: ', pool1)

  # Convolutional Layer #2 and Pooling Layer #2
  conv2 = tf.layers.conv2d(
      inputs=pool1,
      filters=64,
      kernel_size=[5, 5],
      padding="same",
      activation=tf.nn.relu)
  pool2 = tf.layers.max_pooling2d(inputs=conv2, pool_size=[2, 2], strides=2)
  print ('shape of conv2: ', conv2, '; and shape of pool2 is: ', pool2)
  # shape of conv2:  Tensor("conv2d_2/Relu:0", shape=(100, 32, 32, 64), dtype=float32) ; and shape of pool2 is:  Tensor("max_pooling2d_2/MaxPool:0", shape=(100, 16, 16, 64), dtype=float32)

  # Dense Layers
  # Flatten using pool2's static shape instead of a hard-coded 16 * 16 * 64,
  # so the flatten size stays correct if IMAGE_SIZE or the filters change.
  _, pool_height, pool_width, pool_channels = pool2.get_shape().as_list()
  pool2_flat = tf.reshape(
      pool2, [-1, pool_height * pool_width * pool_channels])
  dense1 = tf.layers.dense(inputs=pool2_flat, units=1024, activation=tf.nn.relu)
  dense2 = tf.layers.dense(inputs=dense1, units=1024, activation=tf.nn.relu)
  dense3 = tf.layers.dense(inputs=dense2, units=1024, activation=tf.nn.relu)
  dense4 = tf.layers.dense(inputs=dense3, units=1024, activation=tf.nn.relu)

  # Dropout is only active while training.
  dropout = tf.layers.dropout(
      inputs=dense4,
      rate=0.1,
      training=(mode == tf.estimator.ModeKeys.TRAIN))

  # Logits Layer: one unit per character class
  logits = tf.layers.dense(inputs=dropout, units=CHARSET_SIZE)

  predictions = {
      # Generate predictions (for PREDICT and EVAL mode)
      "classes": tf.argmax(input=logits, axis=1),
      # Add `softmax_tensor` to the graph. It is used for PREDICT and by the
      # `logging_hook`.
      "probabilities": tf.nn.softmax(logits, name="softmax_tensor")
  }

  if mode == tf.estimator.ModeKeys.PREDICT:
    return tf.estimator.EstimatorSpec(mode=mode, predictions=predictions)

  # Calculate Loss (for both TRAIN and EVAL modes)
  loss = tf.losses.sparse_softmax_cross_entropy(labels=labels, logits=logits)

  # Configure the Training Op (for TRAIN mode)
  if mode == tf.estimator.ModeKeys.TRAIN:
    # NOTE(review): plain SGD at learning_rate=1e-4 is very small. The
    # training log captured with this script shows the loss hovering around
    # 3.59-3.60, close to ln(37) ~= 3.61 (chance level for 37 classes).
    # Consider a larger rate or an adaptive optimizer; left unchanged here
    # so existing runs stay comparable.
    optimizer = tf.train.GradientDescentOptimizer(learning_rate=0.0001)
    train_op = optimizer.minimize(
        loss=loss,
        global_step=tf.train.get_global_step())
    return tf.estimator.EstimatorSpec(mode=mode, loss=loss, train_op=train_op)

  # Add evaluation metrics (for EVAL mode)
  eval_metric_ops = {
      "accuracy": tf.metrics.accuracy(
          labels=labels, predictions=predictions["classes"])}
  return tf.estimator.EstimatorSpec(
      mode=mode, loss=loss, eval_metric_ops=eval_metric_ops)


class DataSetLoader:
    """Load a directory tree of labelled images into numpy arrays.

    Expected layout: ``data_dir/<class index>/<image file>``, where the
    class directory name parses as an integer label (e.g. ``00012``).
    Only classes with ``0 <= index < CHARSET_SIZE`` are loaded; files that
    sit directly in ``data_dir`` or under a non-numeric directory are
    skipped.
    """

    def __init__(self, data_dir):
        """Read, resize and grayscale every selected image under *data_dir*.

        Args:
            data_dir: root directory of the dataset; works with or without
                a trailing path separator.
        """
        # Set CHARSET_SIZE to a small value if available computation power is limited.
        truncate_path = os.path.join(data_dir, '%05d' % CHARSET_SIZE)
        print('Now processing path: ', truncate_path)

        # Collect (path, label) pairs. The label comes from the first path
        # component below data_dir and is compared numerically, so the
        # filter does not depend on zero padding or on a trailing separator.
        samples = []
        for root, _sub_folders, file_list in os.walk(data_dir):
            class_dir = os.path.relpath(root, data_dir).split(os.sep)[0]
            try:
                label = int(class_dir)
            except ValueError:
                # data_dir itself ('.') or a non-numeric directory.
                continue
            if 0 <= label < CHARSET_SIZE:
                samples += [(os.path.join(root, file_name), label)
                            for file_name in file_list]

        # Shuffle paths and labels together so they stay aligned.
        random.shuffle(samples)
        labels = [label for _, label in samples]

        # Process one image at a time so the full-resolution originals are
        # not all held in memory at once.
        images = [
            rgb2gray(resize(imread(file_name), (IMAGE_SIZE, IMAGE_SIZE)))
            for file_name, _ in samples
        ]

        if images:
            print ('self.images: ', images[0].dtype)
            # float32 image batch, one entry per loaded file.
            self.images = np.float32(images)
            print ('self.images: ', self.images[0].dtype)
        else:
            # No matching files: expose an empty, correctly shaped batch
            # instead of failing on images[0].
            self.images = np.zeros((0, IMAGE_SIZE, IMAGE_SIZE), dtype=np.float32)

        # Integer class ids aligned with self.images.
        self.labels = array(labels, dtype=int)

    
# ---- Load the training set ------------------------------------------------
train_data = DataSetLoader(data_dir='../data/train_/')
print ('Train data loaded ...')

# Feature spec for the "x" input (not passed to the custom estimator below).
feature_columns = [
    tf.feature_column.numeric_column("x", shape=[IMAGE_SIZE, IMAGE_SIZE]),
]

# ---- Estimator built on the custom model function --------------------------
classifier = tf.estimator.Estimator(
    model_fn=cnn_model_fn,
    model_dir='../dfs/checkpoint/customized_model-e',
)

# ---- Training ---------------------------------------------------------------
# num_epochs=None repeats the data indefinitely; `steps` bounds the training.
train_images, train_labels = input(train_data)
train_input_fn = tf.estimator.inputs.numpy_input_fn(
    x={"x": train_images},
    y=train_labels,
    num_epochs=None,
    batch_size=100,
    shuffle=True,
)
print ('Begin to train ...')

classifier.train(input_fn=train_input_fn, steps=20000)
print ('Train done ...')

# ---- Evaluation -------------------------------------------------------------
test_data = DataSetLoader(data_dir='../data/test_/')
print ('Test data loaded ...')

# A single, unshuffled pass over the test set.
test_images, test_labels = input(test_data)
test_input_fn = tf.estimator.inputs.numpy_input_fn(
    x={"x": test_images},
    y=test_labels,
    num_epochs=1,
    shuffle=False,
)

# Report accuracy as a percentage.
eval_results = classifier.evaluate(input_fn=test_input_fn)
accuracy_score = eval_results["accuracy"]
print("\nTest Accuracy: {0:f}%\n".format(accuracy_score*100))

Now processing path:  ../data/train_/00037
self.images:  float64
self.images:  float32
Train data loaded ...
INFO:tensorflow:Using default config.
INFO:tensorflow:Using config: {'_model_dir': '../dfs/checkpoint/customized_model-e', '_tf_random_seed': 1, '_save_summary_steps': 100, '_save_checkpoints_secs': 600, '_save_checkpoints_steps': None, '_session_config': None, '_keep_checkpoint_max': 5, '_keep_checkpoint_every_n_hours': 10000, '_log_step_count_steps': 100}
Begin to train ...
shape of input_layer:  Tensor("Reshape:0", shape=(100, 64, 64, 1), dtype=float32)
shape of conv1:  Tensor("conv2d/Relu:0", shape=(100, 64, 64, 32), dtype=float32)
shape of pool1:  Tensor("max_pooling2d/MaxPool:0", shape=(100, 32, 32, 32), dtype=float32)
shape of conv2:  Tensor("conv2d_2/Relu:0", shape=(100, 32, 32, 64), dtype=float32) ; and shape of pool2 is:  Tensor("max_pooling2d_2/MaxPool:0", shape=(100, 16, 16, 64), dtype=float32)
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Saving checkp

INFO:tensorflow:global_step/sec: 1.02306
INFO:tensorflow:loss = 3.60335, step = 6501 (97.745 sec)
INFO:tensorflow:Saving checkpoints for 6519 into ../dfs/checkpoint/customized_model-e/model.ckpt.
INFO:tensorflow:global_step/sec: 1.04383
INFO:tensorflow:loss = 3.60328, step = 6601 (95.801 sec)
INFO:tensorflow:global_step/sec: 1.0463
INFO:tensorflow:loss = 3.60356, step = 6701 (95.575 sec)
INFO:tensorflow:global_step/sec: 1.03814
INFO:tensorflow:loss = 3.60466, step = 6801 (96.326 sec)
INFO:tensorflow:global_step/sec: 1.01617
INFO:tensorflow:loss = 3.604, step = 6901 (98.409 sec)
INFO:tensorflow:global_step/sec: 1.06509
INFO:tensorflow:loss = 3.60256, step = 7001 (93.889 sec)
INFO:tensorflow:global_step/sec: 1.09073
INFO:tensorflow:loss = 3.60473, step = 7101 (91.681 sec)
INFO:tensorflow:Saving checkpoints for 7151 into ../dfs/checkpoint/customized_model-e/model.ckpt.
INFO:tensorflow:global_step/sec: 1.08161
INFO:tensorflow:loss = 3.59938, step = 7201 (92.454 sec)
INFO:tensorflow:global_

INFO:tensorflow:loss = 3.59515, step = 13701 (95.289 sec)
INFO:tensorflow:global_step/sec: 1.05452
INFO:tensorflow:loss = 3.59334, step = 13801 (94.829 sec)
INFO:tensorflow:global_step/sec: 1.00318
INFO:tensorflow:loss = 3.59563, step = 13901 (99.683 sec)
INFO:tensorflow:global_step/sec: 0.967219
INFO:tensorflow:loss = 3.5964, step = 14001 (103.389 sec)
INFO:tensorflow:global_step/sec: 0.986241
INFO:tensorflow:loss = 3.59845, step = 14101 (101.396 sec)
INFO:tensorflow:Saving checkpoints for 14136 into ../dfs/checkpoint/customized_model-e/model.ckpt.
INFO:tensorflow:global_step/sec: 1.0277
INFO:tensorflow:loss = 3.59396, step = 14201 (97.304 sec)
INFO:tensorflow:global_step/sec: 1.05905
INFO:tensorflow:loss = 3.5903, step = 14301 (94.424 sec)
INFO:tensorflow:global_step/sec: 0.975196
INFO:tensorflow:loss = 3.59236, step = 14401 (102.544 sec)
INFO:tensorflow:global_step/sec: 1.05173
INFO:tensorflow:loss = 3.59417, step = 14501 (95.082 sec)
INFO:tensorflow:global_step/sec: 1.09616
INFO:te

INFO:tensorflow:Starting evaluation at 2018-04-30-10:32:08
INFO:tensorflow:Restoring parameters from /tmp/tmp4bp3lczu/model.ckpt-10000
INFO:tensorflow:Finished evaluation at 2018-04-30-10:32:18
INFO:tensorflow:Saving dict for global step 10000: accuracy = 0.0733032, global_step = 10000, loss = 3.59994

Test Accuracy: 7.330317%

