In [1]:
import matplotlib as mpl
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import sklearn
import pandas as pd
import os
import sys
import time
import tensorflow as tf

from tensorflow import keras

# Record the runtime environment: TensorFlow version, Python version, then
# the name and version of each major library used in this notebook.
libraries = (mpl, np, pd, sklearn, tf, keras)
print(tf.__version__, sys.version_info, sep="\n")
for module in libraries:
    print("%s %s" % (module.__name__, module.__version__))


1.13.1
sys.version_info(major=3, minor=7, micro=3, releaselevel='final', serial=0)
matplotlib 3.0.3
numpy 1.16.2
pandas 0.24.2
sklearn 0.20.3
tensorflow 1.13.1
tensorflow._api.v1.keras 2.2.4-tf


In [2]:
# Load the Fashion-MNIST arrays through the Keras dataset helper.
fashion_mnist = keras.datasets.fashion_mnist
(x_train_all, y_train_all), (x_test, y_test) = fashion_mnist.load_data()

# Hold out the first 5000 training samples for validation; everything after
# index 5000 is used for training.
x_valid, y_valid = x_train_all[:5000], y_train_all[:5000]
x_train, y_train = x_train_all[5000:], y_train_all[5000:]

# Report (features, labels) shapes for the validation, training and test splits.
print(x_valid.shape, y_valid.shape)
print(x_train.shape, y_train.shape)
print(x_test.shape, y_test.shape)

(5000, 28, 28) (5000,)
(55000, 28, 28) (55000,)
(10000, 28, 28) (10000,)


In [3]:
# Raw pixel value range of the training images (before any scaling).
print(x_train.max(), x_train.min())

255 0


In [4]:
# Standardization: x = (x - mean) / std

from sklearn.preprocessing import StandardScaler

scaler = StandardScaler()


def _scale_pixels(images, scale_fn):
    """Flatten `images` to a single column, scale it, and return [N, 784] rows.

    `images` is cast to float32 and reshaped to (-1, 1), so every pixel is
    treated as a sample of one feature. `scale_fn` is the scaler method to
    apply (`fit_transform` or `transform`). The scaled column is reshaped to
    (-1, 28 * 28), i.e. one flattened image per row.
    """
    pixel_column = images.astype(np.float32).reshape(-1, 1)
    return scale_fn(pixel_column).reshape(-1, 28 * 28)


# x_train: [None, 28, 28] -> [None, 784]
# The scaler is fitted on the training pixels only; the validation and test
# sets are transformed with the statistics learned from the training set.
x_train_scaled = _scale_pixels(x_train, scaler.fit_transform)
x_valid_scaled = _scale_pixels(x_valid, scaler.transform)
x_test_scaled = _scale_pixels(x_test, scaler.transform)


In [5]:
# Value range of the training features after standardization.
print(x_train_scaled.max(), x_train_scaled.min())

2.023144 -0.8105139


# Tf1.0总结
    构建计算图：
        对于Sequential模型，通过tf.layers.dense（对应2.0中的tf.keras.layers.Dense），来堆叠模型层数。
        通过tf.losses.sparse_softmax_cross_entropy()指定loss计算方式
        指定prediction计算方法
        指定结果矩阵（01矩阵）计算方法
        指定准确率（accuracy）计算方法
        指定模型优化方向train_op
        至此，构建完了计算图。但这只是一个计算图，里面没有任何数据。（数据的位置先用placeholder占了位）
    创建会话（session），输入数据，运行计算图：
        自行指定batch_size，根据数据数量确定batch的数量。
        用for循环执行需要的epoch，用for循环规定一个epoch内的steps。
        在for循环内计算相关数据。
    
    tf.variable_scope():定义变量空间，防止重名。
    tf.get_variable():定义变量

In [6]:
hidden_units = [100, 100]  # number of neurons in each hidden layer
class_num = 10  # number of units in the output layer (one per class)

# tf.placeholder(dtype, shape=None) reserves a slot through which data is fed
# in later. The first argument is the data type, the second is the shape,
# here [batch_size, dim] (a tuple works as well).
# Why placeholders? In TF 1.x the graph is built first and data is only
# supplied when the graph is run, so no data is visible while the graph is
# being constructed; the placeholder stands in for it.
x = tf.placeholder(tf.float32, shape=[None, 28 * 28])  # rows of 784 flattened pixel values
y = tf.placeholder(tf.int64, shape=[None])  # one integer class label per sample

# Start from the input placeholder and stack the hidden layers on top of it.
input_for_next_layer = x
for hidden_unit in hidden_units:
    input_for_next_layer = tf.layers.dense(inputs=input_for_next_layer,
                                           units=hidden_unit,
                                           activation=tf.nn.relu)
# Output layer stacked on the last hidden layer; no activation is applied,
# so its output is the raw logits.
logits = tf.layers.dense(inputs=input_for_next_layer, units=class_num)

# last_hidden_output * W(logits) -> softmax -> prob
#   1. logits -> softmax -> prob
#   2. labels -> one_hot
#   3. calculate cross entropy
# The loss below is given the raw logits and the integer labels directly,
# so neither the softmax nor a one-hot encoding is written out in this cell.
loss = tf.losses.sparse_softmax_cross_entropy(labels=y, logits=logits)

# Accuracy: the index of the largest logit along axis 1 is the predicted label.
prediction = tf.argmax(logits, axis=1)
# Element-wise equality test against the true labels -> boolean vector.
correct_prediction = tf.equal(prediction, y)
# Cast the booleans to 0/1 and average them: the mean is the accuracy.
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float64))

# Running train_op once performs one training (optimization) step on the network.
train_op = tf.train.AdamOptimizer(learning_rate=1e-3).minimize(loss)

Instructions for updating:
Use keras.layers.dense instead.
Instructions for updating:
Colocations handled automatically by placer.
Instructions for updating:
Use tf.cast instead.


In [7]:
# Both x and logits are still symbolic tensors: the printout shows only a
# dtype and a shape with an unknown batch dimension ("?"), which means no
# data has been fed into the graph yet.
print(x, logits, sep="\n")

Tensor("Placeholder:0", shape=(?, 784), dtype=float32)
Tensor("dense_2/BiasAdd:0", shape=(?, 10), dtype=float32)


In [8]:
# Session configuration

# Op that initializes all variables of the graph; it is run once at the start of the session.
init = tf.global_variables_initializer()
batch_size = 20
epochs = 10
# Number of whole batches per pass; integer division ignores any leftover samples.
train_steps_per_epoch = len(x_train) // batch_size
valid_steps = len(x_valid) // batch_size

def eval_with_sess(sess, x, y, accuracy, images, labels, batch_size):
    """Evaluate `accuracy` over all of `images`/`labels` in mini-batches.

    Every sample is evaluated, including a trailing partial batch when the
    number of samples is not a multiple of `batch_size`. Each batch accuracy
    is weighted by the batch's size, so the result is the accuracy over the
    whole data set rather than an unweighted mean of per-batch values.

    Args:
        sess: object with a `run(fetches, feed_dict=...)` method.
        x: feed key for the feature batch.
        y: feed key for the label batch.
        accuracy: fetch passed to `sess.run`; its value must be the mean
            accuracy of the batch that was fed.
        images: array of features, indexed by sample along axis 0.
        labels: array of labels, aligned with `images` along axis 0.
        batch_size: positive number of samples per `sess.run` call.

    Returns:
        The accuracy over all samples as a numpy float64, or NaN when
        `images` contains no samples.

    Raises:
        ValueError: if `batch_size` is not positive.
    """
    if batch_size <= 0:
        raise ValueError(
            "batch_size must be a positive integer, got %r" % (batch_size,))

    num_samples = images.shape[0]
    if num_samples == 0:
        # Nothing to evaluate: return NaN explicitly instead of averaging an
        # empty list (which also yields NaN, but with a RuntimeWarning).
        return np.float64(np.nan)

    weighted_correct = 0.0
    for start in range(0, num_samples, batch_size):
        # Slicing past the end is safe; the last batch is simply shorter.
        batch_data = images[start:start + batch_size]
        batch_label = labels[start:start + batch_size]
        accuracy_val = sess.run(accuracy,
                                feed_dict={
                                    x: batch_data,
                                    y: batch_label
                                })
        # Weight by the actual batch size so a short final batch does not
        # count as much as a full one.
        weighted_correct += accuracy_val * batch_data.shape[0]
    return np.float64(weighted_correct / num_samples)

with tf.Session() as sess:
    sess.run(init)
    for epoch in range(epochs):  # the outer loop sets the number of epochs
        for step in range(train_steps_per_epoch):  # the inner loop sets the batches per epoch
            # Features and labels advance together by one batch per step.
            batch_start = step * batch_size
            batch_end = batch_start + batch_size
            batch_data = x_train_scaled[batch_start:batch_end]
            batch_label = y_train[batch_start:batch_end]
            # Train on one batch: fetching train_op applies the update, while
            # loss and accuracy are fetched in the same call for reporting.
            loss_val, accuracy_val, _ = sess.run(
                [loss, accuracy, train_op],
                feed_dict={x: batch_data, y: batch_label})
            # '\r' with end="" rewrites the same console line on every step.
            train_status = (epoch, step, loss_val, accuracy_val)
            print('\r[Train] epoch: %d, step: %d, loss: %3.5f, accuracy: %2.2f'
                  % train_status, end="")
        # After each epoch, measure accuracy on the validation set.
        valid_accuracy = eval_with_sess(sess, x, y, accuracy,
                                        x_valid_scaled, y_valid,
                                        batch_size)
        print("\t[Valid] acc: %2.2f" % (valid_accuracy))

[Train] epoch: 0, step: 2749, loss: 0.29409, accuracy: 0.85	[Valid] acc: 0.86
[Train] epoch: 1, step: 2749, loss: 0.23783, accuracy: 0.90	[Valid] acc: 0.87
[Train] epoch: 2, step: 2749, loss: 0.16557, accuracy: 0.90	[Valid] acc: 0.87
[Train] epoch: 3, step: 2749, loss: 0.16518, accuracy: 0.85	[Valid] acc: 0.88
[Train] epoch: 4, step: 2749, loss: 0.18367, accuracy: 0.90	[Valid] acc: 0.88
[Train] epoch: 5, step: 2749, loss: 0.18992, accuracy: 0.95	[Valid] acc: 0.88
[Train] epoch: 6, step: 2749, loss: 0.13003, accuracy: 0.95	[Valid] acc: 0.88
[Train] epoch: 7, step: 2749, loss: 0.19065, accuracy: 0.95	[Valid] acc: 0.89
[Train] epoch: 8, step: 2749, loss: 0.12379, accuracy: 0.90	[Valid] acc: 0.88
[Train] epoch: 9, step: 2749, loss: 0.11657, accuracy: 0.95	[Valid] acc: 0.89
