### 普通版本RNN
![general_RNN](gereral_RNN.PNG)
### TensorFlow版本RNN
![TensorFlow_RNN](TensorFlow_RNN.PNG)

In [66]:
import tensorflow as tf
import numpy as np
from keras import backend as K
K.clear_session()          # Clear the previous session so state cached by earlier Jupyter runs does not interfere

import matplotlib.pyplot as plt
%matplotlib auto

BATCH_START = 0            # running start index of the next batch; advanced by get_batch()
TIME_STEPS = 20            # sequence length; passed to LSTMRNN as n_steps
BATCH_SIZE = 50            # number of sequences per batch
INPUT_SIZE = 1             # features per time step of the model input
OUTPUT_SIZE = 1            # features per time step of the model output
CELL_SIZE = 10             # number of hidden units in the LSTM cell
LR = 0.006                 # learning rate handed to the Adam optimizer
BATCH_START_TEST = 0       # not referenced anywhere in the visible part of this notebook

def get_batch():
    """Produce the next batch of sine/cosine sequences and advance BATCH_START.

    A run of TIME_STEPS*BATCH_SIZE consecutive integers starting at the
    module-level BATCH_START is reshaped to (BATCH_SIZE, TIME_STEPS) and scaled
    by 1/(10*pi) to form the sample positions.

    Returns:
        A list ``[seq, res, xs]`` where
        - ``seq`` is sin(xs) with shape (BATCH_SIZE, TIME_STEPS, 1); the
          training loop feeds it as the model input,
        - ``res`` is cos(xs) with shape (BATCH_SIZE, TIME_STEPS, 1); the
          training loop feeds it as the regression target,
        - ``xs`` holds the sample positions, shape (BATCH_SIZE, TIME_STEPS).

    Side effects:
        Increments the global BATCH_START by TIME_STEPS, so successive calls
        slide the sampling window forward.
    """
    global BATCH_START, TIME_STEPS
    n_points = TIME_STEPS * BATCH_SIZE
    grid = np.arange(BATCH_START, BATCH_START + n_points)
    xs = grid.reshape((BATCH_SIZE, TIME_STEPS)) / (10 * np.pi)

    seq = np.sin(xs)     # input signal
    res = np.cos(xs)     # ground-truth signal the model should output

    # Shift the window for the next call.
    BATCH_START += TIME_STEPS

    # Append a trailing feature axis of length 1 to the two signals.
    return [seq[:, :, np.newaxis], res[:, :, np.newaxis], xs]

class LSTMRNN:
    """Sequence regression model: linear input layer -> LSTM -> linear output layer.

    Constructing an instance adds every op (placeholders, variables, loss,
    summary and training op) to the current default TensorFlow graph.

    Args:
        n_steps: number of time steps in each input/target sequence.
        input_size: number of features per time step of the input.
        output_size: number of features per time step of the target/prediction.
        cell_size: number of hidden units of the LSTM cell.
        batch_size: number of sequences per batch. It sizes the LSTM zero state
            and the loss weights, so it is fixed when the graph is built.

    Attributes set during construction:
        xs, ys: float32 placeholders for inputs and targets.
        l_in_y: output of the input layer, reshaped to 3-D for the LSTM.
        cell_init_state, cell_outputs, cell_final_state: LSTM state/outputs.
        pred: flattened predictions, one row per (sequence, time step).
        cost: scalar training loss.
        train_op: Adam update op; uses the module-level learning rate ``LR``.
    """

    def __init__(self, n_steps, input_size, output_size, cell_size, batch_size):
        self.n_steps = n_steps
        self.input_size = input_size
        self.output_size = output_size
        self.cell_size = cell_size
        self.batch_size = batch_size
        with tf.name_scope('inputs'):
            self.xs = tf.placeholder(tf.float32, [None, n_steps, input_size], name='xs')
            # Targets must match the prediction width (output_size), not the
            # input width; the two only coincide when both are 1.
            self.ys = tf.placeholder(tf.float32, [None, n_steps, output_size], name='ys')
        with tf.variable_scope('in_hidden'):
            self.add_input_layer()
        with tf.variable_scope('LSTM_cell'):
            self.add_cell()
        with tf.variable_scope('out_hidden'):
            self.add_output_layer()
        with tf.name_scope('cost'):
            self.compute_cost()
        with tf.name_scope('train'):
            self.train_op = tf.train.AdamOptimizer(LR).minimize(self.cost)

    def add_input_layer(self):
        """Project every time step from input_size to cell_size features."""
        # Flatten to 2-D so a single matmul handles all time steps:
        # (batch*n_steps, input_size)
        l_in_x = tf.reshape(self.xs, [-1, self.input_size], name='2_2D')
        Ws_in = self._weight_variable([self.input_size, self.cell_size])   # (input_size, cell_size)
        bs_in = self._bias_variable([self.cell_size,])                     # (cell_size,)
        with tf.name_scope('Wx_plus_b'):
            l_in_y = tf.matmul(l_in_x, Ws_in) + bs_in                      # (batch*n_steps, cell_size)
        # Back to 3-D for the recurrent layer: (batch, n_steps, cell_size)
        self.l_in_y = tf.reshape(l_in_y, [-1, self.n_steps, self.cell_size], name='2_3D')

    def add_cell(self):
        """Create the LSTM cell and unroll it over the input-layer output."""
        lstm_cell = tf.nn.rnn_cell.BasicLSTMCell(self.cell_size, forget_bias=1.0, state_is_tuple=True)
        with tf.name_scope('initial_state'):
            # The zero state is built for exactly batch_size sequences.
            self.cell_init_state = lstm_cell.zero_state(self.batch_size, dtype=tf.float32)
            # time_major=False: inputs are laid out as (batch, n_steps, cell_size).
            self.cell_outputs, self.cell_final_state = tf.nn.dynamic_rnn(
                lstm_cell, self.l_in_y, initial_state=self.cell_init_state, time_major=False)

    def add_output_layer(self):
        """Project every LSTM output from cell_size to output_size features."""
        # (batch*n_steps, cell_size)
        l_out_x = tf.reshape(self.cell_outputs, [-1, self.cell_size], name='2_2D')
        Ws_out = self._weight_variable([self.cell_size, self.output_size])
        bs_out = self._bias_variable([self.output_size,])
        with tf.name_scope('Wx_plus_b'):
            # (batch*n_steps, output_size)
            self.pred = tf.matmul(l_out_x, Ws_out) + bs_out

    def compute_cost(self):
        """Build the scalar loss ``self.cost`` and register a 'cost' summary.

        Predictions and targets are flattened to 1-D and passed, as
        single-element lists with all-ones weights, to
        ``sequence_loss_by_example`` with ``msr_error`` as the per-element
        loss. The resulting losses are summed and divided by batch_size.
        """
        losses = tf.contrib.legacy_seq2seq.sequence_loss_by_example(
            [tf.reshape(self.pred, [-1], name='reshape_pred')],
            [tf.reshape(self.ys, [-1], name='reshape_target')],
            [tf.ones([self.batch_size*self.n_steps], dtype=tf.float32)],
            average_across_timesteps = True,
            softmax_loss_function = self.msr_error,
            name = 'losses'
            )
        with tf.name_scope('average_cost'):
            self.cost = tf.div(
                tf.reduce_sum(losses, name='losses_sum'),
                tf.cast(self.batch_size, tf.float32),
                name = 'average_cost'
                )
            tf.summary.scalar('cost', self.cost)

    def msr_error(self, logits, labels):
        """Return the element-wise squared difference between logits and labels.

        The parameter names must stay ``logits`` and ``labels``: the TensorFlow
        helper documents that the loss function has to accept named arguments.
        """
        return tf.square(tf.subtract(logits, labels))

    def _weight_variable(self, shape, name='weights'):
        """Get/create a variable of ``shape`` initialised from N(0, 1)."""
        initializer = tf.random_normal_initializer(mean=0., stddev=1.,)
        return tf.get_variable(shape=shape, initializer=initializer, name=name)

    def _bias_variable(self, shape, name='biases'):
        """Get/create a variable of ``shape`` initialised to the constant 0.1."""
        initializer = tf.constant_initializer(0.1)
        return tf.get_variable(shape=shape, initializer=initializer, name=name)
    
if __name__ == '__main__':
    # Build the graph, then train for 200 batches while live-plotting the first
    # sequence of each batch and logging the cost to TensorBoard.
    model = LSTMRNN(TIME_STEPS, INPUT_SIZE, OUTPUT_SIZE, CELL_SIZE, BATCH_SIZE)
    sess = tf.Session()
    merged = tf.summary.merge_all()
    writer = tf.summary.FileWriter('017logs', sess.graph)

    try:
        # tf.initialize_all_variables() is deprecated; this is its replacement.
        sess.run(tf.global_variables_initializer())
        plt.ion()
        plt.show()
        for i in range(200):
            seq, res, xs = get_batch()    # model input, target, sample positions (x axis)
            if i == 0:
                # First batch: let the graph use its own zero initial state.
                feed_dict = {model.xs:seq, model.ys:res,}
            else:
                # Later batches: carry the LSTM state over from the previous batch.
                feed_dict = {model.xs:seq, model.ys:res, model.cell_init_state:state}

            _, cost, state, pred = sess.run(
                [model.train_op, model.cost, model.cell_final_state, model.pred],
                feed_dict=feed_dict)

            # Plot the first sequence of the batch: target in solid red,
            # prediction in dashed blue.
            plt.plot(xs[0, :], res[0].flatten(), 'r', xs[0, :], pred.flatten()[:TIME_STEPS], 'b--')
            plt.ylim((-1.2, 1.2))
            plt.draw()
            plt.pause(0.3)

            if i%20 == 0:
                print('cost：', round(cost, 4))
                result = sess.run(merged, feed_dict)
                writer.add_summary(result, i)
    finally:
        # Flush pending summaries to disk and release the session's resources
        # even if training is interrupted.
        writer.close()
        sess.close()

Using matplotlib backend: Qt5Agg
cost： 13.4159
cost： 5.1304
cost： 1.8306
cost： 5.1235
cost： 0.7821
cost： 0.287
cost： 0.0778
cost： 0.048
cost： 0.0388
cost： 0.0247


### cmd窗口下：
> E:
> 
> cd E:\wk\GithubProjects\DeepLearning\莫烦教程
>
> tensorboard --logdir=017logs/

### 浏览器打开网址：
http://WIN-Q2DQ03POEFR:6006/

（主机名因机器而异；在本机上也可以通过 http://localhost:6006/ 访问。）

In [50]:
# Show the documentation of the loss helper called in LSTMRNN.compute_cost.
help(tf.contrib.legacy_seq2seq.sequence_loss_by_example)

Help on function sequence_loss_by_example in module tensorflow.contrib.legacy_seq2seq.python.ops.seq2seq:

sequence_loss_by_example(logits, targets, weights, average_across_timesteps=True, softmax_loss_function=None, name=None)
    Weighted cross-entropy loss for a sequence of logits (per example).
    
    Args:
      logits: List of 2D Tensors of shape [batch_size x num_decoder_symbols].
      targets: List of 1D batch-sized int32 Tensors of the same length as logits.
      weights: List of 1D batch-sized float-Tensors of the same length as logits.
      average_across_timesteps: If set, divide the returned cost by the total
        label weight.
      softmax_loss_function: Function (labels, logits) -> loss-batch to be used
        instead of the standard softmax (the default if this is None). **Note that
        to avoid confusion, it is required for the function to accept named
        arguments.**
      name: Optional name for this operation, default: "sequence_loss_by_example".


### np.newaxis的用法
在np.newaxis所在的位置增加一个长度为1的维度

In [26]:
import numpy as np

# 1-D array with 3 elements.
X = np.array([1, 2, 3])
print(X)
# newaxis in the second position: each element becomes its own row (3 rows, 1 column).
print(X[:, np.newaxis])

[1 2 3]
[[1]
 [2]
 [3]]


In [27]:
# newaxis in the first position: the whole array becomes a single row (1 row, 3 columns).
print(X[np.newaxis, :])

[[1 2 3]]


In [28]:
# 2-D array with 2 rows and 3 columns.
X = np.array([[1, 2, 3],
              [4, 5, 6]
             ])
print(X)
# newaxis as the last index: every scalar is wrapped in its own length-1 axis.
print(X[:, :, np.newaxis])

[[1 2 3]
 [4 5 6]]
[[[1]
  [2]
  [3]]

 [[4]
  [5]
  [6]]]


In [29]:
# newaxis in the middle: every row is wrapped in its own length-1 axis.
print(X[:, np.newaxis, :])

[[[1 2 3]]

 [[4 5 6]]]


In [30]:
# newaxis as the first index: the whole 2-D array is wrapped in one length-1 axis.
print(X[np.newaxis, :, :])

[[[1 2 3]
  [4 5 6]]]
