In [2]:
import tensorflow as tf
import numpy as np
# Seed TensorFlow's random ops once, up front, for reproducibility.
RANDOM_SEED = 777
tf.set_random_seed(RANDOM_SEED)

In [3]:
sample = " if you want you"
# Build the vocabulary from the unique characters of the sample.
# The characters are sorted because iterating a bare set of strings can
# yield a different order on every interpreter run (string hashing is
# randomized per process), which would reshuffle the index <-> char
# mapping and make runs non-reproducible even with a fixed TensorFlow seed.
idx2char = sorted(set(sample)) # index -> char
char2idx = {c: i for i, c in enumerate(idx2char)} # char -> index

In [4]:
# hyper parameters
# All three layer sizes are set to the vocabulary size:
#   dic_size        - RNN input size (one hot size)
#   rnn_hidden_size - RNN output size
#   num_classes     - final output size (RNN or softmax, etc.)
dic_size = rnn_hidden_size = num_classes = len(char2idx)
# one sample data, one batch; step size handed to the optimizer
batch_size, learning_rate = 1, 0.1
# number of lstm rollings (unit #): one fewer than the sample length,
# because inputs and labels are the sample shifted by one character
sequence_length = len(sample) - 1

In [5]:
# Encode the sample as vocabulary indices, then shift it by one position
# to form (input, label) pairs: the label at each step is the next char.
sample_idx = list(map(char2idx.__getitem__, sample)) # char to index
x_data = [sample_idx[:len(sample_idx) - 1]] # X: every index except the last
y_data = [sample_idx[1:]] # Y: every index except the first

In [6]:
# Graph inputs: integer index sequences with a free (None) batch dimension
# and a fixed number of time steps.
X = tf.placeholder(dtype=tf.int32, shape=[None, sequence_length]) # X data
Y = tf.placeholder(dtype=tf.int32, shape=[None, sequence_length]) # Y label

In [7]:
# flatten the data (ignore batches for now). No effect if the batch size is 1
# Both the one-hot depth and the width of the flattened rows are the INPUT
# vocabulary size (dic_size). The previous code used num_classes and
# rnn_hidden_size here, which only worked because all three sizes happen
# to be equal in this notebook.
X_one_hot = tf.one_hot(X, dic_size) # one hot: 1 -> 0 1 0 0 0 0 0 0 0 0
# Merge the batch and time axes so that each character is one row.
X_for_softmax = tf.reshape(X_one_hot, [-1, dic_size])

In [8]:
# softmax layer (dic_size -> num_classes)
# The linear layer is applied directly to the flattened one-hot rows
# (X_for_softmax), so the weight's input dimension is the one-hot width,
# dic_size. It was previously declared with rnn_hidden_size, which only
# matched because the two sizes are equal here.
softmax_w = tf.get_variable("softmax_w", [dic_size, num_classes])
softmax_b = tf.get_variable("softmax_b", [num_classes])
# Per-character logits: one row per character, one column per class.
outputs = tf.matmul(X_for_softmax, softmax_w) + softmax_b

In [9]:
# expand the data (revive the batches): restore the batch and time axes
# that were merged before the matmul
outputs = tf.reshape(outputs, shape=[batch_size, sequence_length, num_classes])
# all-ones weights, one per (batch, time step) position
weights = tf.ones(shape=[batch_size, sequence_length])

In [10]:
# Compute sequence cost/loss
sequence_loss = tf.contrib.seq2seq.sequence_loss(
    logits=outputs,
    targets=Y,
    weights=weights,
)
loss = tf.reduce_mean(sequence_loss) # mean all sequence loss
# Build the optimizer first, then the op that applies one update step.
optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate)
train = optimizer.minimize(loss)

The TensorFlow contrib module will not be included in TensorFlow 2.0.
For more information, please see:
  * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md
  * https://github.com/tensorflow/addons
  * https://github.com/tensorflow/io (for I/O related ops)
If you depend on functionality not listed there, please file an issue.



In [11]:
# Index of the highest-scoring class along the last (class) axis of the
# reshaped outputs, i.e. one predicted index per batch item and time step.
prediction = tf.argmax(input=outputs, axis=2)

In [12]:
# Train on the single sample. After every update step, run the prediction
# op again and print the decoded string next to the loss of that step.
with tf.Session() as sess:
  sess.run(tf.global_variables_initializer())

  for step in range(3000):
    # One optimisation step; keep the loss value, discard the train op result.
    step_loss, _ = sess.run([loss, train], feed_dict={X: x_data, Y: y_data})
    # Separate run so the prediction reflects the weights after the update.
    predicted_idx = sess.run(prediction, feed_dict={X: x_data})

    # print char using dic
    decoded = ''.join(idx2char[c] for c in np.squeeze(predicted_idx))
    print(step, "loss:", step_loss, "Prediction:", decoded)

0 loss: 2.2233877 Prediction: in iouiiiu  iou
1 loss: 2.0227606 Prediction: if iou iiu  iou
2 loss: 1.839122 Prediction: if iou ion  iou
3 loss: 1.672697 Prediction: if iou ion  iou
4 loss: 1.5213573 Prediction: if iou ion  iou
5 loss: 1.3829963 Prediction: if iou iont iou
6 loss: 1.2566348 Prediction: yf you yant you
7 loss: 1.1417198 Prediction: yf you yant you
8 loss: 1.0376819 Prediction: yf you yant you
9 loss: 0.9439465 Prediction: yf you yant you
10 loss: 0.86004406 Prediction: yf you yant you
11 loss: 0.78555715 Prediction: yf you yant you
12 loss: 0.7199922 Prediction: yf you yant you
13 loss: 0.662702 Prediction: yf you yant you
14 loss: 0.61289537 Prediction: yf you yant you
15 loss: 0.56971484 Prediction: yf you yant you
16 loss: 0.5323365 Prediction: yf you yant you
17 loss: 0.50003535 Prediction: yf you yant you
18 loss: 0.47219607 Prediction: yf you yant you
19 loss: 0.4482865 Prediction: yf you yant you
20 loss: 0.42782414 Prediction: yf you yant you
21 loss: 0.41035873