Jupyter Notebook version of https://machinelearningmastery.com/how-to-develop-a-word-level-neural-language-model-in-keras/

In [1]:
from random import randint
from pickle import load
from keras.models import load_model
from keras.preprocessing.sequence import pad_sequences

Using TensorFlow backend.


### Function for loading a document



In [0]:
def load_doc(filename):
	"""Read a text file and return its whole contents as a single string.

	Args:
		filename: path of the file to read (opened in text mode, read only).

	Returns:
		The complete text of the file.
	"""
	# the context manager closes the handle even when read() raises
	with open(filename, 'r') as file:
		return file.read()

### Function for generating a sequence from the language model

In [0]:
def generate_seq(model, tokenizer, seq_length, seed_text, n_words):
	"""Generate n_words words by repeatedly feeding the model its own output.

	Args:
		model: model offering predict_classes(), or otherwise predict() whose
			result supports argmax(axis=-1).
		tokenizer: object with texts_to_sequences() and a word_index mapping
			of word -> integer index.
		seq_length: number of tokens each model input is padded/truncated to.
		seed_text: text used to prime the generation.
		n_words: how many words to generate.

	Returns:
		The generated words joined by single spaces (the seed text is not
		included). An index with no entry in word_index yields an empty word.
	"""
	# invert the vocabulary once rather than scanning it for every generated word;
	# setdefault keeps the first word seen for an index, matching a first-match scan
	index_to_word = dict()
	for word, index in tokenizer.word_index.items():
		index_to_word.setdefault(index, word)
	# predict_classes() is absent from newer Keras releases; fall back to predict() + argmax
	predict_classes = getattr(model, 'predict_classes', None)
	result = list()
	in_text = seed_text
	# generate a fixed number of words
	for _ in range(n_words):
		# encode the text as integers
		encoded = tokenizer.texts_to_sequences([in_text])[0]
		# pad / truncate from the front so only the most recent seq_length tokens remain
		encoded = pad_sequences([encoded], maxlen=seq_length, truncating='pre')
		# predict the index of the most likely next word
		if predict_classes is not None:
			yhat = predict_classes(encoded, verbose=0)
		else:
			yhat = model.predict(encoded, verbose=0).argmax(axis=-1)
		# a single row was submitted, so the first entry is the predicted index
		out_word = index_to_word.get(int(yhat[0]), '')
		# append to input so the next step sees the newly generated word
		in_text += ' ' + out_word
		result.append(out_word)
	return ' '.join(result)

### Run model

Load text sequences

In [0]:
# read the sequence file and break it into one entry per line
in_filename = '/content/kvv.txt'
doc = load_doc(in_filename)
lines = doc.split('\n')
# model input length is one less than the word count of the first line
# (presumably the last word of each line is the prediction target - confirm against training)
first_line_words = lines[0].split()
seq_length = len(first_line_words) - 1

Load Model

In [0]:
# load the saved Keras model from disk
model_path = '/content/model.h5'
model = load_model(model_path)

Load Tokenizer

In [0]:
# NOTE: unpickling can execute arbitrary code - only load a tokenizer.pkl from a trusted source
# the context manager closes the file handle once the tokenizer has been read
with open('tokenizer.pkl', 'rb') as tokenizer_file:
	tokenizer = load(tokenizer_file)

Select a seed text

In [0]:
# randint() includes both endpoints, so the upper bound must be the last valid index;
# using len(lines) itself could pick an index one past the end and raise IndexError
seed_text = lines[randint(0, len(lines) - 1)]
print(seed_text + '\n')

Generate new text

In [0]:
# continue the seed text with 50 newly generated words and show them
generated = generate_seq(
	model,
	tokenizer,
	seq_length,
	seed_text,
	n_words=50,
)
print(generated)