In [1]:
import tensorflow as tf
from tensorflow import keras
from keras.layers import TextVectorization, Embedding, SimpleRNN, Dense
from keras import Sequential
import numpy as np

# Using RNN

In [2]:
# Toy training corpus for the next-word demo.
# NOTE(review): there is no space after "RNNs." or after "example,", so splitting on
# whitespace keeps "RNNs.In" and "example,we'll" as single tokens (22 tokens in total,
# which matches the shape of the tokenized output further down). Confirm this is intended.
text="This is a sample text used to demonstrate predictive text with basic RNNs.In this example,we'll predict the next word as you type "

In [3]:
# Learn the vocabulary from the individual whitespace-separated words of the corpus.
tokenizer = TextVectorization()
tokenizer.adapt(data=text.split())

In [4]:
# Encode the whole corpus as a 1-D tensor of integer token ids (one id per word),
# then display it as the cell output.
text_sequences = tokenizer(text)
text_sequences

<tf.Tensor: shape=(22,), dtype=int64, numpy=
array([ 2, 16, 21, 11,  3,  7,  9, 18, 13,  3,  6, 19, 12,  2, 17, 14, 10,
       15,  5, 20,  4,  8], dtype=int64)>

In [5]:
# Shift-by-one pairing: x holds every token id but the last, y every token id but the
# first, so y[i] is the id of the word that follows x[i].
x, y = text_sequences[:-1], text_sequences[1:]

`text_sequences[:-1]` slices the 1-D tensor of token ids to create `x`. It *takes all elements from the beginning of the tensor up to and including the second-to-last element*. This means `x` contains every token except the last one, so each entry of `x` serves as an input (current) word.

`text_sequences[1:]` slices the same tensor of token ids to create `y`. It *takes all elements starting from the second element to the end of the tensor*. This means `y` contains every token except the first one, so `y[i]` is the word that follows `x[i]` — the target the model learns to predict.

In [6]:
# Next-word model: token id -> 64-d embedding -> SimpleRNN (128 units, output kept for
# every time step) -> softmax distribution over the vocabulary.
model = Sequential()
model.add(Embedding(input_dim=len(tokenizer.get_vocabulary()), output_dim=64, input_length=1))
model.add(SimpleRNN(128, return_sequences=True))
model.add(Dense(len(tokenizer.get_vocabulary()), activation='softmax'))

In [7]:
# Targets are integer token ids, hence the sparse variant of categorical cross-entropy.
model.compile(
    optimizer='adam',
    loss='sparse_categorical_crossentropy',
)

In [8]:
# Train on the (current token, next token) pairs for 50 passes over the data.
model.fit(x=x, y=y, epochs=50)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


<keras.src.callbacks.History at 0x1132425f5e0>

In [9]:
def generate_next_word(seed_text, predictor=None, vectorizer=None):
    """Predict the word most likely to follow ``seed_text``.

    The seed is tokenized, every token is run through the model, and the
    probability distribution produced for the *last* token is used to pick
    the next word.

    Args:
        seed_text: Text to continue; must contain at least one word.
        predictor: Object exposing ``predict(token_ids)`` that returns an array
            whose last axis is the vocabulary. Defaults to the notebook-level
            ``model``.
        vectorizer: Callable mapping text to a 1-D sequence of token ids and
            exposing ``get_vocabulary()``. Defaults to the notebook-level
            ``tokenizer``.

    Returns:
        The vocabulary entry with the highest predicted probability.

    Raises:
        ValueError: If ``seed_text`` produces no tokens.
    """
    # Fall back to the notebook globals only when no explicit objects are given.
    predictor = model if predictor is None else predictor
    vectorizer = tokenizer if vectorizer is None else vectorizer

    seed_sequence = vectorizer(seed_text)
    if np.asarray(seed_sequence).size == 0:
        raise ValueError("seed_text must contain at least one word")

    predicted_probabilities = np.asarray(predictor.predict(seed_sequence))

    # np.argmax without an axis works on the flattened array, so for a multi-word
    # seed it would return an index beyond the vocabulary. Collapse everything
    # except the vocabulary axis and keep only the row for the final token.
    vocab_size = predicted_probabilities.shape[-1]
    last_token_probabilities = predicted_probabilities.reshape(-1, vocab_size)[-1]

    predicted_index = int(np.argmax(last_token_probabilities))
    return vectorizer.get_vocabulary()[predicted_index]

In [10]:
# Ask the trained model which word it expects after a single seed word and print
# the seed together with the prediction.
input_text = "used"
predicted_word = generate_next_word(input_text)
print(f"Input: '{input_text}', Predicted: '{predicted_word}'")

Input: 'used', Predicted: 'to'


# Using LSTM

In [11]:
from keras.layers import LSTM

In [12]:
# Toy training corpus for the LSTM variant of the next-word demo.
# NOTE(review): there is no space after "LSTM." or after "example,", so splitting on
# whitespace keeps "LSTM.In" and "example,we'll" as single tokens (22 tokens in total,
# which matches the shape of the tokenized output further down). Confirm this is intended.
text="This is a sample text used to demonstrate predictive text with basic LSTM.In this example,we'll predict the next word as you type "

In [13]:
# Re-learn the vocabulary from the whitespace-separated words of the new corpus.
tokenizer = TextVectorization()
tokenizer.adapt(data=text.split())

In [14]:
# Encode the whole corpus as a 1-D tensor of integer token ids (one id per word),
# then display it as the cell output.
text_sequences = tokenizer(text)
text_sequences

<tf.Tensor: shape=(22,), dtype=int64, numpy=
array([ 2, 16, 21, 11,  3,  7,  9, 18, 12,  3,  6, 19, 15,  2, 17, 13, 10,
       14,  5, 20,  4,  8], dtype=int64)>

In [15]:
# Shift-by-one pairing: x holds every token id but the last, y every token id but the
# first, so y[i] is the id of the word that follows x[i].
x, y = text_sequences[:-1], text_sequences[1:]

`text_sequences[:-1]` slices the 1-D tensor of token ids to create `x`. It *takes all elements from the beginning of the tensor up to and including the second-to-last element*. This means `x` contains every token except the last one, so each entry of `x` serves as an input (current) word.

`text_sequences[1:]` slices the same tensor of token ids to create `y`. It *takes all elements starting from the second element to the end of the tensor*. This means `y` contains every token except the first one, so `y[i]` is the word that follows `x[i]` — the target the model learns to predict.

In [16]:
# Next-word model: token id -> 64-d embedding -> LSTM (128 units, output kept for
# every time step) -> softmax distribution over the vocabulary.
model = Sequential()
model.add(Embedding(input_dim=len(tokenizer.get_vocabulary()), output_dim=64, input_length=1))
model.add(LSTM(128, return_sequences=True))
model.add(Dense(len(tokenizer.get_vocabulary()), activation='softmax'))

In [17]:
# Targets are integer token ids, hence the sparse variant of categorical cross-entropy.
model.compile(
    optimizer='adam',
    loss='sparse_categorical_crossentropy',
)

In [18]:
# Train on the (current token, next token) pairs for 50 passes over the data.
model.fit(x=x, y=y, epochs=50)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


<keras.src.callbacks.History at 0x113266149d0>

In [19]:
def generate_next_word(seed_text, predictor=None, vectorizer=None):
    """Predict the word most likely to follow ``seed_text``.

    The seed is tokenized, every token is run through the model, and the
    probability distribution produced for the *last* token is used to pick
    the next word.

    Args:
        seed_text: Text to continue; must contain at least one word.
        predictor: Object exposing ``predict(token_ids)`` that returns an array
            whose last axis is the vocabulary. Defaults to the notebook-level
            ``model``.
        vectorizer: Callable mapping text to a 1-D sequence of token ids and
            exposing ``get_vocabulary()``. Defaults to the notebook-level
            ``tokenizer``.

    Returns:
        The vocabulary entry with the highest predicted probability.

    Raises:
        ValueError: If ``seed_text`` produces no tokens.
    """
    # Fall back to the notebook globals only when no explicit objects are given.
    predictor = model if predictor is None else predictor
    vectorizer = tokenizer if vectorizer is None else vectorizer

    seed_sequence = vectorizer(seed_text)
    if np.asarray(seed_sequence).size == 0:
        raise ValueError("seed_text must contain at least one word")

    predicted_probabilities = np.asarray(predictor.predict(seed_sequence))

    # np.argmax without an axis works on the flattened array, so for a multi-word
    # seed it would return an index beyond the vocabulary. Collapse everything
    # except the vocabulary axis and keep only the row for the final token.
    vocab_size = predicted_probabilities.shape[-1]
    last_token_probabilities = predicted_probabilities.reshape(-1, vocab_size)[-1]

    predicted_index = int(np.argmax(last_token_probabilities))
    return vectorizer.get_vocabulary()[predicted_index]

In [20]:
# Ask the trained model which word it expects after a single seed word and print
# the seed together with the prediction.
input_text = "this"
predicted_word = generate_next_word(input_text)
print(f"Input: '{input_text}', Predicted: '{predicted_word}'")

Input: 'this', Predicted: 'is'
